{"id":"https://openalex.org/W7125924572","doi":"https://doi.org/10.1109/ase63991.2025.00386","title":"StackPlagger: A System for Identifying AI-Code Plagiarism on Stack Overflow","display_name":"StackPlagger: A System for Identifying AI-Code Plagiarism on Stack Overflow","publication_year":2025,"publication_date":"2025-11-16","ids":{"openalex":"https://openalex.org/W7125924572","doi":"https://doi.org/10.1109/ase63991.2025.00386"},"language":null,"primary_location":{"id":"doi:10.1109/ase63991.2025.00386","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ase63991.2025.00386","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 40th IEEE/ACM International Conference on Automated Software Engineering (ASE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084068350","display_name":"Aman Swaraj","orcid":null},"institutions":[{"id":"https://openalex.org/I154851008","display_name":"Indian Institute of Technology Roorkee","ror":"https://ror.org/00582g326","country_code":"IN","type":"education","lineage":["https://openalex.org/I154851008"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Aman Swaraj","raw_affiliation_strings":["Indian Institute of Technology,Department of Computer Science and Engineering,Roorkee,India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology,Department of Computer Science and Engineering,Roorkee,India","institution_ids":["https://openalex.org/I154851008"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102501969","display_name":"Harsh Goyal","orcid":null},"institutions":[{"id":"https://openalex.org/I154851008","display_name":"Indian Institute of Technology Roorkee","ror":"https://ror.org/00582g326","country_code":"IN","type":"education","lineage":["https://openalex.org/I154851008"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Harsh Goyal","raw_affiliation_strings":["Indian Institute of Technology,Department of Computer Science and Engineering,Roorkee,India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology,Department of Computer Science and Engineering,Roorkee,India","institution_ids":["https://openalex.org/I154851008"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124108970","display_name":"Sumit Chadgal","orcid":null},"institutions":[{"id":"https://openalex.org/I154851008","display_name":"Indian Institute of Technology Roorkee","ror":"https://ror.org/00582g326","country_code":"IN","type":"education","lineage":["https://openalex.org/I154851008"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sumit Chadgal","raw_affiliation_strings":["Indian Institute of Technology,Department of Computer Science and Engineering,Roorkee,India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology,Department of Computer Science and Engineering,Roorkee,India","institution_ids":["https://openalex.org/I154851008"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100633096","display_name":"Sandeep Kumar","orcid":"https://orcid.org/0000-0003-0747-6776"},"institutions":[{"id":"https://openalex.org/I154851008","display_name":"Indian Institute of Technology Roorkee","ror":"https://ror.org/00582g326","country_code":"IN","type":"education","lineage":["https://openalex.org/I154851008"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sandeep Kumar","raw_affiliation_strings":["Indian Institute of Technology,Department of Computer Science and Engineering,Roorkee,India"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Technology,Department of Computer Science and Engineering,Roorkee,India","institution_ids":["https://openalex.org/I154851008"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5084068350"],"corresponding_institution_ids":["https://openalex.org/I154851008"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.81848839,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4106","last_page":"4109"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11492","display_name":"Academic integrity and plagiarism","score":0.5083000063896179,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11492","display_name":"Academic integrity and plagiarism","score":0.5083000063896179,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.08810000121593475,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.0812000036239624,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.675000011920929},{"id":"https://openalex.org/keywords/snippet","display_name":"Snippet","score":0.4424999952316284},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.42809998989105225},{"id":"https://openalex.org/keywords/plagiarism-detection","display_name":"Plagiarism detection","score":0.4268999993801117},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.41510000824928284},{"id":"https://openalex.org/keywords/extension","display_name":"Extension (predicate logic)","score":0.376800000667572},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.3718999922275543}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8209999799728394},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.675000011920929},{"id":"https://openalex.org/C2777822670","wikidata":"https://www.wikidata.org/wiki/Q1120538","display_name":"Snippet","level":2,"score":0.4424999952316284},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.42809998989105225},{"id":"https://openalex.org/C2780907237","wikidata":"https://www.wikidata.org/wiki/Q2986238","display_name":"Plagiarism detection","level":2,"score":0.4268999993801117},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.41510000824928284},{"id":"https://openalex.org/C2778029271","wikidata":"https://www.wikidata.org/wiki/Q5421931","display_name":"Extension (predicate logic)","level":2,"score":0.376800000667572},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.3718999922275543},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3544999957084656},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.352400004863739},{"id":"https://openalex.org/C35525427","wikidata":"https://www.wikidata.org/wiki/Q745881","display_name":"Intrusion detection system","level":2,"score":0.3483999967575073},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.3343999981880188},{"id":"https://openalex.org/C9395851","wikidata":"https://www.wikidata.org/wiki/Q177929","display_name":"Stack (abstract data type)","level":2,"score":0.33230000734329224},{"id":"https://openalex.org/C43364308","wikidata":"https://www.wikidata.org/wiki/Q8799","display_name":"Byte","level":2,"score":0.31869998574256897},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3165999948978424},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.30880001187324524},{"id":"https://openalex.org/C40305131","wikidata":"https://www.wikidata.org/wiki/Q2616305","display_name":"Obfuscation","level":2,"score":0.3043999969959259},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2919999957084656},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.2775000035762787},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.274399995803833},{"id":"https://openalex.org/C15569618","wikidata":"https://www.wikidata.org/wiki/Q3561421","display_name":"Liveness","level":2,"score":0.26600000262260437},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.26579999923706055}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ase63991.2025.00386","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ase63991.2025.00386","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 40th IEEE/ACM International Conference on Automated Software Engineering (ASE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.44966429471969604}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W3098605233","https://openalex.org/W4221166942","https://openalex.org/W4375949262","https://openalex.org/W4388954848","https://openalex.org/W4389519352","https://openalex.org/W4393157398","https://openalex.org/W4394859329","https://openalex.org/W4398766125","https://openalex.org/W4406867827","https://openalex.org/W4410552802"],"related_works":[],"abstract_inverted_index":{"Identifying":[0],"AI":[1,154],"code":[2,29,73,121,148],"plagiarism":[3],"on":[4,34,109],"technical":[5],"forums":[6],"like":[7],"Stack":[8],"Overflow":[9],"(SO)":[10],"is":[11],"critical,":[12],"as":[13,137],"it":[14],"can":[15,53,145,166],"directly":[16],"impact":[17],"the":[18,66,124,160],"platform\u2019s":[19],"trust":[20],"and":[21,40,50,81,152,159,171],"credibility.":[22],"While":[23,104],"previous":[24],"studies":[25],"have":[26,32,61],"explored":[27],"AI-generated":[28,147],"detection,":[30],"they":[31],"focused":[33],"long,":[35],"standalone":[36],"samples":[37],"from":[38],"repositories":[39],"competitions.":[41],"In":[42],"contrast,":[43],"SO":[44,150],"snippets":[45],"are":[46,75],"often":[47],"short,":[48],"fragmented,":[49],"context-specific,":[51],"which":[52,144],"make":[54],"detection":[55,129],"more":[56],"challenging.":[57],"Furthermore,":[58],"existing":[59],"methods":[60,106],"also":[62],"not":[63],"adequately":[64],"addressed":[65],"concern":[67],"of":[68,94,120,163],"obfuscated":[69],"or":[70],"adversarially":[71],"prompted":[72],"that":[74],"crafted":[76],"to":[77,127],"mimic":[78],"human":[79],"style":[80],"evade":[82],"detection.":[83],"To":[84],"address":[85],"these":[86],"gaps,":[87],"we":[88,112,132],"first":[89],"introduce":[90],"a":[91,138],"curated":[92],"dataset":[93],"8000":[95],"SO-ChatGPT":[96],"snippet":[97],"pairs":[98],"generated":[99],"using":[100],"multiple":[101],"adversarial":[102],"prompts.":[103],"earlier":[105],"solely":[107],"relied":[108],"pre-trained":[110,125],"models,":[111],"propose":[113],"an":[114],"ensemble":[115],"approach":[116],"combining":[117],"stylometric":[118],"features":[119],"along":[122],"with":[123],"embeddings":[126],"improve":[128],"performance.":[130],"Finally,":[131],"deploy":[133],"our":[134,164],"fine-tuned":[135],"model":[136],"Google":[139],"Chrome":[140],"extension":[141],"called":[142],"\u2018StackPlagger\u2019,":[143],"flag":[146],"in":[149],"answers":[151],"display":[153],"confidence":[155],"scores.":[156],"Video":[157],"demonstration":[158],"associated":[161],"artifacts":[162],"tool":[165],"be":[167],"found":[168],"at":[169],"https://youtu.be/6O9Urp2mvbI":[170],"https://github.com/harsh-g1/StackPlagger,":[172],"respectively.":[173]},"counts_by_year":[],"updated_date":"2026-02-23T20:09:44.859080","created_date":"2026-01-29T00:00:00"}
