{"id":"https://openalex.org/W4392542342","doi":"https://doi.org/10.1145/3626252.3630826","title":"Detecting ChatGPT-Generated Code Submissions in a CS1 Course Using Machine Learning Models","display_name":"Detecting ChatGPT-Generated Code Submissions in a CS1 Course Using Machine Learning Models","publication_year":2024,"publication_date":"2024-03-07","ids":{"openalex":"https://openalex.org/W4392542342","doi":"https://doi.org/10.1145/3626252.3630826"},"language":"en","primary_location":{"id":"doi:10.1145/3626252.3630826","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3626252.3630826","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 55th ACM Technical Symposium on Computer Science Education V. 1","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027964018","display_name":"Muntasir Hoq","orcid":"https://orcid.org/0000-0003-2591-0476"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Muntasir Hoq","raw_affiliation_strings":["North Carolina State University, Raleigh, NC, USA"],"raw_orcid":"https://orcid.org/0000-0003-2591-0476","affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069526885","display_name":"Yang Shi","orcid":"https://orcid.org/0000-0001-6486-4340"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yang Shi","raw_affiliation_strings":["North Carolina State University, Raleigh, NC, USA"],"raw_orcid":"https://orcid.org/0000-0001-6486-4340","affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041367899","display_name":"Juho Leinonen","orcid":"https://orcid.org/0000-0001-6829-9449"},"institutions":[{"id":"https://openalex.org/I154130895","display_name":"University of Auckland","ror":"https://ror.org/03b94tp07","country_code":"NZ","type":"education","lineage":["https://openalex.org/I154130895"]}],"countries":["NZ"],"is_corresponding":false,"raw_author_name":"Juho Leinonen","raw_affiliation_strings":["The University of Auckland, Auckland, New Zealand"],"raw_orcid":"https://orcid.org/0000-0001-6829-9449","affiliations":[{"raw_affiliation_string":"The University of Auckland, Auckland, New Zealand","institution_ids":["https://openalex.org/I154130895"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075625073","display_name":"Damilola Babalola","orcid":"https://orcid.org/0009-0007-4160-9030"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Damilola Babalola","raw_affiliation_strings":["North Carolina State University, Raleigh, NC, USA"],"raw_orcid":"https://orcid.org/0009-0007-4160-9030","affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015273609","display_name":"Collin Lynch","orcid":"https://orcid.org/0000-0001-6958-9368"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Collin Lynch","raw_affiliation_strings":["North Carolina State University, Raleigh, NC, USA"],"raw_orcid":"https://orcid.org/0000-0001-6958-9368","affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064676990","display_name":"Thomas Price","orcid":"https://orcid.org/0000-0001-9375-2292"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Thomas Price","raw_affiliation_strings":["North Carolina State University, Raleigh, NC, USA"],"raw_orcid":"https://orcid.org/0000-0001-9375-2292","affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000710051","display_name":"Bita Akram","orcid":"https://orcid.org/0000-0001-5195-5841"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bita Akram","raw_affiliation_strings":["North Carolina State University, Raleigh, NC, USA"],"raw_orcid":"https://orcid.org/0000-0001-5195-5841","affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, NC, USA","institution_ids":["https://openalex.org/I137902535"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5027964018"],"corresponding_institution_ids":["https://openalex.org/I137902535"],"apc_list":null,"apc_paid":null,"fwci":34.3161,"has_fulltext":false,"cited_by_count":46,"citation_normalized_percentile":{"value":0.99759675,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"526","last_page":"532"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9890000224113464,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9890000224113464,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.9801999926567078,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11492","display_name":"Academic integrity and plagiarism","score":0.9767000079154968,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8238610029220581},{"id":"https://openalex.org/keywords/cheating","display_name":"Cheating","score":0.6519058346748352},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6182149052619934},{"id":"https://openalex.org/keywords/programmer","display_name":"Programmer","score":0.6055651307106018},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5476155281066895},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5467761754989624},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5159321427345276},{"id":"https://openalex.org/keywords/affordance","display_name":"Affordance","score":0.4679381251335144},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.45736393332481384},{"id":"https://openalex.org/keywords/debugging","display_name":"Debugging","score":0.42078739404678345},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4165847897529602},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.2641182541847229},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.15897297859191895}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8238610029220581},{"id":"https://openalex.org/C2778024590","wikidata":"https://www.wikidata.org/wiki/Q2357432","display_name":"Cheating","level":2,"score":0.6519058346748352},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6182149052619934},{"id":"https://openalex.org/C2778514511","wikidata":"https://www.wikidata.org/wiki/Q1374194","display_name":"Programmer","level":2,"score":0.6055651307106018},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5476155281066895},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5467761754989624},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5159321427345276},{"id":"https://openalex.org/C194995250","wikidata":"https://www.wikidata.org/wiki/Q531136","display_name":"Affordance","level":2,"score":0.4679381251335144},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.45736393332481384},{"id":"https://openalex.org/C168065819","wikidata":"https://www.wikidata.org/wiki/Q845566","display_name":"Debugging","level":2,"score":0.42078739404678345},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4165847897529602},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2641182541847229},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.15897297859191895},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3626252.3630826","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3626252.3630826","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 55th ACM Technical Symposium on Computer Science Education V. 1","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8700000047683716,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W1969795835","https://openalex.org/W1972905078","https://openalex.org/W1975294938","https://openalex.org/W2001319819","https://openalex.org/W2056655097","https://openalex.org/W2067303125","https://openalex.org/W2072470757","https://openalex.org/W2100649993","https://openalex.org/W2111227071","https://openalex.org/W2115269749","https://openalex.org/W2548736017","https://openalex.org/W2563587725","https://openalex.org/W2728842346","https://openalex.org/W2795143051","https://openalex.org/W2808967136","https://openalex.org/W2945309808","https://openalex.org/W2955426500","https://openalex.org/W2996517729","https://openalex.org/W3014339000","https://openalex.org/W3043078865","https://openalex.org/W3043305339","https://openalex.org/W3096674504","https://openalex.org/W3135677775","https://openalex.org/W3136693267","https://openalex.org/W4211263275","https://openalex.org/W4213130063","https://openalex.org/W4213415725","https://openalex.org/W4213445264","https://openalex.org/W4226257674","https://openalex.org/W4283705032","https://openalex.org/W4292014584","https://openalex.org/W4302551304","https://openalex.org/W4323033692","https://openalex.org/W4323033785","https://openalex.org/W4323033814","https://openalex.org/W4323037544","https://openalex.org/W4380353816","https://openalex.org/W4382654294","https://openalex.org/W4387847256","https://openalex.org/W6681648988"],"related_works":["https://openalex.org/W2012288173","https://openalex.org/W1968538666","https://openalex.org/W2097662580","https://openalex.org/W3199302685","https://openalex.org/W2168928134","https://openalex.org/W2112040168","https://openalex.org/W4241972157","https://openalex.org/W2053897590","https://openalex.org/W4242556954","https://openalex.org/W3007026952"],"abstract_inverted_index":{"The":[0],"emergence":[1],"of":[2,15,18,81,96,116,165,228],"publicly":[3],"accessible":[4,177],"large":[5],"language":[6],"models":[7,85,121,129,146,151,167,189,231],"(LLMs)":[8],"such":[9,166],"as":[10],"ChatGPT":[11,58,104,132,193,212],"poses":[12],"unprecedented":[13],"risks":[14],"new":[16],"types":[17],"plagiarism":[19],"and":[20,45,62,102,111,122,147,171],"cheating":[21,204],"where":[22],"students":[23],"use":[24,200],"LLMs":[25],"to":[26,70,178,201,213],"solve":[27],"exercises":[28],"for":[29,86,99,107,232],"them.":[30],"Detecting":[31],"this":[32,75],"behavior":[33],"will":[34],"be":[35,48],"a":[36,215],"necessary":[37],"component":[38],"in":[39,130,154],"introductory":[40,234],"computer":[41,235],"science":[42,236],"(CS1)":[43],"courses,":[44],"educators":[46],"should":[47],"well-equipped":[49],"with":[50,158],"detection":[51,88],"tools":[52],"when":[53],"the":[54,79,87,108,114,163,183,219,225],"need":[55],"arises.":[56],"However,":[57],"generates":[59],"code":[60,106,133,136,157,194,220],"non-deterministically,":[61],"thus,":[63],"traditional":[64,118,143],"similarity":[65],"detectors":[66],"might":[67],"not":[68,175],"suffice":[69],"detect":[71,202],"AI-created":[72],"code.":[73],"In":[74],"work,":[76],"we":[77,180],"explore":[78,182,208],"affordances":[80],"Machine":[82],"Learning":[83],"(ML)":[84],"task.":[89],"We":[90,206,222],"used":[91],"an":[92],"openly":[93],"available":[94],"dataset":[95],"student":[97,135],"programs":[98],"CS1":[100],"assignments":[101],"had":[103],"generate":[105],"same":[109],"assignments,":[110],"then":[112],"evaluated":[113],"performance":[115],"both":[117,142],"machine":[119,144],"learning":[120,128,145,150,188],"Abstract":[123],"Syntax":[124],"Tree-based":[125],"(AST-based)":[126],"deep":[127,149,187],"detecting":[131],"from":[134],"submissions.":[137],"Our":[138],"results":[139],"suggest":[140],"that":[141,173,190],"AST-based":[148],"are":[152,174],"effective":[153],"identifying":[155],"ChatGPT-generated":[156],"accuracy":[159],"above":[160],"90%.":[161],"Since":[162],"deployment":[164],"requires":[168],"ML":[169],"knowledge":[170],"resources":[172],"always":[176],"instructors,":[179],"also":[181,207],"patterns":[184],"detected":[185],"by":[186],"indicate":[191],"possible":[192],"signatures,":[195],"which":[196],"instructors":[197],"could":[198],"possibly":[199],"LLM-based":[203],"manually.":[205],"whether":[209],"explicitly":[210],"asking":[211],"impersonate":[214],"novice":[216],"programmer":[217],"affects":[218],"produced.":[221],"further":[223],"discuss":[224],"potential":[226],"applications":[227],"our":[229],"proposed":[230],"enhancing":[233],"instruction.":[237]},"counts_by_year":[{"year":2026,"cited_by_count":7},{"year":2025,"cited_by_count":27},{"year":2024,"cited_by_count":12}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
