{"id":"https://openalex.org/W4392858532","doi":"https://doi.org/10.1145/3626253.3635542","title":"Evaluating Large Language Model Code Generation as an Autograding Mechanism for \"Explain in Plain English\" Questions","display_name":"Evaluating Large Language Model Code Generation as an Autograding Mechanism for \"Explain in Plain English\" Questions","publication_year":2024,"publication_date":"2024-03-14","ids":{"openalex":"https://openalex.org/W4392858532","doi":"https://doi.org/10.1145/3626253.3635542"},"language":"en","primary_location":{"id":"doi:10.1145/3626253.3635542","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3626253.3635542","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 55th ACM Technical Symposium on Computer Science Education V. 2","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014942043","display_name":"David H. Smith","orcid":"https://orcid.org/0000-0002-6572-4347"},"institutions":[{"id":"https://openalex.org/I2801919071","display_name":"University of Illinois System","ror":"https://ror.org/05e94g991","country_code":"US","type":"education","lineage":["https://openalex.org/I2801919071"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"David H. Smith","raw_affiliation_strings":["University of Illinois, Urbana, IL, USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois, Urbana, IL, USA","institution_ids":["https://openalex.org/I2801919071"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066756473","display_name":"Craig Zilles","orcid":"https://orcid.org/0000-0003-4601-4398"},"institutions":[{"id":"https://openalex.org/I2801919071","display_name":"University of Illinois System","ror":"https://ror.org/05e94g991","country_code":"US","type":"education","lineage":["https://openalex.org/I2801919071"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Craig Zilles","raw_affiliation_strings":["University of Illinois, Urbana, IL, USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois, Urbana, IL, USA","institution_ids":["https://openalex.org/I2801919071"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5014942043"],"corresponding_institution_ids":["https://openalex.org/I2801919071"],"apc_list":null,"apc_paid":null,"fwci":0.8579,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.78682575,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1824","last_page":"1825"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10533","display_name":"Teaching and Learning Programming","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10533","display_name":"Teaching and Learning Programming","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/grading","display_name":"Grading (engineering)","score":0.8344342708587646},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7601454257965088},{"id":"https://openalex.org/keywords/unit-testing","display_name":"Unit testing","score":0.6353247165679932},{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.5453769564628601},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5249678492546082},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.515814483165741},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4637976288795471},{"id":"https://openalex.org/keywords/mathematics-education","display_name":"Mathematics education","score":0.37879589200019836},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.3488907814025879},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.18263399600982666},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.08764252066612244},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08454284071922302}],"concepts":[{"id":"https://openalex.org/C2777286243","wikidata":"https://www.wikidata.org/wiki/Q5591926","display_name":"Grading (engineering)","level":2,"score":0.8344342708587646},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7601454257965088},{"id":"https://openalex.org/C148027188","wikidata":"https://www.wikidata.org/wiki/Q907375","display_name":"Unit testing","level":3,"score":0.6353247165679932},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.5453769564628601},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5249678492546082},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.515814483165741},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4637976288795471},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.37879589200019836},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.3488907814025879},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.18263399600982666},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.08764252066612244},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08454284071922302},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C147176958","wikidata":"https://www.wikidata.org/wiki/Q77590","display_name":"Civil engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3626253.3635542","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3626253.3635542","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 55th ACM Technical Symposium on Computer Science Education V. 2","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5400000214576721,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":3,"referenced_works":["https://openalex.org/W2029974693","https://openalex.org/W3161516024","https://openalex.org/W3177928934"],"related_works":["https://openalex.org/W2615173508","https://openalex.org/W2064165679","https://openalex.org/W1588461101","https://openalex.org/W3208525924","https://openalex.org/W2591833644","https://openalex.org/W2885058781","https://openalex.org/W3127248583","https://openalex.org/W1552490082","https://openalex.org/W4236439135","https://openalex.org/W2189583758"],"abstract_inverted_index":{"The":[0,59],"ability":[1],"of":[2,12,61,68,94,124,137,156,183],"students":[3,19,34],"to":[4,24,35,83,121,167,170],"''Explain":[5],"in":[6,20],"Plain":[7],"English''":[8],"(EiPE)":[9],"the":[10,66,92,135,150,154,157,162],"purpose":[11],"code":[13,39,69,100,172],"is":[14,52],"a":[15,31,63,72,80,109,122],"critical":[16],"skill":[17,45],"for":[18,33,65,71,112],"introductory":[21],"programming":[22],"courses":[23],"develop.":[25],"EiPE":[26,85,106,113,125],"questions":[27],"serve":[28],"as":[29,49,108],"both":[30],"mechanism":[32,111],"develop":[36],"and":[37,55,141,153],"demonstrate":[38],"comprehension":[40],"skills.":[41],"However,":[42],"evaluating":[43],"this":[44,88,117,138],"has":[46],"been":[47],"challenging":[48],"manual":[50],"grading":[51,110,119,139],"time":[53],"consuming":[54],"not":[56],"easily":[57],"automated.":[58],"process":[60],"constructing":[62,84],"prompt":[64],"purposes":[67],"generation":[70,173],"Large":[73],"Language":[74],"Model,":[75],"such":[76],"OpenAI's":[77],"GPT-4,":[78],"bears":[79],"striking":[81],"resemblance":[82],"responses.":[86],"In":[87],"paper,":[89],"we":[90,145],"explore":[91],"potential":[93],"using":[95],"test":[96],"cases":[97],"run":[98,160],"on":[99,161,180],"generated":[101,163],"by":[102],"GPT-4":[103],"from":[104,128],"students'":[105],"responses":[107,126],"questions.":[114],"We":[115],"applied":[116],"proposed":[118],"method":[120,140],"corpus":[123],"collected":[127],"past":[129],"exams,":[130],"then":[131],"measured":[132],"agreement":[133,148],"between":[134,149],"results":[136,155],"human":[142,151,178],"graders.":[143],"Overall,":[144],"find":[146],"moderate":[147],"raters":[152],"unit":[158],"tests":[159],"code.":[164,184],"This":[165],"appears":[166],"be":[168],"attributable":[169],"GPT-4's":[171],"being":[174],"more":[175],"lenient":[176],"than":[177],"graders":[179],"low-level":[181],"descriptions":[182]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
