{"id":"https://openalex.org/W4414872683","doi":"https://doi.org/10.1145/3736251.3757100","title":"The Great Grade-Off: LLMs vs. Humans","display_name":"The Great Grade-Off: LLMs vs. Humans","publication_year":2025,"publication_date":"2025-10-06","ids":{"openalex":"https://openalex.org/W4414872683","doi":"https://doi.org/10.1145/3736251.3757100"},"language":"en","primary_location":{"id":"doi:10.1145/3736251.3757100","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3736251.3757100","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Global Computing Education Conference 2025 - Volume 2","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5094167225","display_name":"Samuel B. Mazzone","orcid":"https://orcid.org/0009-0008-6480-2973"},"institutions":[{"id":"https://openalex.org/I102461120","display_name":"Marquette University","ror":"https://ror.org/04gr4te78","country_code":"US","type":"education","lineage":["https://openalex.org/I102461120"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Samuel B. Mazzone","raw_affiliation_strings":["Marquette University, Milwaukee, WI, USA"],"raw_orcid":"https://orcid.org/0009-0008-6480-2973","affiliations":[{"raw_affiliation_string":"Marquette University, Milwaukee, WI, USA","institution_ids":["https://openalex.org/I102461120"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5094167225"],"corresponding_institution_ids":["https://openalex.org/I102461120"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.41176758,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"418","last_page":"418"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12755","display_name":"Legal Education and Practice Innovations","score":0.9298999905586243,"subfield":{"id":"https://openalex.org/subfields/3308","display_name":"Law"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12755","display_name":"Legal Education and Practice Innovations","score":0.9298999905586243,"subfield":{"id":"https://openalex.org/subfields/3308","display_name":"Law"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13075","display_name":"Legal Systems and Judicial Processes","score":0.920799970626831,"subfield":{"id":"https://openalex.org/subfields/3320","display_name":"Political Science and International Relations"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/grading","display_name":"Grading (engineering)","score":0.8230999708175659},{"id":"https://openalex.org/keywords/rubric","display_name":"Rubric","score":0.8194000124931335},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.4101000130176544},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.4090000092983246},{"id":"https://openalex.org/keywords/toolbox","display_name":"Toolbox","score":0.37599998712539673}],"concepts":[{"id":"https://openalex.org/C2777286243","wikidata":"https://www.wikidata.org/wiki/Q5591926","display_name":"Grading (engineering)","level":2,"score":0.8230999708175659},{"id":"https://openalex.org/C111640148","wikidata":"https://www.wikidata.org/wiki/Q847349","display_name":"Rubric","level":2,"score":0.8194000124931335},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5598999857902527},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4700999855995178},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.4101000130176544},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.4090000092983246},{"id":"https://openalex.org/C2777655017","wikidata":"https://www.wikidata.org/wiki/Q1501161","display_name":"Toolbox","level":2,"score":0.37599998712539673},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.3084000051021576},{"id":"https://openalex.org/C55587333","wikidata":"https://www.wikidata.org/wiki/Q1133029","display_name":"Engineering ethics","level":1,"score":0.3059999942779541},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.2782000005245209},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.2766000032424927},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.26489999890327454},{"id":"https://openalex.org/C47177190","wikidata":"https://www.wikidata.org/wiki/Q207137","display_name":"Curriculum","level":2,"score":0.2614000141620636}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3736251.3757100","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3736251.3757100","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Global Computing Education Conference 2025 - Volume 2","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Grading":[0],"computer":[1],"science":[2],"(CS)":[3],"assignments":[4],"poses":[5],"challenges":[6],"because":[7],"of":[8,13,29],"the":[9,26,124],"inefficiencies":[10],"and":[11,46,59,66,85,115,127,167,188,219,224,228,244],"inconsistencies":[12],"manual":[14],"grading.":[15],"Automated":[16],"Assessment":[17],"Tools":[18],"(AATs)":[19],"focus":[20],"on":[21,123],"strict":[22],"correctness,":[23],"often":[24],"overlooking":[25],"holistic":[27],"quality":[28],"student":[30],"submissions.":[31],"As":[32],"a":[33,52,200],"result,":[34],"instructors":[35,68],"must":[36],"spend":[37],"additional":[38],"effort":[39],"addressing":[40],"these":[41,98],"limitations.":[42],"Generative":[43],"AI":[44],"(GAI)":[45],"Large":[47],"Language":[48],"Models":[49],"(LLMs)":[50],"offer":[51],"promising":[53],"solution.":[54],"LLMs":[55,96,147],"can":[56],"generate":[57],"feedback":[58],"code":[60],"suggestions,":[61],"helping":[62],"students":[63],"understand":[64],"grades":[65],"aiding":[67],"by":[69,100,171],"identifying":[70],"common":[71,181],"challenges.":[72],"Despite":[73],"their":[74],"potential,":[75],"educators":[76],"face":[77],"difficulties":[78],"implementing":[79],"LLMs,":[80],"primarily":[81],"due":[82],"to":[83,141,157,194,217,239],"privacy":[84],"ethical":[86],"concerns":[87,99],"associated":[88],"with":[89,130,135],"cloud-based":[90],"GAI":[91,220],"solutions.":[92],"Open-source,":[93],"locally-hosted":[94],"(OSLH)":[95],"address":[97],"offering":[101],"private,":[102],"customizable":[103],"environments":[104],"without":[105],"external":[106],"services.":[107],"Recent":[108],"studies":[109],"demonstrate":[110],"improvements":[111],"in":[112,151],"grading":[113,175,226,230,241,248],"consistency":[114],"efficiency":[116],"within":[117],"education.":[118],"However,":[119],"results":[120],"vary":[121],"based":[122],"specific":[125,214],"LLM":[126],"rubric":[128],"used,":[129],"ongoing":[131],"questions":[132],"about":[133],"alignment":[134],"human":[136,149,165,218],"evaluations.":[137],"This":[138],"research":[139,237],"aims":[140,238],"systematically":[142],"evaluate":[143],"how":[144],"closely":[145,163],"OSLH":[146],"match":[148],"graders":[150],"assessing":[152],"CS1":[153,182],"assignments.":[154],"It":[155],"seeks":[156],"identify":[158],"contexts":[159],"where":[160],"automated":[161],"assessments":[162],"mimic":[164],"judgment":[166],"pinpoint":[168],"discrepancies":[169],"caused":[170],"model":[172],"limitations":[173],"or":[174],"complexity.":[176],"The":[177],"methodology":[178],"involves":[179],"categorizing":[180],"programming":[183],"errors,":[184],"establishing":[185,222],"standardized":[186],"penalties,":[187],"updating":[189],"TA-Bot,":[190],"an":[191],"existing":[192],"AAT,":[193],"collect":[195],"detailed":[196,202],"error":[197],"data":[198],"for":[199,232],"more":[201],"comparison":[203],"against":[204],"LLM-generated":[205],"scores.":[206],"Planned":[207],"contributions":[208],"include":[209],"creating":[210],"benchmark":[211],"datasets":[212],"linking":[213],"coding":[215],"errors":[216],"evaluations,":[221],"replicable":[223],"transparent":[225],"methodologies,":[227],"refining":[229],"tools":[231],"practical":[233],"adoption.":[234],"Ultimately,":[235],"this":[236],"enhance":[240],"consistency,":[242],"transparency,":[243],"fairness,":[245],"advancing":[246],"overall":[247],"practices.":[249]},"counts_by_year":[],"updated_date":"2026-02-07T06:11:34.122080","created_date":"2025-10-10T00:00:00"}
