{"id":"https://openalex.org/W7128633186","doi":"https://doi.org/10.48550/arxiv.2602.09832","title":"LLM Reasoning Predicts When Models Are Right: Evidence from Coding Classroom Discourse","display_name":"LLM Reasoning Predicts When Models Are Right: Evidence from Coding Classroom Discourse","publication_year":2026,"publication_date":"2026-02-10","ids":{"openalex":"https://openalex.org/W7128633186","doi":"https://doi.org/10.48550/arxiv.2602.09832"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.09832","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Ahtisham, Bakhtawar","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ahtisham, Bakhtawar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090326226","display_name":"Kirk Vanacore","orcid":"https://orcid.org/0000-0003-0673-5721"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vanacore, Kirk","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123508488","display_name":"Zhuqian Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Zhuqian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123499744","display_name":"Jinsook Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Jinsook","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5124971116","display_name":"Ren\u00e9 F. Kizilcec","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kizilcec, Rene F.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.29120001196861267,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.29120001196861267,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.1316000074148178,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.07400000095367432,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.701200008392334},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.6148999929428101},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5002999901771545},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4334999918937683},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.4323999881744385},{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.4320000112056732},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.42980000376701355},{"id":"https://openalex.org/keywords/mean-length-of-utterance","display_name":"Mean length of utterance","score":0.3939000070095062},{"id":"https://openalex.org/keywords/metacognition","display_name":"Metacognition","score":0.3763999938964844},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.37380000948905945}],"concepts":[{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.701200008392334},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6535999774932861},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.6148999929428101},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5199999809265137},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5002999901771545},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4334999918937683},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.4323999881744385},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.4320000112056732},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.42980000376701355},{"id":"https://openalex.org/C95975521","wikidata":"https://www.wikidata.org/wiki/Q6803628","display_name":"Mean length of utterance","level":3,"score":0.3939000070095062},{"id":"https://openalex.org/C118147538","wikidata":"https://www.wikidata.org/wiki/Q1126970","display_name":"Metacognition","level":3,"score":0.3763999938964844},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.37380000948905945},{"id":"https://openalex.org/C36964233","wikidata":"https://www.wikidata.org/wiki/Q7920942","display_name":"Verbal reasoning","level":3,"score":0.33889999985694885},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.33640000224113464},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.32839998602867126},{"id":"https://openalex.org/C134141054","wikidata":"https://www.wikidata.org/wiki/Q965415","display_name":"Performative utterance","level":2,"score":0.32600000500679016},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.32249999046325684},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.3206999897956848},{"id":"https://openalex.org/C11693617","wikidata":"https://www.wikidata.org/wiki/Q181839","display_name":"Pragmatics","level":2,"score":0.3174999952316284},{"id":"https://openalex.org/C169258074","wikidata":"https://www.wikidata.org/wiki/Q245748","display_name":"Random forest","level":2,"score":0.31709998846054077},{"id":"https://openalex.org/C121934690","wikidata":"https://www.wikidata.org/wiki/Q1084","display_name":"Noun","level":2,"score":0.3082999885082245},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.30660000443458557},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.3052999973297119},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.295199990272522},{"id":"https://openalex.org/C194926167","wikidata":"https://www.wikidata.org/wiki/Q6554066","display_name":"Linguistic sequence complexity","level":2,"score":0.28619998693466187},{"id":"https://openalex.org/C43971567","wikidata":"https://www.wikidata.org/wiki/Q3142865","display_name":"Logical reasoning","level":2,"score":0.2851000130176544},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.28349998593330383},{"id":"https://openalex.org/C84389358","wikidata":"https://www.wikidata.org/wiki/Q1129466","display_name":"Discourse analysis","level":2,"score":0.28029999136924744},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.27559998631477356},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2750999927520752},{"id":"https://openalex.org/C2777096784","wikidata":"https://www.wikidata.org/wiki/Q3826351","display_name":"Referent","level":2,"score":0.2745000123977661},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.2736999988555908},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.2728999853134155},{"id":"https://openalex.org/C2779267917","wikidata":"https://www.wikidata.org/wiki/Q170028","display_name":"Deception","level":2,"score":0.27250000834465027},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.26589998602867126},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.2623000144958496}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.09832","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.09832","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.09832","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.09832","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8660006523132324,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"are":[4,26],"increasingly":[5],"deployed":[6],"to":[7,22,38,187,230],"automatically":[8],"label":[9,84],"and":[10,66,101,124,154,169,195,210,227],"analyze":[11,48],"educational":[12,235],"dialogue":[13,236],"at":[14],"scale,":[15],"yet":[16],"current":[17],"pipelines":[18],"lack":[19],"reliable":[20],"ways":[21],"detect":[23],"when":[24],"models":[25],"wrong.":[27],"We":[28,47,91],"investigate":[29],"whether":[30,80],"reasoning":[31,94,182,212],"generated":[32],"by":[33,57],"LLMs":[34,60],"can":[35],"be":[36],"used":[37],"predict":[39],"the":[40,76,151],"correctness":[41],"of":[42,114,164],"a":[43,81,86,225],"model's":[44,82],"own":[45],"predictions.":[46],"30,300":[49],"teacher":[50],"utterances":[51],"from":[52,146,207],"classroom":[53],"dialogue,":[54],"each":[55],"labeled":[56],"multiple":[58],"state-of-the-art":[59],"with":[61],"an":[62,67,111],"instructional":[63,132],"move":[64,133],"construct":[65],"accompanying":[68],"reasoning.":[69],"Using":[70,150],"human-verified":[71],"ground-truth":[72],"labels,":[73],"we":[74,159],"frame":[75],"task":[77],"as":[78],"predicting":[79],"assigned":[83],"for":[85,130],"given":[87],"utterance":[88],"is":[89,183,213],"correct.":[90],"encode":[92],"LLM":[93],"using":[95],"Term":[96],"Frequency-Inverse":[97],"Document":[98],"Frequency":[99],"(TF-IDF)":[100],"evaluate":[102],"five":[103],"supervised":[104],"classifiers.":[105],"A":[106],"Random":[107],"Forest":[108],"classifier":[109],"achieves":[110],"F1":[112],"score":[113],"0.83":[115],"(Recall":[116],"=":[117],"0.854),":[118],"successfully":[119],"identifying":[120],"most":[121],"incorrect":[122,181,208],"predictions":[123,172],"outperforming":[125],"baselines.":[126],"Training":[127],"specialist":[128],"detectors":[129],"specific":[131],"constructs":[134],"further":[135],"improves":[136],"performance":[137],"on":[138,189],"difficult":[139],"constructs,":[140],"indicating":[141],"that":[142,220],"error":[143,222],"detection":[144,223],"benefits":[145],"construct-specific":[147],"linguistic":[148,162],"cues.":[149],"Linguistic":[152],"Inquiry":[153],"Word":[155],"Count":[156],"(LIWC)":[157],"framework,":[158],"examine":[160],"four":[161],"markers":[163],"correctness:":[165],"Causation,":[166],"Differentiation,":[167],"Tentativeness,":[168],"Insight.":[170],"Correct":[171],"exhibit":[173],"grounded":[174],"causal":[175],"language":[176],"(e.g.,":[177,192,198],"because,":[178],"therefore),":[179],"while":[180],"substantially":[184],"more":[185,215],"likely":[186],"rely":[188],"epistemic":[190],"hedging":[191],"might,":[193],"could)":[194],"performative":[196],"metacognition":[197],"think,":[199],"realize).":[200],"Syntactic":[201],"complexity":[202],"does":[203],"not":[204,214],"distinguish":[205],"correct":[206],"reasoning,":[209],"longer":[211],"reliable.":[216],"These":[217],"findings":[218],"demonstrate":[219],"reasoning-based":[221],"offers":[224],"practical":[226],"scalable":[228],"approach":[229],"quality":[231],"control":[232],"in":[233],"automated":[234],"analysis.":[237]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-12T00:00:00"}
