{"id":"https://openalex.org/W7154683402","doi":"https://doi.org/10.48550/arxiv.2604.14188","title":"Grading the Unspoken: Evaluating Tacit Reasoning in Quantum Field Theory and String Theory with LLMs","display_name":"Grading the Unspoken: Evaluating Tacit Reasoning in Quantum Field Theory and String Theory with LLMs","publication_year":2026,"publication_date":"2026-04-01","ids":{"openalex":"https://openalex.org/W7154683402","doi":"https://doi.org/10.48550/arxiv.2604.14188"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.14188","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14188","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.14188","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133836484","display_name":"Xingyang Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yu, Xingyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133892398","display_name":"Yinghuan Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yinghuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133855219","display_name":"Yufei Zhang","orcid":"https://orcid.org/0009-0002-8623-8994"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yufei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5038674626","display_name":"Zijun Cui","orcid":"https://orcid.org/0000-0002-4362-197X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cui, Zijun","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5133836484"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.38519999384880066,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.38519999384880066,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.06449999660253525,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.05999999865889549,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.5245000123977661},{"id":"https://openalex.org/keywords/rubric","display_name":"Rubric","score":0.4950999915599823},{"id":"https://openalex.org/keywords/framing","display_name":"Framing (construction)","score":0.41940000653266907},{"id":"https://openalex.org/keywords/quantum-field-theory","display_name":"Quantum field theory","score":0.38359999656677246},{"id":"https://openalex.org/keywords/grading","display_name":"Grading (engineering)","score":0.34709998965263367},{"id":"https://openalex.org/keywords/imperfect","display_name":"Imperfect","score":0.33160001039505005},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.3296000063419342},{"id":"https://openalex.org/keywords/quantum","display_name":"Quantum","score":0.3203999996185303}],"concepts":[{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.5245000123977661},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5058000087738037},{"id":"https://openalex.org/C111640148","wikidata":"https://www.wikidata.org/wiki/Q847349","display_name":"Rubric","level":2,"score":0.4950999915599823},{"id":"https://openalex.org/C169087156","wikidata":"https://www.wikidata.org/wiki/Q2131593","display_name":"Framing (construction)","level":2,"score":0.41940000653266907},{"id":"https://openalex.org/C115047598","wikidata":"https://www.wikidata.org/wiki/Q54505","display_name":"Quantum field theory","level":2,"score":0.38359999656677246},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35010001063346863},{"id":"https://openalex.org/C2777286243","wikidata":"https://www.wikidata.org/wiki/Q5591926","display_name":"Grading (engineering)","level":2,"score":0.34709998965263367},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.33970001339912415},{"id":"https://openalex.org/C2780310539","wikidata":"https://www.wikidata.org/wiki/Q12547192","display_name":"Imperfect","level":2,"score":0.33160001039505005},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.3305000066757202},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.33000001311302185},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.3296000063419342},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.3203999996185303},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.3172000050544739},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.3154999911785126},{"id":"https://openalex.org/C161301231","wikidata":"https://www.wikidata.org/wiki/Q3478658","display_name":"Knowledge representation and reasoning","level":2,"score":0.3122999966144562},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.2973000109195709},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.2964000105857849},{"id":"https://openalex.org/C43091099","wikidata":"https://www.wikidata.org/wiki/Q1067788","display_name":"Through-the-lens metering","level":3,"score":0.29499998688697815},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.2912999987602234},{"id":"https://openalex.org/C49987212","wikidata":"https://www.wikidata.org/wiki/Q33198","display_name":"String theory","level":2,"score":0.2856000065803528},{"id":"https://openalex.org/C33332235","wikidata":"https://www.wikidata.org/wiki/Q18362","display_name":"Theoretical physics","level":1,"score":0.27250000834465027},{"id":"https://openalex.org/C2777686260","wikidata":"https://www.wikidata.org/wiki/Q144037","display_name":"Calculus (dental)","level":2,"score":0.2660999894142151},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.26089999079704285}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.14188","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14188","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.14188","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14188","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.6243813037872314,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"models":[2,20,164],"have":[3],"demonstrated":[4],"impressive":[5],"performance":[6,120],"across":[7],"many":[8],"domains":[9,47],"of":[10,80,86,135,141,194],"mathematics":[11],"and":[12,34,51,90,93,111],"physics.":[13],"One":[14],"natural":[15],"question":[16],"is":[17,48],"whether":[18,60,68],"such":[19,29],"can":[21],"support":[22],"research":[23],"in":[24,45,161],"highly":[25,181],"abstract":[26,182],"theoretical":[27,183],"fields":[28],"as":[30],"quantum":[31,87],"field":[32,88],"theory":[33,89],"string":[35,91],"theory.":[36],"Evaluating":[37,113],"this":[38],"possibility":[39],"faces":[40],"an":[41,159],"immediate":[42],"challenge:":[43],"correctness":[44],"these":[46],"layered,":[49],"tacit,":[50],"fundamentally":[52],"non-binary.":[53],"Standard":[54],"answer-matching":[55],"metrics":[56],"fail":[57,166],"to":[58,167,174],"capture":[59],"intermediate":[61,155],"conceptual":[62,126,171],"steps":[63,138],"are":[64,72,149],"properly":[65],"reconstructed":[66],"or":[67,139],"implicit":[69,176],"structural":[70],"constraints":[71],"respected.":[73],"We":[74,178],"construct":[75],"a":[76,95,186],"compact":[77],"expert-curated":[78],"dataset":[79],"twelve":[81],"questions":[82],"spanning":[83],"core":[84],"areas":[85],"theory,":[92],"introduce":[94],"five-level":[96],"grading":[97],"rubric":[98],"separating":[99],"statement":[100],"correctness,":[101],"key":[102],"concept":[103],"awareness,":[104],"reasoning":[105,137],"chain":[106],"presence,":[107],"tacit":[108],"step":[109],"reconstruction,":[110],"enrichment.":[112],"multiple":[114],"contemporary":[115],"LLMs,":[116],"we":[117],"observe":[118],"near-ceiling":[119],"on":[121,190],"explicit":[122],"derivations":[123],"within":[124],"stable":[125],"frames,":[127],"but":[128,157],"systematic":[129],"degradation":[130],"when":[131],"tasks":[132],"require":[133],"reconstruction":[134],"omitted":[136],"reorganization":[140],"representations":[142],"under":[143],"global":[144],"consistency":[145],"constraints.":[146],"These":[147],"failures":[148],"driven":[150],"not":[151],"only":[152],"by":[153,158],"missing":[154],"steps,":[156],"instability":[160],"representation":[162],"selection:":[163],"often":[165],"identify":[168],"the":[169,191],"correct":[170],"framing":[172],"required":[173],"resolve":[175],"tensions.":[177],"argue":[179],"that":[180],"physics":[184],"provides":[185],"uniquely":[187],"sensitive":[188],"lens":[189],"epistemic":[192],"limits":[193],"current":[195],"evaluation":[196],"paradigms.":[197]},"counts_by_year":[],"updated_date":"2026-04-18T06:05:20.339008","created_date":"2026-04-18T00:00:00"}
