{"id":"https://openalex.org/W7162813444","doi":"https://doi.org/10.48550/arxiv.2605.29791","title":"ActTraitBench: Quantifying the Knowledge-Decision Gap in Large Language Models via Human-Grounded Behavioral Validation","display_name":"ActTraitBench: Quantifying the Knowledge-Decision Gap in Large Language Models via Human-Grounded Behavioral Validation","publication_year":2026,"publication_date":"2026-05-28","ids":{"openalex":"https://openalex.org/W7162813444","doi":"https://doi.org/10.48550/arxiv.2605.29791"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.29791","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.29791","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.29791","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137372940","display_name":"Yutong Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Yutong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123167369","display_name":"Chenxi Miao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Miao, Chenxi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137319728","display_name":"Weikang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Weikang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137349762","display_name":"Yunfang Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Yunfang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.18230000138282776,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.18230000138282776,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.17260000109672546,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.11840000003576279,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.6269999742507935},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.5691999793052673},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5379999876022339},{"id":"https://openalex.org/keywords/divergence","display_name":"Divergence (linguistics)","score":0.48739999532699585},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.46389999985694885},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.44020000100135803},{"id":"https://openalex.org/keywords/cognition","display_name":"Cognition","score":0.40639999508857727},{"id":"https://openalex.org/keywords/quantile","display_name":"Quantile","score":0.39879998564720154},{"id":"https://openalex.org/keywords/behavioral-modeling","display_name":"Behavioral modeling","score":0.3806999921798706},{"id":"https://openalex.org/keywords/computational-model","display_name":"Computational model","score":0.37770000100135803}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6273000240325928},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.6269999742507935},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.5691999793052673},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5379999876022339},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5350000262260437},{"id":"https://openalex.org/C207390915","wikidata":"https://www.wikidata.org/wiki/Q1230525","display_name":"Divergence (linguistics)","level":2,"score":0.48739999532699585},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.47769999504089355},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4693000018596649},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.46389999985694885},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.44020000100135803},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.40639999508857727},{"id":"https://openalex.org/C118671147","wikidata":"https://www.wikidata.org/wiki/Q578714","display_name":"Quantile","level":2,"score":0.39879998564720154},{"id":"https://openalex.org/C78639753","wikidata":"https://www.wikidata.org/wiki/Q3318160","display_name":"Behavioral modeling","level":2,"score":0.3806999921798706},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.37770000100135803},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.37529999017715454},{"id":"https://openalex.org/C187288502","wikidata":"https://www.wikidata.org/wiki/Q641118","display_name":"Personality","level":2,"score":0.36000001430511475},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.3546999990940094},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.35019999742507935},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.34279999136924744},{"id":"https://openalex.org/C49453240","wikidata":"https://www.wikidata.org/wiki/Q1592163","display_name":"Construct validity","level":3,"score":0.3393000066280365},{"id":"https://openalex.org/C206654554","wikidata":"https://www.wikidata.org/wiki/Q5374247","display_name":"Empirical measure","level":2,"score":0.3091000020503998},{"id":"https://openalex.org/C166052673","wikidata":"https://www.wikidata.org/wiki/Q83021","display_name":"Empirical evidence","level":2,"score":0.30660000443458557},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.30250000953674316},{"id":"https://openalex.org/C109574028","wikidata":"https://www.wikidata.org/wiki/Q647525","display_name":"Behavioral economics","level":2,"score":0.2992999851703644},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.2906000018119812},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.2892000079154968},{"id":"https://openalex.org/C40722632","wikidata":"https://www.wikidata.org/wiki/Q5160137","display_name":"Confirmatory factor analysis","level":3,"score":0.27649998664855957},{"id":"https://openalex.org/C171606756","wikidata":"https://www.wikidata.org/wiki/Q506132","display_name":"Psychometrics","level":2,"score":0.27459999918937683},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2721000015735626},{"id":"https://openalex.org/C3019813237","wikidata":"https://www.wikidata.org/wiki/Q65089264","display_name":"Model validation","level":2,"score":0.27000001072883606},{"id":"https://openalex.org/C19875794","wikidata":"https://www.wikidata.org/wiki/Q1207340","display_name":"Item response theory","level":3,"score":0.26499998569488525},{"id":"https://openalex.org/C2780665704","wikidata":"https://www.wikidata.org/wiki/Q959298","display_name":"Intervention (counseling)","level":2,"score":0.2648000121116638},{"id":"https://openalex.org/C2865642","wikidata":"https://www.wikidata.org/wiki/Q378132","display_name":"Big Five personality traits","level":3,"score":0.26339998841285706},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.2619999945163727},{"id":"https://openalex.org/C5570062","wikidata":"https://www.wikidata.org/wiki/Q3919817","display_name":"Behavioural sciences","level":2,"score":0.25049999356269836}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.29791","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.29791","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.29791","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.29791","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7763908505439758,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"While":[0],"Large":[1],"Language":[2],"Models":[3],"(LLMs)":[4],"can":[5],"convincingly":[6],"simulate":[7],"personas":[8],"in":[9,15,42,60,63,139,148],"explicit":[10],"self-reports,":[11],"they":[12],"often":[13,110],"deviate":[14],"implicit":[16],"behavioral":[17,75,113],"decisions,":[18],"revealing":[19],"a":[20,52,79,100,132],"substantial":[21],"Knowledge-Decision":[22],"Gap":[23],"($G_{\\text{KD}}$).":[24],"Existing":[25],"benchmarks":[26],"struggle":[27],"to":[28,33,86],"measure":[29],"this":[30,121],"asymmetry":[31],"due":[32],"limited":[34],"construct":[35],"validity,":[36],"multi-dimensional":[37],"entanglement,":[38],"and":[39,74,77,106],"distributional":[40],"biases":[41],"LLM-based":[43],"evaluation.":[44],"To":[45,119],"address":[46],"these":[47],"issues,":[48],"we":[49,123],"propose":[50],"ActTraitBench,":[51],"human-grounded":[53],"evaluation":[54],"framework":[55],"for":[56],"measuring":[57],"personality":[58],"consistency":[59],"LLMs.":[61],"Grounded":[62],"empirical":[64],"human":[65,92],"data,":[66],"ActTraitBench":[67],"establishes":[68],"one-to-one":[69],"mappings":[70],"between":[71],"psychometric":[72],"facets":[73],"paradigms,":[76],"applies":[78],"Distributional":[80],"Calibration":[81],"via":[82],"Quantile":[83],"Mapping":[84],"procedure":[85],"align":[87],"LLM-judge":[88],"score":[89],"distributions":[90],"with":[91],"norms.":[93],"Experiments":[94],"on":[95],"14":[96],"mainstream":[97],"LLMs":[98],"reveal":[99],"pervasive":[101],"knowledge-decision":[102],"asymmetry,":[103],"where":[104],"larger":[105],"more":[107],"capable":[108],"models":[109,142],"exhibit":[111],"stronger":[112],"divergence":[114],"despite":[115],"highly":[116],"consistent":[117],"self-reports.":[118],"mitigate":[120],"gap,":[122],"further":[124],"introduce":[125],"the":[126],"Chain":[127],"of":[128],"Cognitive":[129],"Alignment":[130],"(CoCA),":[131],"plug-and-play":[133],"inference-time":[134],"intervention":[135],"that":[136],"improves":[137],"alignment":[138],"reasoning-capable":[140],"frontier":[141],"while":[143],"exposing":[144],"clear":[145],"capability":[146],"limitations":[147],"smaller":[149],"architectures.":[150]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-30T00:00:00"}
