{"id":"https://openalex.org/W7152999892","doi":"https://doi.org/10.48550/arxiv.2604.08362","title":"Towards Real-world Human Behavior Simulation: Benchmarking Large Language Models on Long-horizon, Cross-scenario, Heterogeneous Behavior Traces","display_name":"Towards Real-world Human Behavior Simulation: Benchmarking Large Language Models on Long-horizon, Cross-scenario, Heterogeneous Behavior Traces","publication_year":2026,"publication_date":"2026-04-09","ids":{"openalex":"https://openalex.org/W7152999892","doi":"https://doi.org/10.48550/arxiv.2604.08362"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.08362","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.08362","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.08362","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133378936","display_name":"Jiawei Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Chen, Jiawei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100992281","display_name":"Ruoxi Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Ruoxi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133370396","display_name":"Boxi Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Boxi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133319877","display_name":"Ruotong Pan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Ruotong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133353994","display_name":"Yunfei Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yunfei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133383539","display_name":"Yifei Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Yifei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133386000","display_name":"Yong Du","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Yong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133342236","display_name":"Tingting Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Tingting","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133332896","display_name":"Yaojie Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Yaojie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133352371","display_name":"Yingfei Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Yingfei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133338633","display_name":"Xianpei Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Xianpei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133370612","display_name":"Le Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Le","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133375540","display_name":"Xiangyu Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Xiangyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133338551","display_name":"Hongyu Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Hongyu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":14,"corresponding_author_ids":["https://openalex.org/A5133378936"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.15860000252723694,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.15860000252723694,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.11190000176429749,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.10239999741315842,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7257999777793884},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6122999787330627},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.583899974822998},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5764999985694885},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.5742999911308289},{"id":"https://openalex.org/keywords/human-behavior","display_name":"Human behavior","score":0.4302000105381012},{"id":"https://openalex.org/keywords/persona","display_name":"Persona","score":0.4025000035762787},{"id":"https://openalex.org/keywords/human-language","display_name":"Human language","score":0.3847000002861023}],"concepts":[{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7257999777793884},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6488000154495239},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6122999787330627},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.583899974822998},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5764999985694885},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.5742999911308289},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4487000107765198},{"id":"https://openalex.org/C117035363","wikidata":"https://www.wikidata.org/wiki/Q3769299","display_name":"Human behavior","level":2,"score":0.4302000105381012},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4203999936580658},{"id":"https://openalex.org/C313442","wikidata":"https://www.wikidata.org/wiki/Q778556","display_name":"Persona","level":2,"score":0.4025000035762787},{"id":"https://openalex.org/C2993724205","wikidata":"https://www.wikidata.org/wiki/Q315","display_name":"Human language","level":2,"score":0.3847000002861023},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.37299999594688416},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.36640000343322754},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3391000032424927},{"id":"https://openalex.org/C206654554","wikidata":"https://www.wikidata.org/wiki/Q5374247","display_name":"Empirical measure","level":2,"score":0.33649998903274536},{"id":"https://openalex.org/C166052673","wikidata":"https://www.wikidata.org/wiki/Q83021","display_name":"Empirical evidence","level":2,"score":0.3068000078201294},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.29429998993873596},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2924000024795532},{"id":"https://openalex.org/C2984703881","wikidata":"https://www.wikidata.org/wiki/Q2313085","display_name":"Language evolution","level":2,"score":0.2906999886035919},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.2842999994754791},{"id":"https://openalex.org/C2984309518","wikidata":"https://www.wikidata.org/wiki/Q181784","display_name":"Human trafficking","level":2,"score":0.27129998803138733},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.26489999890327454},{"id":"https://openalex.org/C11671645","wikidata":"https://www.wikidata.org/wiki/Q5054567","display_name":"Causal model","level":2,"score":0.26429998874664307},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.26170000433921814},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.26080000400543213},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.251800000667572}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.08362","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.08362","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.08362","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.08362","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7809691429138184,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"emergence":[1],"of":[2,36,98,156],"Large":[3],"Language":[4],"Models":[5],"(LLMs)":[6],"has":[7],"illuminated":[8],"the":[9,33,47,154],"potential":[10],"for":[11,165],"a":[12,65,121,130,139,148],"general-purpose":[13],"user":[14,49],"simulator.":[15],"However,":[16],"existing":[17],"benchmarks":[18],"remain":[19],"constrained":[20],"to":[21,31,106,136],"isolated":[22,81],"scenarios,":[23],"narrow":[24],"action":[25],"spaces,":[26],"or":[27],"synthetic":[28],"data,":[29,56],"failing":[30],"capture":[32],"holistic":[34],"nature":[35],"authentic":[37,127],"human":[38],"behavior.":[39],"To":[40],"bridge":[41],"this":[42,70],"gap,":[43],"we":[44,72],"introduce":[45],"OmniBehavior,":[46],"first":[48,73],"simulation":[50,168],"benchmark":[51],"constructed":[52],"entirely":[53],"from":[54,84],"real-world":[55,88],"integrating":[57],"long-horizon,":[58],"cross-scenario,":[59],"and":[60,126,147,159],"heterogeneous":[61],"behavioral":[62],"patterns":[63],"into":[64],"unified":[66],"framework.":[67],"Based":[68],"on":[69,91],"benchmark,":[71],"provide":[74],"empirical":[75],"evidence":[76],"that":[77,102],"previous":[78],"datasets":[79],"with":[80,112],"scenarios":[82],"suffer":[83],"tunnel":[85],"vision,":[86],"whereas":[87],"decision-making":[89],"relies":[90],"long-term,":[92],"cross-scenario":[93],"causal":[94],"chains.":[95],"Extensive":[96],"evaluations":[97],"state-of-the-art":[99],"LLMs":[100,134],"reveal":[101],"current":[103],"models":[104],"struggle":[105],"accurately":[107],"simulate":[108],"these":[109],"complex":[110],"behaviors,":[111,161],"performance":[113],"plateauing":[114],"even":[115],"as":[116],"context":[117],"windows":[118],"expand.":[119],"Crucially,":[120],"systematic":[122],"comparison":[123],"between":[124],"simulated":[125],"behaviors":[128],"uncovers":[129],"fundamental":[131],"structural":[132],"bias:":[133],"tend":[135],"converge":[137],"toward":[138],"positive":[140],"average":[141],"person,":[142],"exhibiting":[143],"hyper-activity,":[144],"persona":[145],"homogenization,":[146],"Utopian":[149],"bias.":[150],"This":[151],"results":[152],"in":[153],"loss":[155],"individual":[157],"differences":[158],"long-tail":[160],"highlighting":[162],"critical":[163],"directions":[164],"future":[166],"high-fidelity":[167],"research.":[169]},"counts_by_year":[],"updated_date":"2026-04-11T06:19:08.300824","created_date":"2026-04-11T00:00:00"}
