{"id":"https://openalex.org/W7155363274","doi":"https://doi.org/10.48550/arxiv.2604.19787","title":"LLM Agents Predict Social Media Reactions but Do Not Outperform Text Classifiers: Benchmarking Simulation Accuracy Using 120K+ Personas of 1511 Humans","display_name":"LLM Agents Predict Social Media Reactions but Do Not Outperform Text Classifiers: Benchmarking Simulation Accuracy Using 120K+ Personas of 1511 Humans","publication_year":2026,"publication_date":"2026-03-31","ids":{"openalex":"https://openalex.org/W7155363274","doi":"https://doi.org/10.48550/arxiv.2604.19787"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.19787","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19787","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.19787","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020925570","display_name":"Ljubi\u0161a Boji\u0107","orcid":"https://orcid.org/0000-0002-5371-7975"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bojic, Ljubisa","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033783997","display_name":"Alexander Felfernig","orcid":"https://orcid.org/0000-0003-0108-3146"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Felfernig, Alexander","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127193098","display_name":"Bojana Dini\u0107","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dinic, Bojana","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134455433","display_name":"Velibor Ilic","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ilic, Velibor","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000758128","display_name":"Achim Rettinger","orcid":"https://orcid.org/0000-0003-4950-1167"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rettinger, Achim","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079925446","display_name":"Vera Mevorah","orcid":"https://orcid.org/0000-0002-4313-475X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mevorah, Vera","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5071797963","display_name":"Damian Trilling","orcid":"https://orcid.org/0000-0002-2586-0352"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Trilling, Damian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5020925570"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.18389999866485596,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.18389999866485596,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.1543000042438507,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.08290000259876251,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/replicate","display_name":"Replicate","score":0.5842999815940857},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.5532000064849854},{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.5027999877929688},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.4885999858379364},{"id":"https://openalex.org/keywords/categorization","display_name":"Categorization","score":0.40400001406669617},{"id":"https://openalex.org/keywords/generalizability-theory","display_name":"Generalizability theory","score":0.36640000343322754},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.36550000309944153},{"id":"https://openalex.org/keywords/corporate-governance","display_name":"Corporate governance","score":0.3384999930858612}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6478999853134155},{"id":"https://openalex.org/C2781162219","wikidata":"https://www.wikidata.org/wiki/Q26250693","display_name":"Replicate","level":2,"score":0.5842999815940857},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.5532000064849854},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5508000254631042},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.5027999877929688},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.4885999858379364},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45840001106262207},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.44190001487731934},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.40400001406669617},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.36640000343322754},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.36550000309944153},{"id":"https://openalex.org/C39389867","wikidata":"https://www.wikidata.org/wiki/Q380767","display_name":"Corporate governance","level":2,"score":0.3384999930858612},{"id":"https://openalex.org/C169903001","wikidata":"https://www.wikidata.org/wiki/Q3264987","display_name":"Reciprocity (cultural anthropology)","level":2,"score":0.3368000090122223},{"id":"https://openalex.org/C20685875","wikidata":"https://www.wikidata.org/wiki/Q7239678","display_name":"Predictive validity","level":2,"score":0.3312999904155731},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.3188000023365021},{"id":"https://openalex.org/C313442","wikidata":"https://www.wikidata.org/wiki/Q778556","display_name":"Persona","level":2,"score":0.314300000667572},{"id":"https://openalex.org/C202785102","wikidata":"https://www.wikidata.org/wiki/Q3500657","display_name":"Social simulation","level":2,"score":0.30410000681877136},{"id":"https://openalex.org/C199776023","wikidata":"https://www.wikidata.org/wiki/Q202875","display_name":"Negotiation","level":2,"score":0.2953999936580658},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.29510000348091125},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.274399995803833},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.267300009727478},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.2597000002861023},{"id":"https://openalex.org/C176856949","wikidata":"https://www.wikidata.org/wiki/Q2001676","display_name":"Offensive","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.2578999996185303},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.2556000053882599}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.19787","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19787","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.19787","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19787","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.5733245015144348,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Social":[0],"media":[1,69],"platforms":[2],"mediate":[3],"how":[4],"billions":[5],"form":[6],"opinions":[7],"and":[8,31,87,196,231],"engage":[9],"with":[10,100,116],"public":[11],"discourse.":[12],"As":[13],"autonomous":[14],"AI":[15,177,198],"agents":[16,39,50,95,143,165,178,189,205],"increasingly":[17],"participate":[18],"in":[19,65,190],"these":[20],"spaces,":[21],"understanding":[22],"their":[23,214],"behavioral":[24],"fidelity":[25],"becomes":[26],"critical":[27],"for":[28,192],"platform":[29],"governance":[30],"democratic":[32],"resilience.":[33],"Previous":[34],"work":[35],"demonstrates":[36],"that":[37,207],"LLM-powered":[38],"can":[40,51],"replicate":[41],"aggregate":[42],"survey":[43],"responses,":[44],"yet":[45],"few":[46],"studies":[47],"test":[48],"whether":[49],"predict":[52],"specific":[53,57],"individuals'":[54],"reactions":[55,70],"to":[56,186],"content.":[58],"This":[59],"study":[60],"benchmarks":[61],"LLM-based":[62],"agents'":[63],"accuracy":[64],"predicting":[66,193],"human":[67],"social":[68,180],"(like,":[71],"dislike,":[72],"comment,":[73],"share,":[74],"no":[75,210],"reaction)":[76],"across":[77,218],"120,000+":[78],"unique":[79],"agent-persona":[80],"combinations":[81],"derived":[82],"from":[83],"1,511":[84],"Serbian":[85],"participants":[86],"27":[88],"large":[89],"language":[90],"models.":[91],"In":[92],"Study":[93,109],"1,":[94],"achieved":[96,120],"70.7%":[97],"overall":[98],"accuracy,":[99],"LLM":[101,142],"choice":[102],"producing":[103],"a":[104],"13":[105],"percentage-point":[106],"performance":[107],"spread.":[108],"2":[110],"employed":[111],"binary":[112],"forced-choice":[113],"(like/dislike)":[114],"evaluation":[115],"chance-corrected":[117],"metrics.":[118],"Agents":[119],"Matthews":[121],"Correlation":[122],"Coefficient":[123],"(MCC)":[124],"of":[125,145,162,174,202],"0.29,":[126],"indicating":[127],"genuine":[128,159],"predictive":[129,148,160],"signal":[130],"beyond":[131],"chance.":[132],"However,":[133],"conventional":[134],"text-based":[135],"supervised":[136],"classifiers":[137],"using":[138,203],"TF-IDF":[139],"representations":[140],"outperformed":[141],"(MCC":[144],"0.36),":[146],"suggesting":[147],"gains":[149],"reflect":[150],"semantic":[151],"access":[152],"rather":[153],"than":[154],"uniquely":[155],"agentic":[156],"reasoning.":[157],"The":[158,200],"validity":[161],"zero-shot":[163,204],"persona-prompted":[164],"warns":[166],"against":[167],"potential":[168],"manipulation":[169],"through":[170],"easily":[171],"deploying":[172],"swarms":[173],"behaviorally":[175],"distinct":[176],"on":[179],"media,":[181],"while":[182],"simultaneously":[183],"offering":[184],"opportunities":[185],"use":[187],"such":[188],"simulations":[191],"polarization":[194],"dynamics":[195],"informing":[197],"policy.":[199],"advantage":[201],"is":[206],"they":[208],"require":[209],"task-specific":[211],"training,":[212],"making":[213],"large-scale":[215],"deployment":[216],"easy":[217],"diverse":[219],"contexts.":[220],"Limitations":[221],"include":[222],"single-country":[223],"sampling.":[224],"Future":[225],"research":[226],"should":[227],"explore":[228],"multilingual":[229],"testing":[230],"fine-tuning":[232],"approaches.":[233]},"counts_by_year":[],"updated_date":"2026-04-24T06:07:52.864757","created_date":"2026-04-24T00:00:00"}
