{"id":"https://openalex.org/W7135195918","doi":"https://doi.org/10.48550/arxiv.2603.11213","title":"LLMs in social services: How does chatbot accuracy affect human accuracy?","display_name":"LLMs in social services: How does chatbot accuracy affect human accuracy?","publication_year":2026,"publication_date":"2026-03-11","ids":{"openalex":"https://openalex.org/W7135195918","doi":"https://doi.org/10.48550/arxiv.2603.11213"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.11213","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.11213","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.11213","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114336461","display_name":"Jennah Gosciak","orcid":"https://orcid.org/0009-0007-2180-8147"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gosciak, Jennah","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068713525","display_name":"Eric Giannella","orcid":"https://orcid.org/0000-0003-3473-4339"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Giannella, Eric","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038735592","display_name":"Zhaowen Guo","orcid":"https://orcid.org/0000-0002-0900-5866"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Zhaowen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129010874","display_name":"Michael Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Michael","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5087471530","display_name":"Allison Koenecke","orcid":"https://orcid.org/0000-0002-6233-8256"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koenecke, Allison","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12128","display_name":"AI in Service Interactions","score":0.46209999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12128","display_name":"AI in Service Interactions","score":0.46209999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11519","display_name":"Digital Mental Health Interventions","score":0.1137000024318695,"subfield":{"id":"https://openalex.org/subfields/3202","display_name":"Applied Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13197","display_name":"Spreadsheets and End-User Computing","score":0.11079999804496765,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/chatbot","display_name":"Chatbot","score":0.9718999862670898},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.572700023651123},{"id":"https://openalex.org/keywords/outreach","display_name":"Outreach","score":0.536899983882904},{"id":"https://openalex.org/keywords/affect","display_name":"Affect (linguistics)","score":0.42899999022483826},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.41019999980926514},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.3921000063419342}],"concepts":[{"id":"https://openalex.org/C2779041454","wikidata":"https://www.wikidata.org/wiki/Q870780","display_name":"Chatbot","level":2,"score":0.9718999862670898},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.572700023651123},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5533999800682068},{"id":"https://openalex.org/C2781400479","wikidata":"https://www.wikidata.org/wiki/Q11640","display_name":"Outreach","level":2,"score":0.536899983882904},{"id":"https://openalex.org/C2776035688","wikidata":"https://www.wikidata.org/wiki/Q1606558","display_name":"Affect (linguistics)","level":2,"score":0.42899999022483826},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.41019999980926514},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.3921000063419342},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.38690000772476196},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.36340001225471497},{"id":"https://openalex.org/C108827166","wikidata":"https://www.wikidata.org/wiki/Q175975","display_name":"Internet privacy","level":1,"score":0.3506999909877777},{"id":"https://openalex.org/C75630572","wikidata":"https://www.wikidata.org/wiki/Q538904","display_name":"Applied psychology","level":1,"score":0.34310001134872437},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3391999900341034},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.33869999647140503},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.32600000500679016},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.2711000144481659},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.2694000005722046},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.2533000111579895}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.11213","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.11213","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.11213","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.11213","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"display_name":"Zero hunger","score":0.6625434160232544,"id":"https://metadata.un.org/sdg/2"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Social":[0],"service":[1],"programs":[2],"like":[3],"the":[4,61,119,136,177,194,218,231],"Supplemental":[5],"Nutrition":[6],"Assistance":[7],"Program":[8],"(SNAP,":[9],"or":[10,33],"food":[11],"stamps)":[12],"have":[13],"eligibility":[14],"rules":[15],"that":[16,88,142,215],"can":[17],"be":[18,53],"challenging":[19],"to":[20,43,48,71,146,154],"understand.":[21],"For":[22],"nonprofit":[23,111],"caseworkers":[24,108],"who":[25],"often":[26],"support":[27],"clients":[28,49],"in":[29,114,118,135,148,204],"navigating":[30],"a":[31,41,78,89,104,129,187,213,224],"dozen":[32],"more":[34],"complex":[35],"programs,":[36],"LLM-based":[37,65],"chatbots":[38,166],"may":[39,52],"offer":[40],"means":[42],"provide":[44,72],"better,":[45],"faster":[46],"help":[47],"whose":[50],"situations":[51],"less":[54],"common.":[55],"In":[56],"this":[57],"paper,":[58],"we":[59,102,143,216],"measure":[60],"potential":[62],"effects":[63],"of":[64,83,132,233],"chatbot":[66,125,140,162,180,200,210],"suggestions":[67,126,141,181],"on":[68,190],"caseworkers'":[69],"ability":[70],"accurate":[73],"guidance.":[74],"We":[75],"first":[76],"created":[77],"770-question":[79],"multiple-choice":[80],"benchmark":[81,96],"dataset":[82],"difficult,":[84],"but":[85],"realistic":[86],"questions":[87,97,192],"caseworker":[90,170,184,205],"might":[91],"receive.":[92],"Next,":[93],"using":[94],"these":[95],"and":[98,127,229],"corresponding":[99],"expert-verified":[100],"answers,":[101],"conducted":[103],"randomized":[105],"experiment":[106],"with":[107,186,237],"recruited":[109],"from":[110,151],"outreach":[112],"organizations":[113],"Los":[115],"Angeles.":[116],"Caseworkers":[117,134],"control":[120,195],"condition":[121,138],"did":[122],"not":[123],"see":[124],"had":[128],"mean":[130],"accuracy":[131,150,171,206,211],"49%.":[133],"treatment":[137],"saw":[139],"artificially":[144],"varied":[145],"range":[147],"aggregate":[149],"low":[152],"(53%)":[153],"high":[155],"(100%).":[156],"Caseworker":[157],"performance":[158],"significantly":[159],"improves":[160],"as":[161,209],"quality":[163],"improves:":[164],"high-quality":[165],"(96-100%":[167],"accurate)":[168],"improved":[169],"by":[172],"27":[173],"percentage":[174],"points.":[175],"At":[176],"question-level,":[178],"incorrect":[179],"substantially":[182],"reduce":[183],"accuracy,":[185],"two-thirds":[188],"reduction":[189],"easy":[191],"where":[193],"group":[196],"performed":[197],"best":[198],"(without":[199],"suggestions).":[201],"Finally,":[202],"improvements":[203],"level":[207],"off":[208],"increases,":[212],"phenomenon":[214],"call":[217],"\"AI":[219],"underreliance":[220],"plateau,\"":[221],"which":[222],"is":[223],"concern":[225],"for":[226],"real-world":[227],"deployment":[228],"highlights":[230],"importance":[232],"evaluating":[234],"human-in-the-loop":[235],"tools":[236],"their":[238],"users.":[239]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-03-14T00:00:00"}
