{"id":"https://openalex.org/W7127334606","doi":"https://doi.org/10.1145/3774904.3792143","title":"ES-MemEval: Benchmarking Conversational Agents on Personalized Long-Term Emotional Support","display_name":"ES-MemEval: Benchmarking Conversational Agents on Personalized Long-Term Emotional Support","publication_year":2026,"publication_date":"2026-04-12","ids":{"openalex":"https://openalex.org/W7127334606","doi":"https://doi.org/10.1145/3774904.3792143"},"language":null,"primary_location":{"id":"doi:10.1145/3774904.3792143","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3774904.3792143","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2026","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3774904.3792143","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124957197","display_name":"Tiantian Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tiantian Chen","raw_affiliation_strings":["Tongji University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-7346-7670","affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124916674","display_name":"Jiaqi Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaqi Lu","raw_affiliation_strings":["Tongji University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0006-9236-4531","affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124920543","display_name":"Ying Shen","orcid":null},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ying Shen","raw_affiliation_strings":["Tongji University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-2966-7955","affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5124941215","display_name":"Lin Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Zhang","raw_affiliation_strings":["Tongji University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-4360-5523","affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14417935,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"5810","last_page":"5821"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.435699999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.435699999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.22370000183582306,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11519","display_name":"Digital Mental Health Interventions","score":0.05810000002384186,"subfield":{"id":"https://openalex.org/subfields/3202","display_name":"Applied Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7315999865531921},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.6863999962806702},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.6133999824523926},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5940999984741211},{"id":"https://openalex.org/keywords/sensemaking","display_name":"Sensemaking","score":0.4034999907016754},{"id":"https://openalex.org/keywords/user-modeling","display_name":"User modeling","score":0.36059999465942383},{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.3434000015258789}],"concepts":[{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7315999865531921},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7046999931335449},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.6863999962806702},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.6133999824523926},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5940999984741211},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.43320000171661377},{"id":"https://openalex.org/C2780554381","wikidata":"https://www.wikidata.org/wiki/Q2063340","display_name":"Sensemaking","level":2,"score":0.4034999907016754},{"id":"https://openalex.org/C67712803","wikidata":"https://www.wikidata.org/wiki/Q7901853","display_name":"User modeling","level":3,"score":0.36059999465942383},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3528999984264374},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.3434000015258789},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.33469998836517334},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.3278999924659729},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3118000030517578},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.2962999939918518},{"id":"https://openalex.org/C6438553","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Affective computing","level":2,"score":0.2962000072002411},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.295199990272522},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2750999927520752},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.25290000438690186}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3774904.3792143","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3774904.3792143","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2026","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2602.01885","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2602.01885","pdf_url":"https://arxiv.org/pdf/2602.01885","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:doi:10.48550/arxiv.2602.01885","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"}],"best_oa_location":{"id":"doi:10.1145/3774904.3792143","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3774904.3792143","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2026","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.5544096231460571,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G583652794","display_name":null,"funder_award_id":"62272343","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320329860","display_name":"National Science and Technology Major Project","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"have":[4],"shown":[5],"strong":[6],"potential":[7,174],"as":[8,29],"conversational":[9],"agents.":[10],"Yet,":[11],"their":[12],"effectiveness":[13],"remains":[14],"limited":[15],"by":[16],"deficiencies":[17],"in":[18,23,50,89],"robust":[19,183],"long-term":[20,25,35,90,115,141,190],"memory,":[21],"particularly":[22],"complex,":[24],"web-based":[26],"services":[27],"such":[28],"online":[30],"emotional":[31,91,116],"support.":[32],"However,":[33],"existing":[34],"dialogue":[36,99,192],"benchmarks":[37],"primarily":[38],"focus":[39],"on":[40,130],"static":[41],"and":[42,59,86,98,124,134,148,165,175,180,187],"explicit":[43,140],"fact":[44],"retrieval,":[45],"failing":[46],"to":[47],"evaluate":[48],"agents":[49],"critical":[51],"scenarios":[52],"where":[53],"user":[54,87,122,126,167],"information":[55,79],"is":[56,143],"dispersed,":[57],"implicit,":[58],"continuously":[60],"evolving.":[61],"To":[62,102],"address":[63],"this":[64],"gap,":[65],"we":[66,106],"introduce":[67],"ES-MemEval,":[68],"a":[69,110],"comprehensive":[70],"benchmark":[71],"that":[72,118,139],"systematically":[73],"evaluates":[74],"five":[75],"core":[76],"memory":[77,142,186],"capabilities:":[78],"extraction,":[80],"temporal":[81,163],"reasoning,":[82],"conflict":[83],"detection,":[84],"abstention,":[85],"modeling,":[88],"support":[92,103,117],"settings,":[93],"covering":[94],"question":[95],"answering,":[96],"summarization,":[97],"generation":[100],"tasks.":[101],"the":[104,153,173],"benchmark,":[105],"also":[107],"propose":[108],"EvoEmo,":[109],"multi-session":[111],"dataset":[112],"for":[113,145,189],"personalized":[114,191],"captures":[119],"fragmented,":[120],"implicit":[121],"disclosures":[123],"evolving":[125,166],"states.":[127,168],"Extensive":[128],"experiments":[129],"open-source":[131],"long-context,":[132],"commercial,":[133],"retrieval-augmented":[135],"(RAG)":[136],"LLMs":[137],"show":[138],"essential":[144],"reducing":[146],"hallucinations":[147],"enabling":[149],"effective":[150],"personalization.":[151],"At":[152],"same":[154],"time,":[155],"RAG":[156],"improves":[157],"factual":[158],"consistency":[159],"but":[160],"struggles":[161],"with":[162],"dynamics":[164],"These":[169],"findings":[170],"highlight":[171],"both":[172],"limitations":[176],"of":[177,185],"current":[178],"paradigms":[179],"motivate":[181],"more":[182],"integration":[184],"retrieval":[188],"systems.":[193]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-04T00:00:00"}
