{"id":"https://openalex.org/W7161682031","doi":"https://doi.org/10.48550/arxiv.2605.18734","title":"EgoExoMem: Cross-View Memory Reasoning over Synchronized Egocentric and Exocentric Videos","display_name":"EgoExoMem: Cross-View Memory Reasoning over Synchronized Egocentric and Exocentric Videos","publication_year":2026,"publication_date":"2026-05-18","ids":{"openalex":"https://openalex.org/W7161682031","doi":"https://doi.org/10.48550/arxiv.2605.18734"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.18734","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.18734","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.18734","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136474226","display_name":"Ruiping Liu","orcid":"https://orcid.org/0009-0000-1146-3412"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Ruiping","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136504849","display_name":"Junwei Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Junwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136457193","display_name":"Yufan Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yufan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136462421","display_name":"Di Wen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen, Di","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136486713","display_name":"Shaofang Quan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Quan, Shaofang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136461243","display_name":"Chengzhi Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Chengzhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136502146","display_name":"Jiaming Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jiaming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136466415","display_name":"Kailun Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Kailun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136497271","display_name":"Kunyu Peng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Kunyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136463371","display_name":"Rainer Stiefelhagen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stiefelhagen, Rainer","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8787999749183655,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8787999749183655,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.07270000129938126,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.0071000000461936,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/endocentric-and-exocentric","display_name":"Endocentric and exocentric","score":0.7150999903678894},{"id":"https://openalex.org/keywords/recall","display_name":"Recall","score":0.585099995136261},{"id":"https://openalex.org/keywords/novelty","display_name":"Novelty","score":0.5591999888420105},{"id":"https://openalex.org/keywords/embodied-cognition","display_name":"Embodied cognition","score":0.5450000166893005},{"id":"https://openalex.org/keywords/memory-model","display_name":"Memory model","score":0.36469998955726624},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.3546999990940094},{"id":"https://openalex.org/keywords/observer","display_name":"Observer (physics)","score":0.34869998693466187},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.3452000021934509}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7312999963760376},{"id":"https://openalex.org/C131042201","wikidata":"https://www.wikidata.org/wiki/Q493198","display_name":"Endocentric and exocentric","level":4,"score":0.7150999903678894},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.597599983215332},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.585099995136261},{"id":"https://openalex.org/C2778738651","wikidata":"https://www.wikidata.org/wiki/Q16546687","display_name":"Novelty","level":2,"score":0.5591999888420105},{"id":"https://openalex.org/C100609095","wikidata":"https://www.wikidata.org/wiki/Q1335050","display_name":"Embodied cognition","level":2,"score":0.5450000166893005},{"id":"https://openalex.org/C12186640","wikidata":"https://www.wikidata.org/wiki/Q6815743","display_name":"Memory model","level":3,"score":0.36469998955726624},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.3546999990940094},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3515999913215637},{"id":"https://openalex.org/C2780704645","wikidata":"https://www.wikidata.org/wiki/Q9251458","display_name":"Observer (physics)","level":2,"score":0.34869998693466187},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.3452000021934509},{"id":"https://openalex.org/C178278151","wikidata":"https://www.wikidata.org/wiki/Q7936607","display_name":"Visual memory","level":3,"score":0.34279999136924744},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.3402000069618225},{"id":"https://openalex.org/C169087156","wikidata":"https://www.wikidata.org/wiki/Q2131593","display_name":"Framing (construction)","level":2,"score":0.3400000035762787},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.33009999990463257},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.3075000047683716},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.29580000042915344},{"id":"https://openalex.org/C88576662","wikidata":"https://www.wikidata.org/wiki/Q18646","display_name":"Episodic memory","level":3,"score":0.29260000586509705},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.28850001096725464},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.28780001401901245},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.2872999906539917},{"id":"https://openalex.org/C21963081","wikidata":"https://www.wikidata.org/wiki/Q11337567","display_name":"Working memory","level":3,"score":0.2840999960899353},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2808000147342682},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2727000117301941},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2524000108242035}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.18734","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.18734","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.18734","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.18734","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Egocentric":[0],"memory":[1,35,98,125,146],"is":[2],"widely":[3],"used":[4],"in":[5],"embodied":[6],"intelligence,":[7],"but":[8],"it":[9],"may":[10],"be":[11],"insufficient":[12],"for":[13,33,68],"comprehensive":[14],"spatial-temporal":[15],"reasoning.":[16,147],"Inspired":[17],"by":[18],"human":[19],"recall":[20],"from":[21,105],"both":[22],"field":[23],"and":[24,40,52,85,93,123,136,142],"observer":[25],"perspectives,":[26],"we":[27,60],"introduce":[28],"EgoExoMem,":[29],"the":[30,107,109,140],"first":[31],"benchmark":[32],"cross-view":[34,53,86,145],"reasoning":[36],"over":[37,121],"synchronized":[38,69],"egocentric":[39],"exocentric":[41],"videos.":[42,71],"EgoExoMem":[43],"contains":[44],"$2.6K$":[45],"high-quality":[46],"MCQs":[47],"across":[48],"eight":[49],"temporal,":[50],"spatial,":[51],"QA":[54],"types.":[55],"To":[56],"support":[57],"dual-view":[58],"retrieval,":[59],"propose":[61],"E$^2$-Select,":[62],"a":[63],"training-free":[64],"frame":[65],"selection":[66],"method":[67],"ego-exo":[70],"It":[72],"combines":[73],"relevance-based":[74],"budget":[75],"allocation":[76],"with":[77],"per-view":[78],"k-DPP":[79],"sampling":[80],"to":[81],"handle":[82],"view":[83],"asymmetry":[84],"temporal":[87],"consistency.":[88],"Experiments":[89],"show":[90],"that":[91],"ego":[92],"exo":[94],"views":[95],"provide":[96],"complementary":[97],"cues,":[99],"while":[100],"existing":[101],"MLLMs":[102],"remain":[103],"far":[104],"solving":[106],"benchmark:":[108],"best":[110],"model":[111],"reaches":[112],"only":[113],"$55.3\\%$.":[114],"E$^2$-Select":[115],"achieves":[116],"state-of-the-art":[117],"performance":[118],"of":[119,144],"$58.2\\%$":[120],"frame-selection":[122],"RAG-based":[124],"baselines.":[126],"Further":[127],"analysis":[128],"reveals":[129],"systematic":[130],"view-preference":[131],"conflicts":[132],"between":[133],"question":[134],"framing":[135],"answer":[137],"grounding,":[138],"underscoring":[139],"novelty":[141],"challenge":[143]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-20T00:00:00"}
