{"id":"https://openalex.org/W7117464804","doi":"https://doi.org/10.1145/3714394.3756290","title":"MemMod4CVQA: Using Memory Models to Infer Causal Relationships for Visual Question Answering on Life-Log Data","display_name":"MemMod4CVQA: Using Memory Models to Infer Causal Relationships for Visual Question Answering on Life-Log Data","publication_year":2025,"publication_date":"2025-10-12","ids":{"openalex":"https://openalex.org/W7117464804","doi":"https://doi.org/10.1145/3714394.3756290"},"language":null,"primary_location":{"id":"doi:10.1145/3714394.3756290","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3714394.3756290","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Companion of the 2025 ACM International Joint Conference on Pervasive and Ubiquitous Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3714394.3756290","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112597368","display_name":"Sohil Khan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210148827","display_name":"Birla Institute of Technology and Science, Pilani - Goa Campus","ror":"https://ror.org/046sh6j17","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210148827","https://openalex.org/I74796645"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Sohil Khan","raw_affiliation_strings":["Department of Electronics and Electrical Engineering, BITS Pilani K.K. Birla Goa Campus, Goa, India"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Electrical Engineering, BITS Pilani K.K. Birla Goa Campus, Goa, India","institution_ids":["https://openalex.org/I4210148827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121509679","display_name":"Rakshit Mishra","orcid":null},"institutions":[{"id":"https://openalex.org/I4210148827","display_name":"Birla Institute of Technology and Science, Pilani - Goa Campus","ror":"https://ror.org/046sh6j17","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210148827","https://openalex.org/I74796645"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Rakshit Mishra","raw_affiliation_strings":["Department of Electronics and Electrical Engineering, BITS Pilani K.K. Birla Goa Campus, Goa, India"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Electrical Engineering, BITS Pilani K.K. Birla Goa Campus, Goa, India","institution_ids":["https://openalex.org/I4210148827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121468356","display_name":"Mehlam Songerwala","orcid":null},"institutions":[{"id":"https://openalex.org/I4210148827","display_name":"Birla Institute of Technology and Science, Pilani - Goa Campus","ror":"https://ror.org/046sh6j17","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210148827","https://openalex.org/I74796645"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Mehlam Songerwala","raw_affiliation_strings":["Department of Electronics and Electrical Engineering, BITS Pilani K.K. Birla Goa Campus, Goa, India"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Electrical Engineering, BITS Pilani K.K. Birla Goa Campus, Goa, India","institution_ids":["https://openalex.org/I4210148827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121471315","display_name":"Meera Radhakrishnan","orcid":null},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Meera Radhakrishnan","raw_affiliation_strings":["Data Science Institute, University of Technology Sydney, Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"Data Science Institute, University of Technology Sydney, Sydney, Australia","institution_ids":["https://openalex.org/I114017466"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033187487","display_name":"Dulanga Weerakoon","orcid":null},"institutions":[{"id":"https://openalex.org/I4210167254","display_name":"Singapore-MIT Alliance for Research and Technology","ror":"https://ror.org/05yb3w112","country_code":"SG","type":"education","lineage":["https://openalex.org/I4210167254"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Dulanga Weerakoon","raw_affiliation_strings":["M3S, Singapore-MIT Alliance for Research and Technology (SMART) Centre, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"M3S, Singapore-MIT Alliance for Research and Technology (SMART) Centre, Singapore, Singapore","institution_ids":["https://openalex.org/I4210167254"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045309067","display_name":"Vigneshwaran Subbaraju","orcid":"https://orcid.org/0000-0002-4276-5939"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Vigneshwaran Subbaraju","raw_affiliation_strings":["IHPC, Agency for Science, Technology and Research, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"IHPC, Agency for Science, Technology and Research, Singapore, Singapore","institution_ids":["https://openalex.org/I115228651"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023938040","display_name":"Sougata Sen","orcid":"https://orcid.org/0000-0002-2466-0025"},"institutions":[{"id":"https://openalex.org/I4210148827","display_name":"Birla Institute of Technology and Science, Pilani - Goa Campus","ror":"https://ror.org/046sh6j17","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210148827","https://openalex.org/I74796645"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sougata Sen","raw_affiliation_strings":["Department of Computer Science and Information Systems, BITS Pilani K.K. Birla Goa Campus, Goa, Goa, India"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Information Systems, BITS Pilani K.K. Birla Goa Campus, Goa, Goa, India","institution_ids":["https://openalex.org/I4210148827"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5112597368"],"corresponding_institution_ids":["https://openalex.org/I4210148827"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.65031126,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1517","last_page":"1523"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9785000085830688,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9785000085830688,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.00279999990016222,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.002300000051036477,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.7792999744415283},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.6128000020980835},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5358999967575073},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.49729999899864197},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4871000051498413},{"id":"https://openalex.org/keywords/causal-model","display_name":"Causal model","score":0.46059998869895935},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.42590001225471497},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.39660000801086426},{"id":"https://openalex.org/keywords/conjunction","display_name":"Conjunction (astronomy)","score":0.3869999945163727}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7961000204086304},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.7792999744415283},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.6128000020980835},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5950999855995178},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5419999957084656},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5358999967575073},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.49729999899864197},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4871000051498413},{"id":"https://openalex.org/C11671645","wikidata":"https://www.wikidata.org/wiki/Q5054567","display_name":"Causal model","level":2,"score":0.46059998869895935},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.42590001225471497},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.39660000801086426},{"id":"https://openalex.org/C59656382","wikidata":"https://www.wikidata.org/wiki/Q191536","display_name":"Conjunction (astronomy)","level":2,"score":0.3869999945163727},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.38339999318122864},{"id":"https://openalex.org/C88576662","wikidata":"https://www.wikidata.org/wiki/Q18646","display_name":"Episodic memory","level":3,"score":0.36579999327659607},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.334199994802475},{"id":"https://openalex.org/C163504300","wikidata":"https://www.wikidata.org/wiki/Q2364925","display_name":"Causal structure","level":2,"score":0.3337000012397766},{"id":"https://openalex.org/C115086926","wikidata":"https://www.wikidata.org/wiki/Q17004651","display_name":"Causal reasoning","level":3,"score":0.3285999894142151},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.32359999418258667},{"id":"https://openalex.org/C12186640","wikidata":"https://www.wikidata.org/wiki/Q6815743","display_name":"Memory model","level":3,"score":0.31630000472068787},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.3111000061035156},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.28999999165534973},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.28859999775886536},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2849999964237213},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.27880001068115234},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.2750999927520752},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.27399998903274536},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.26429998874664307},{"id":"https://openalex.org/C197914299","wikidata":"https://www.wikidata.org/wiki/Q18650","display_name":"Semantic memory","level":3,"score":0.25270000100135803}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3714394.3756290","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3714394.3756290","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Companion of the 2025 ACM International Joint Conference on Pervasive and Ubiquitous Computing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3714394.3756290","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3714394.3756290","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Companion of the 2025 ACM International Joint Conference on Pervasive and Ubiquitous Computing","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.6094793677330017,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":4,"referenced_works":["https://openalex.org/W2735685223","https://openalex.org/W3003587073","https://openalex.org/W3013140753","https://openalex.org/W4411062771"],"related_works":[],"abstract_inverted_index":{"Egocentric":[0],"cameras":[1,16],"are":[2,25],"increasingly":[3],"adopted":[4],"as":[5],"an":[6,149],"effective":[7],"tool":[8],"that":[9,51,96,102,139,169],"aids":[10],"in":[11,72,88,178,183],"self-monitoring":[12],"by":[13,27],"individuals.":[14],"These":[15],"automatically":[17],"record":[18],"event":[19],"details":[20],"into":[21,63],"a":[22,64,94,116,133],"video":[23],"which":[24,159],"reviewed":[26],"the":[28,45,52,56,103,108,145,170,184],"users":[29,98],"later,":[30],"to":[31,99,128,143,175],"identify":[32,80],"items":[33,57],"of":[34,47,54,58,120,153],"interest.":[35],"However,":[36],"this":[37,86,89],"process":[38],"is":[39,141,160],"time-consuming":[40],"and":[41,125,147],"labor":[42],"intensive.":[43],"With":[44],"availability":[46],"LLMs,":[48,71],"we":[49,91,137],"posit":[50],"task":[53],"identifying":[55],"interest":[59],"can":[60,78,173],"be":[61],"automated":[62],"natural":[65],"language":[66],"Question-Answering":[67],"format.":[68],"Furthermore,":[69],"these":[70,130],"conjunction":[73],"with":[74],"memory":[75,117,127],"graph":[76],"models":[77],"help":[79],"causal":[81,126,157,179],"relationship":[82],"between":[83],"events.":[84],"To":[85],"end,":[87],"paper,":[90],"propose":[92],"MemMod4CVQA,":[93],"framework":[95,104,114,146,171],"enables":[97],"pose":[100],"questions":[101],"will":[105],"answer":[106,129],"using":[107],"egocentric":[109],"camera":[110],"details.":[111],"The":[112],"MemMod4CVQA":[113],"uses":[115],"model":[118],"comprising":[119],"semantics":[121],"memory,":[122,124],"episodic":[123],"questions.":[131],"Through":[132],"small":[134],"simulation-based":[135],"study":[136],"observed":[138],"it":[140],"possible":[142],"realize":[144],"obtain":[148],"overall":[150],"F1":[151],"score":[152],"44.80%":[154],"on":[155],"predicting":[156],"relationships,":[158],"22.10%":[161],"higher":[162],"than":[163],"standard":[164],"baseline":[165],"approaches.":[166],"We":[167],"believe":[168],"architecture":[172],"lead":[174],"significant":[176],"improvements":[177],"visual":[180],"question":[181],"answering":[182],"future.":[185]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-12-29T00:00:00"}
