{"id":"https://openalex.org/W4389988129","doi":"https://doi.org/10.1109/tmm.2023.3345172","title":"Keyword-Aware Relative Spatio-Temporal Graph Networks for Video Question Answering","display_name":"Keyword-Aware Relative Spatio-Temporal Graph Networks for Video Question Answering","publication_year":2023,"publication_date":"2023-12-20","ids":{"openalex":"https://openalex.org/W4389988129","doi":"https://doi.org/10.1109/tmm.2023.3345172"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2023.3345172","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3345172","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001675146","display_name":"Yi Cheng","orcid":"https://orcid.org/0000-0002-5940-0581"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]},{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]},{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Yi Cheng","raw_affiliation_strings":["Institute for Infocomm Research (I2R), Agency for Science, Technology and Research (A*STAR), Singapore","School of Computing, National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research (I2R), Agency for Science, Technology and Research (A*STAR), Singapore","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]},{"raw_affiliation_string":"School of Computing, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002207978","display_name":"Hehe Fan","orcid":"https://orcid.org/0000-0001-9572-2345"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hehe Fan","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Zhejiang, China","institution_ids":["https://openalex.org/I168879160"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101811045","display_name":"Dongyun Lin","orcid":"https://orcid.org/0000-0002-9694-3454"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Dongyun Lin","raw_affiliation_strings":["Institute for Infocomm Research (I2R), Agency for Science, Technology and Research (A*STAR), Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research (I2R), Agency for Science, Technology and Research (A*STAR), Singapore","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100649794","display_name":"Ying Sun","orcid":"https://orcid.org/0000-0002-7224-6726"},"institutions":[{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]},{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Ying Sun","raw_affiliation_strings":["Institute for Infocomm Research (I2R), Agency for Science, Technology and Research (A*STAR), Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research (I2R), Agency for Science, Technology and Research (A*STAR), Singapore","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016415049","display_name":"Mohan Kankanhalli","orcid":"https://orcid.org/0000-0002-4846-2015"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Mohan Kankanhalli","raw_affiliation_strings":["School of Computing, National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computing, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077258552","display_name":"Joo\u2010Hwee Lim","orcid":"https://orcid.org/0000-0002-4103-3824"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]},{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Joo-Hwee Lim","raw_affiliation_strings":["Institute for Infocomm Research (I2R), Agency for Science, Technology and Research (A*STAR), Singapore","SCSE, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research (I2R), Agency for Science, Technology and Research (A*STAR), Singapore","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]},{"raw_affiliation_string":"SCSE, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5001675146"],"corresponding_institution_ids":["https://openalex.org/I115228651","https://openalex.org/I165932596","https://openalex.org/I3005327000"],"apc_list":null,"apc_paid":null,"fwci":1.2279,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.82235122,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"26","issue":null,"first_page":"6131","last_page":"6141"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9936000108718872,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8658645749092102},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.6257617473602295},{"id":"https://openalex.org/keywords/spatial-relation","display_name":"Spatial relation","score":0.5337516069412231},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.4282625913619995},{"id":"https://openalex.org/keywords/temporal-database","display_name":"Temporal database","score":0.4221291244029999},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.4209517240524292},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4089600741863251},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3284570574760437},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3003428280353546}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8658645749092102},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.6257617473602295},{"id":"https://openalex.org/C27511587","wikidata":"https://www.wikidata.org/wiki/Q2178623","display_name":"Spatial relation","level":2,"score":0.5337516069412231},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.4282625913619995},{"id":"https://openalex.org/C77277458","wikidata":"https://www.wikidata.org/wiki/Q1969246","display_name":"Temporal database","level":2,"score":0.4221291244029999},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.4209517240524292},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4089600741863251},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3284570574760437},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3003428280353546}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2023.3345172","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2023.3345172","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320696","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":55,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W2108598243","https://openalex.org/W2194775991","https://openalex.org/W2250539671","https://openalex.org/W2277195237","https://openalex.org/W2425121537","https://openalex.org/W2606982687","https://openalex.org/W2735159761","https://openalex.org/W2765716052","https://openalex.org/W2808124938","https://openalex.org/W2883891001","https://openalex.org/W2890904455","https://openalex.org/W2904452845","https://openalex.org/W2962949233","https://openalex.org/W2963524571","https://openalex.org/W2963541336","https://openalex.org/W2969897437","https://openalex.org/W2981582341","https://openalex.org/W2981985547","https://openalex.org/W2984008963","https://openalex.org/W2997344006","https://openalex.org/W2997805943","https://openalex.org/W2998166190","https://openalex.org/W3004413500","https://openalex.org/W3034730770","https://openalex.org/W3035265375","https://openalex.org/W3036900224","https://openalex.org/W3038528491","https://openalex.org/W3103668594","https://openalex.org/W3122622502","https://openalex.org/W3167092180","https://openalex.org/W3173367591","https://openalex.org/W3174490084","https://openalex.org/W3174873881","https://openalex.org/W3176896951","https://openalex.org/W3183719433","https://openalex.org/W3189890868","https://openalex.org/W3197457832","https://openalex.org/W4200631219","https://openalex.org/W4205492448","https://openalex.org/W4205817612","https://openalex.org/W4225414521","https://openalex.org/W4226060302","https://openalex.org/W4295036294","https://openalex.org/W4312245888","https://openalex.org/W4313186260","https://openalex.org/W4316661142","https://openalex.org/W4321350720","https://openalex.org/W4385572712","https://openalex.org/W6682864246","https://openalex.org/W6752083267","https://openalex.org/W6766978945","https://openalex.org/W6797109355","https://openalex.org/W6804277322","https://openalex.org/W6841299521"],"related_works":["https://openalex.org/W2384605597","https://openalex.org/W2363753014","https://openalex.org/W2385567678","https://openalex.org/W2355121635","https://openalex.org/W1967100394","https://openalex.org/W2016995243","https://openalex.org/W4312476862","https://openalex.org/W1495086659","https://openalex.org/W2382163390","https://openalex.org/W4254623023"],"abstract_inverted_index":{"The":[0,91],"main":[1],"challenge":[2],"in":[3,33],"video":[4,100],"question":[5,72,89,93],"answering":[6],"(VideoQA)":[7],"is":[8],"to":[9,40,52,70,82,86,98,114],"capture":[10,116],"and":[11,16,35,134,145,158],"understand":[12],"the":[13,110,117,126,141,155,162],"complex":[14],"spatial":[15,132,144],"temporal":[17,137,146],"relations":[18,46,105],"between":[19,47],"objects":[20],"based":[21],"on":[22,149,154],"given":[23],"questions.":[24],"Existing":[25],"graph-based":[26],"methods":[27],"for":[28,67],"VideoQA":[29],"usually":[30],"ignore":[31],"keywords":[32,87],"questions":[34],"employ":[36,78],"a":[37,60,135],"simple":[38],"graph":[39,65,101,133],"aggregate":[41],"features":[42,73,94],"without":[43],"considering":[44],"relative":[45,111],"objects,":[48],"which":[49,139],"may":[50],"lead":[51],"inferior":[53],"performance.":[54],"In":[55],"this":[56],"paper,":[57],"we":[58,77,108,124],"propose":[59],"Keyword-aware":[61],"Relative":[62],"Spatio-Temporal":[63],"(KRST)":[64],"network":[66],"VideoQA.":[68],"First,":[69],"make":[71],"aware":[74],"of":[75,143,164],"keywords,":[76],"an":[79,130],"attention":[80],"mechanism":[81],"assign":[83],"high":[84],"weights":[85],"during":[88],"encoding.":[90],"keyword-aware":[92],"are":[95,106],"then":[96],"used":[97],"guide":[99],"construction.":[102],"Second,":[103],"because":[104],"relative,":[107],"integrate":[109],"relation":[112,147],"modeling":[113],"better":[115],"spatio-temporal":[118,127],"dynamics":[119],"among":[120],"object":[121],"nodes.":[122],"Moreover,":[123],"disentangle":[125],"reasoning":[128,148],"into":[129],"object-level":[131],"frame-level":[136],"graph,":[138],"reduces":[140],"impact":[142],"each":[150],"other.":[151],"Extensive":[152],"experiments":[153],"TGIF-QA,":[156],"MSVD-QA":[157],"MSRVTT-QA":[159],"datasets":[160],"demonstrate":[161],"superiority":[163],"our":[165],"KRST":[166],"over":[167],"multiple":[168],"state-of-the-art":[169],"methods.":[170]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2025-10-10T00:00:00"}
