{"id":"https://openalex.org/W2969663619","doi":"https://doi.org/10.1145/3321505","title":"Video Question Answering via Knowledge-based Progressive Spatial-Temporal Attention Network","display_name":"Video Question Answering via Knowledge-based Progressive Spatial-Temporal Attention Network","publication_year":2019,"publication_date":"2019-04-30","ids":{"openalex":"https://openalex.org/W2969663619","doi":"https://doi.org/10.1145/3321505","mag":"2969663619"},"language":"en","primary_location":{"id":"doi:10.1145/3321505","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3321505","pdf_url":null,"source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051494566","display_name":"Weike Jin","orcid":"https://orcid.org/0000-0002-3132-5567"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weike Jin","raw_affiliation_strings":["Zhejiang University, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079260216","display_name":"Zhou Zhao","orcid":"https://orcid.org/0000-0001-6121-0384"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhou Zhao","raw_affiliation_strings":["Zhejiang University, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100696471","display_name":"Yimeng Li","orcid":"https://orcid.org/0000-0002-5658-3706"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yimeng Li","raw_affiliation_strings":["Zhejiang University, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104245706","display_name":"Jie Li","orcid":"https://orcid.org/0009-0008-9885-6144"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Li","raw_affiliation_strings":["Zhejiang University, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101485989","display_name":"Jun Xiao","orcid":"https://orcid.org/0000-0002-6142-9914"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Xiao","raw_affiliation_strings":["Zhejiang University, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008666077","display_name":"Yueting Zhuang","orcid":"https://orcid.org/0000-0001-9017-2508"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yueting Zhuang","raw_affiliation_strings":["Zhejiang University, China"],"affiliations":[{"raw_affiliation_string":"Zhejiang University, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5051494566"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":1.1134,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.82189636,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"15","issue":"2s","first_page":"1","last_page":"22"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9919999837875366,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9796000123023987,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.9159440398216248},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8416082859039307},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.7408086061477661},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5787692666053772},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4962514042854309},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.49330273270606995},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.48538291454315186},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.4807717204093933},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.47610270977020264},{"id":"https://openalex.org/keywords/natural-language-understanding","display_name":"Natural language understanding","score":0.4378723204135895},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.43709737062454224},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.38448232412338257},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.35153037309646606}],"concepts":[{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.9159440398216248},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8416082859039307},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.7408086061477661},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5787692666053772},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4962514042854309},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.49330273270606995},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.48538291454315186},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.4807717204093933},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.47610270977020264},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.4378723204135895},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.43709737062454224},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.38448232412338257},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.35153037309646606},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3321505","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3321505","pdf_url":null,"source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7900000214576721,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G2316476382","display_name":null,"funder_award_id":"No.61602405,No.61836002,No.61572431,No.61751209","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3209259326","display_name":null,"funder_award_id":"LR19F020002,LZ17F020001","funder_id":"https://openalex.org/F4320338464","funder_display_name":"Natural Science Foundation of Zhejiang Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320338464","display_name":"Natural Science Foundation of Zhejiang Province","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":69,"referenced_works":["https://openalex.org/W102708294","https://openalex.org/W804133461","https://openalex.org/W1493490255","https://openalex.org/W1514535095","https://openalex.org/W1586939924","https://openalex.org/W1801721664","https://openalex.org/W1933349210","https://openalex.org/W1947481528","https://openalex.org/W1964763677","https://openalex.org/W1983927101","https://openalex.org/W2016089260","https://openalex.org/W2042708146","https://openalex.org/W2064675550","https://openalex.org/W2080133951","https://openalex.org/W2094728533","https://openalex.org/W2097117768","https://openalex.org/W2112912048","https://openalex.org/W2131744502","https://openalex.org/W2136480620","https://openalex.org/W2142192571","https://openalex.org/W2142900973","https://openalex.org/W2166348853","https://openalex.org/W2194775991","https://openalex.org/W2251287417","https://openalex.org/W2293453011","https://openalex.org/W2302963717","https://openalex.org/W2346425926","https://openalex.org/W2412393473","https://openalex.org/W2463565445","https://openalex.org/W2511108736","https://openalex.org/W2553418567","https://openalex.org/W2560920409","https://openalex.org/W2565656701","https://openalex.org/W2606982687","https://openalex.org/W2612228435","https://openalex.org/W2615497679","https://openalex.org/W2620666060","https://openalex.org/W2732016772","https://openalex.org/W2735159761","https://openalex.org/W2737435850","https://openalex.org/W2765716052","https://openalex.org/W2766690867","https://openalex.org/W2798786641","https://openalex.org/W2808203533","https://openalex.org/W2808647806","https://openalex.org/W2897182555","https://openalex.org/W2897857500","https://openalex.org/W2951008357","https://openalex.org/W2951278025","https://openalex.org/W2951619830","https://openalex.org/W2953106684","https://openalex.org/W2953276893","https://openalex.org/W2962749469","https://openalex.org/W2962779575","https://openalex.org/W2962835968","https://openalex.org/W2962938145","https://openalex.org/W2962949233","https://openalex.org/W2963383024","https://openalex.org/W2963398599","https://openalex.org/W2963503066","https://openalex.org/W2963656855","https://openalex.org/W2963672682","https://openalex.org/W2963781647","https://openalex.org/W2963954913","https://openalex.org/W2964118342","https://openalex.org/W2964138017","https://openalex.org/W3099768435","https://openalex.org/W4236265809","https://openalex.org/W4236965008"],"related_works":["https://openalex.org/W3134247745","https://openalex.org/W4226243593","https://openalex.org/W3172691639","https://openalex.org/W4285816982","https://openalex.org/W3157284875","https://openalex.org/W2259406085","https://openalex.org/W2099715052","https://openalex.org/W4213176082","https://openalex.org/W4220955952","https://openalex.org/W1566366091"],"abstract_inverted_index":{"Visual":[0],"Question":[1],"Answering":[2],"(VQA)":[3],"is":[4,36,74,98,187,202],"a":[5,28,33,69,76,91,158,180,190,209,228],"challenging":[6],"task":[7],"that":[8,201],"has":[9,52],"gained":[10],"increasing":[11],"attention":[12,162,192,213],"from":[13,179,204],"both":[14,170],"the":[15,19,41,45,59,80,87,103,108,110,129,148,152,176,195,217,243],"computer":[16],"vision":[17],"and":[18,82,131,172],"natural":[20,31,92],"language":[21],"processing":[22],"communities":[23],"in":[24,30,56,86,107],"recent":[25],"years.":[26],"Given":[27],"question":[29,64,95,120,223,231],"language,":[32],"VQA":[34],"system":[35],"designed":[37],"to":[38,44,118,146,164,215],"automatically":[39],"generate":[40],"answer":[42],"according":[43],"referenced":[46],"visual":[47,63,84],"content.":[48],"Though":[49],"there":[50],"recently":[51],"been":[53],"much":[54],"intereset":[55],"this":[57,123,166],"topic,":[58],"existing":[60],"work":[61],"of":[62,79,102,112,134,151,175,198,245],"answering":[65,96,149,224,232],"mainly":[66],"focuses":[67],"on":[68,238],"single":[70],"static":[71],"image,":[72],"which":[73],"only":[75,127],"small":[77],"part":[78],"dynamic":[81],"sequential":[83],"data":[85],"real":[88],"world.":[89],"As":[90],"extension,":[93],"video":[94,119,135,177,219,222,230],"(VideoQA)":[97],"less":[99],"explored.":[100],"Because":[101],"inherent":[104],"temporal":[105,132],"structure":[106],"video,":[109],"approaches":[111],"ImageQA":[113],"may":[114],"be":[115],"ineffectively":[116],"applied":[117],"answering.":[121],"In":[122],"article,":[124],"we":[125,156,207],"not":[126],"take":[128],"spatial":[130],"dimension":[133],"content":[136],"into":[137],"account":[138],"but":[139],"also":[140],"employ":[141],"an":[142],"external":[143],"knowledge":[144,185],"base":[145],"improve":[147],"ability":[150],"network.":[153,183],"More":[154],"specifically,":[155],"propose":[157],"knowledge-based":[159],"progressive":[160,211],"spatial-temporal":[161,212],"network":[163,214],"tackle":[165],"problem.":[167],"We":[168,226],"obtain":[169],"objects":[171],"region":[173,181],"features":[174],"frames":[178],"proposal":[182],"The":[184,234],"representation":[186,220],"generated":[188],"by":[189],"word-level":[191],"mechanism":[193],"using":[194],"comment":[196],"information":[197],"each":[199],"object":[200],"extracted":[203],"DBpedia.":[205],"Then,":[206],"develop":[208],"question-knowledge-guided":[210],"learn":[216],"joint":[218],"for":[221],"task.":[225],"construct":[227],"large-scale":[229],"dataset.":[233],"extensive":[235],"experiments":[236],"based":[237],"two":[239],"different":[240],"datasets":[241],"validate":[242],"effectiveness":[244],"our":[246],"method.":[247]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2019-08-29T00:00:00"}
