{"id":"https://openalex.org/W3034425145","doi":"https://doi.org/10.1109/tmm.2020.3002667","title":"Adversarial Multimodal Network for Movie Story Question Answering","display_name":"Adversarial Multimodal Network for Movie Story Question Answering","publication_year":2020,"publication_date":"2020-06-15","ids":{"openalex":"https://openalex.org/W3034425145","doi":"https://doi.org/10.1109/tmm.2020.3002667","mag":"3034425145"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2020.3002667","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2020.3002667","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045800438","display_name":"Zhaoquan Yuan","orcid":"https://orcid.org/0000-0002-4083-5155"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhaoquan Yuan","raw_affiliation_strings":["School of Information Science and Technology, Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107942686","display_name":"S. Sun","orcid":"https://orcid.org/0009-0007-8115-945X"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siyuan Sun","raw_affiliation_strings":["Big Data Research Center and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Big Data Research Center and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080093489","display_name":"Lixin Duan","orcid":"https://orcid.org/0000-0002-0723-4016"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lixin Duan","raw_affiliation_strings":["Big Data Research Center and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Big Data Research Center and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100330875","display_name":"Changsheng Li","orcid":"https://orcid.org/0000-0001-9789-7632"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changsheng Li","raw_affiliation_strings":["School of Computer Science and Technology, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011680564","display_name":"Xiao Wu","orcid":"https://orcid.org/0000-0002-8322-8558"},"institutions":[{"id":"https://openalex.org/I4800084","display_name":"Southwest Jiaotong University","ror":"https://ror.org/00hn7w693","country_code":"CN","type":"education","lineage":["https://openalex.org/I4800084"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao Wu","raw_affiliation_strings":["School of Information Science and Technology, Southwest Jiaotong University, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Southwest Jiaotong University, Chengdu, China","institution_ids":["https://openalex.org/I4800084"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022636178","display_name":"Changsheng Xu","orcid":"https://orcid.org/0000-0001-8343-9665"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changsheng Xu","raw_affiliation_strings":["National Lab of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Lab of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5045800438"],"corresponding_institution_ids":["https://openalex.org/I4800084"],"apc_list":null,"apc_paid":null,"fwci":1.7586,"has_fulltext":false,"cited_by_count":28,"citation_normalized_percentile":{"value":0.87042078,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"23","issue":null,"first_page":"1744","last_page":"1756"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8690098524093628},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.6537253856658936},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.6186850070953369},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6051092147827148},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.56496262550354},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.5125443935394287},{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.4934314787387848},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.4881823658943176},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4755639433860779},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.4574512839317322},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4544726312160492},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4282373785972595},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.40837812423706055},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3456350564956665},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.12811732292175293}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8690098524093628},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.6537253856658936},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.6186850070953369},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6051092147827148},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.56496262550354},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.5125443935394287},{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.4934314787387848},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.4881823658943176},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4755639433860779},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.4574512839317322},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4544726312160492},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4282373785972595},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.40837812423706055},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3456350564956665},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.12811732292175293},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2020.3002667","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2020.3002667","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6499999761581421,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G1930596891","display_name":null,"funder_award_id":"61772436","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2347935519","display_name":null,"funder_award_id":"61772118","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5269759798","display_name":null,"funder_award_id":"61802053","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G681710594","display_name":null,"funder_award_id":"61806044","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7813065526","display_name":null,"funder_award_id":"2682019CX62","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":76,"referenced_works":["https://openalex.org/W1614298861","https://openalex.org/W1793121960","https://openalex.org/W1933349210","https://openalex.org/W2099471712","https://openalex.org/W2142192571","https://openalex.org/W2151498684","https://openalex.org/W2194775991","https://openalex.org/W2599940792","https://openalex.org/W2600067905","https://openalex.org/W2725249286","https://openalex.org/W2740702290","https://openalex.org/W2746097825","https://openalex.org/W2751486419","https://openalex.org/W2756766706","https://openalex.org/W2767171539","https://openalex.org/W2768661419","https://openalex.org/W2798786641","https://openalex.org/W2799088654","https://openalex.org/W2808124938","https://openalex.org/W2866912866","https://openalex.org/W2890718122","https://openalex.org/W2890904455","https://openalex.org/W2896294941","https://openalex.org/W2896457183","https://openalex.org/W2896902935","https://openalex.org/W2913618459","https://openalex.org/W2949431215","https://openalex.org/W2950577311","https://openalex.org/W2951008357","https://openalex.org/W2952319120","https://openalex.org/W2962749469","https://openalex.org/W2962910007","https://openalex.org/W2962938145","https://openalex.org/W2962959437","https://openalex.org/W2963140463","https://openalex.org/W2963143606","https://openalex.org/W2963215144","https://openalex.org/W2963403868","https://openalex.org/W2963477107","https://openalex.org/W2963541336","https://openalex.org/W2963662177","https://openalex.org/W2963689203","https://openalex.org/W2963781647","https://openalex.org/W2963791035","https://openalex.org/W2963890755","https://openalex.org/W2963969878","https://openalex.org/W2964118342","https://openalex.org/W2964138343","https://openalex.org/W2964303913","https://openalex.org/W2964322347","https://openalex.org/W2965313405","https://openalex.org/W2965527197","https://openalex.org/W2969127500","https://openalex.org/W2974161034","https://openalex.org/W2978395334","https://openalex.org/W2981578638","https://openalex.org/W2981582341","https://openalex.org/W2981963155","https://openalex.org/W2981985547","https://openalex.org/W2982139784","https://openalex.org/W2984402309","https://openalex.org/W4249013746","https://openalex.org/W4293650424","https://openalex.org/W4293749116","https://openalex.org/W4298392976","https://openalex.org/W4320013936","https://openalex.org/W4385245566","https://openalex.org/W6636510571","https://openalex.org/W6638318767","https://openalex.org/W6682086655","https://openalex.org/W6739901393","https://openalex.org/W6744782574","https://openalex.org/W6748579893","https://openalex.org/W6748686444","https://openalex.org/W6752062744","https://openalex.org/W6755207826"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W3088136942","https://openalex.org/W2949362007","https://openalex.org/W2775506363","https://openalex.org/W4290852288","https://openalex.org/W4388893791","https://openalex.org/W4283207562","https://openalex.org/W2963177403","https://openalex.org/W2330246314","https://openalex.org/W2949522393"],"abstract_inverted_index":{"Visual":[0],"question":[1,55],"answering":[2],"by":[3,66],"using":[4],"information":[5],"from":[6],"multiple":[7],"modalities":[8],"has":[9],"attracted":[10],"more":[11,13,69],"and":[12,29,75,81,127],"attention":[14],"in":[15,101,116],"recent":[16],"years.":[17],"However,":[18],"it":[19],"is":[20,92],"a":[21,42,68,89],"very":[22],"challenging":[23],"task,":[24],"as":[25],"the":[26,76,105,108,112,117,124,131],"visual":[27,109],"content":[28],"natural":[30],"language":[31],"have":[32],"quite":[33],"different":[34],"statistical":[35],"properties.":[36],"In":[37,57],"this":[38],"work,":[39],"we":[40,59],"present":[41],"method":[43],"called":[44],"Adversarial":[45],"Multimodal":[46],"Network":[47],"(AMN)":[48],"to":[49,61,94,103],"better":[50],"understand":[51],"video":[52,73,114],"stories":[53],"for":[54,72],"answering.":[56],"AMN,":[58],"propose":[60],"learn":[62],"multimodal":[63,119],"feature":[64],"representations":[65],"finding":[67],"coherent":[70],"subspace":[71],"clips":[74,115],"corresponding":[77],"texts":[78],"(e.g.,":[79],"subtitles":[80],"questions)":[82],"based":[83],"on":[84,123],"generative":[85],"adversarial":[86],"networks.":[87],"Moreover,":[88],"self-attention":[90],"mechanism":[91],"developed":[93],"enforce":[95],"our":[96,134],"newly":[97],"introduced":[98],"consistency":[99],"constraint":[100],"order":[102],"preserve":[104],"self-correlation":[106],"between":[107],"cues":[110],"of":[111,133],"original":[113],"learned":[118],"representations.":[120],"Extensive":[121],"experiments":[122],"benchmark":[125],"MovieQA":[126],"TVQA":[128],"datasets":[129],"show":[130],"effectiveness":[132],"proposed":[135],"AMN":[136],"over":[137],"other":[138],"published":[139],"state-of-the-art":[140],"methods.":[141]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":8}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
