{"id":"https://openalex.org/W2981591098","doi":"https://doi.org/10.1145/3343031.3350923","title":"Multimodal Dialog System","display_name":"Multimodal Dialog System","publication_year":2019,"publication_date":"2019-10-15","ids":{"openalex":"https://openalex.org/W2981591098","doi":"https://doi.org/10.1145/3343031.3350923","mag":"2981591098"},"language":"en","primary_location":{"id":"doi:10.1145/3343031.3350923","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3343031.3350923","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038612499","display_name":"Liqiang Nie","orcid":"https://orcid.org/0000-0003-1476-0273"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Liqiang Nie","raw_affiliation_strings":["Shandong University, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"Shandong University, Qingdao, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100368524","display_name":"Wenjie Wang","orcid":"https://orcid.org/0000-0002-5199-1428"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenjie Wang","raw_affiliation_strings":["Shandong University, Qingdao, China"],"affiliations":[{"raw_affiliation_string":"Shandong University, Qingdao, China","institution_ids":["https://openalex.org/I154099455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051332325","display_name":"Richang Hong","orcid":"https://orcid.org/0000-0001-5461-3986"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Richang Hong","raw_affiliation_strings":["Hefei University of Technology, Hefei, China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Hefei University of Technology, Hefei, China, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100377147","display_name":"Meng Wang","orcid":"https://orcid.org/0000-0002-3094-7735"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Meng Wang","raw_affiliation_strings":["Hefei University of Technology, Hefei, China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Hefei University of Technology, Hefei, China, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100393506","display_name":"Qi Tian","orcid":"https://orcid.org/0000-0002-7252-5047"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Tian","raw_affiliation_strings":["Noah's Ark Lab, Huawei, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Noah's Ark Lab, Huawei, Shenzhen, China","institution_ids":["https://openalex.org/I2250955327"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5038612499"],"corresponding_institution_ids":["https://openalex.org/I154099455"],"apc_list":null,"apc_paid":null,"fwci":2.8621,"has_fulltext":false,"cited_by_count":67,"citation_normalized_percentile":{"value":0.92985858,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1098","last_page":"1106"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8723545074462891},{"id":"https://openalex.org/keywords/dialog-box","display_name":"Dialog box","score":0.7464977502822876},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5686513781547546},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.48895323276519775},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4746951460838318},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.4414025843143463},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.43538007140159607},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.39482492208480835},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3304072618484497},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3203977346420288},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.26153016090393066}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8723545074462891},{"id":"https://openalex.org/C173853756","wikidata":"https://www.wikidata.org/wiki/Q86915","display_name":"Dialog box","level":2,"score":0.7464977502822876},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5686513781547546},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.48895323276519775},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4746951460838318},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.4414025843143463},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.43538007140159607},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39482492208480835},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3304072618484497},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3203977346420288},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.26153016090393066},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3343031.3350923","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3343031.3350923","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 27th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1514535095","https://openalex.org/W1933349210","https://openalex.org/W2078861931","https://openalex.org/W2101105183","https://openalex.org/W2130942839","https://openalex.org/W2194775991","https://openalex.org/W2250645263","https://openalex.org/W2251235149","https://openalex.org/W2339852062","https://openalex.org/W2349436533","https://openalex.org/W2400455482","https://openalex.org/W2558809543","https://openalex.org/W2560730294","https://openalex.org/W2586847566","https://openalex.org/W2739634080","https://openalex.org/W2765757915","https://openalex.org/W2768661419","https://openalex.org/W2798385473","https://openalex.org/W2798392716","https://openalex.org/W2798914047","https://openalex.org/W2891389695","https://openalex.org/W2891416139","https://openalex.org/W2897182555","https://openalex.org/W2897195437","https://openalex.org/W2897628926","https://openalex.org/W2951008357","https://openalex.org/W2956125353","https://openalex.org/W2962676842","https://openalex.org/W2963068985","https://openalex.org/W2963206148","https://openalex.org/W2963448850","https://openalex.org/W2963550483","https://openalex.org/W2963715136","https://openalex.org/W2963748384","https://openalex.org/W2964112275","https://openalex.org/W2964308564","https://openalex.org/W3101567279","https://openalex.org/W4211082256"],"related_works":["https://openalex.org/W2098987383","https://openalex.org/W2417260800","https://openalex.org/W2795961259","https://openalex.org/W1596203174","https://openalex.org/W2117933979","https://openalex.org/W4298396513","https://openalex.org/W2283130723","https://openalex.org/W103938586","https://openalex.org/W2104718772","https://openalex.org/W4233992201"],"abstract_inverted_index":{"On":[0],"the":[1,7,17,21,32,38,48,52,62,72,92,96,102,105,116,140,146,149,161,165,174,191,196],"shoulders":[2],"of":[3,24,104],"textual":[4,162],"dialog":[5,26],"systems,":[6,27],"multimodal":[8,25,107,150],"ones,":[9],"recently":[10],"have":[11],"engaged":[12],"increasing":[13],"attention,":[14],"especially":[15],"in":[16,41],"retail":[18],"domain.":[19],"Despite":[20],"commercial":[22],"value":[23],"they":[28],"still":[29],"suffer":[30],"from":[31],"following":[33],"challenges:":[34],"1)":[35],"automatically":[36],"generate":[37,115],"right":[39],"responses":[40],"appropriate":[42],"medium":[43,98],"forms;":[44],"2)":[45],"jointly":[46,159],"consider":[47],"visual":[49,166],"cues":[50],"and":[51,59,67,95,148,164,194],"side":[53],"information":[54],"while":[55],"selecting":[56],"product":[57],"images;":[58],"3)":[60],"guide":[61],"response":[63,93,151],"generation":[64],"with":[65,81],"multi-faceted":[66],"heterogeneous":[68],"knowledge.":[69],"To":[70],"address":[71],"aforementioned":[73],"issues,":[74],"we":[75],"present":[76],"a":[77,119,132,169,182],"Multimodal":[78],"diAloG":[79],"system":[80],"adaptIve":[82],"deCoders,":[83],"MAGIC":[84,89,180,189],"for":[85],"short.":[86],"In":[87],"particular,":[88],"first":[90],"judges":[91],"type":[94],"corresponding":[97],"form":[99],"via":[100,168],"understanding":[101],"intention":[103],"given":[106],"context.":[108],"Hereafter,":[109],"it":[110],"employs":[111],"adaptive":[112],"decoders":[113],"to":[114,127,138,144],"desired":[117],"responses:":[118],"simple":[120],"recurrent":[121],"neural":[122,170],"network":[123],"(RNN)":[124],"is":[125,136],"applied":[126],"generating":[128],"general":[129],"responses,":[130],"then":[131],"knowledge-aware":[133],"RNN":[134],"decoder":[135,152],"designed":[137],"encode":[139],"multiform":[141],"domain":[142],"knowledge":[143],"enrich":[145],"response,":[147],"incorporates":[153],"an":[154],"image":[155],"recommendation":[156],"model":[157,171],"which":[158],"considers":[160],"attributes":[163],"images":[167],"optimized":[172],"by":[173],"max-margin":[175],"loss.":[176],"We":[177],"comparatively":[178],"justify":[179],"over":[181],"benchmark":[183],"dataset.":[184],"Experiment":[185],"results":[186],"demonstrate":[187],"that":[188],"outperforms":[190],"existing":[192],"methods":[193],"achieves":[195],"state-of-the-art":[197],"performance.":[198]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":17},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":16},{"year":2020,"cited_by_count":4},{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
