{"id":"https://openalex.org/W2950028154","doi":"https://doi.org/10.1145/3323873.3325050","title":"Emotion Reinforced Visual Storytelling","display_name":"Emotion Reinforced Visual Storytelling","publication_year":2019,"publication_date":"2019-06-05","ids":{"openalex":"https://openalex.org/W2950028154","doi":"https://doi.org/10.1145/3323873.3325050","mag":"2950028154"},"language":"en","primary_location":{"id":"doi:10.1145/3323873.3325050","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3323873.3325050","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2019 on International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030541731","display_name":"Nanxing Li","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Nanxing Li","raw_affiliation_strings":["Tsinghua University &amp; Beijing National Research Center for Information Science and Technology (BNRist), Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University &amp; Beijing National Research Center for Information Science and Technology (BNRist), Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100378248","display_name":"Bei Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bei Liu","raw_affiliation_strings":["Microsoft Research Asia, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Asia, Beijing, China","institution_ids":["https://openalex.org/I4210113369"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068597652","display_name":"Zhizhong Han","orcid":"https://orcid.org/0000-0001-9540-9973"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhizhong Han","raw_affiliation_strings":["University of Maryland, College Park, MD, USA"],"affiliations":[{"raw_affiliation_string":"University of Maryland, College Park, MD, USA","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101691399","display_name":"Yu-Shen Liu","orcid":"https://orcid.org/0000-0001-7305-1915"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu-Shen Liu","raw_affiliation_strings":["Tsinghua University &amp; Beijing National Research Center for Information Science and Technology (BNRist), Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University &amp; Beijing National Research Center for Information Science and Technology (BNRist), Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5072029041","display_name":"Jianlong Fu","orcid":"https://orcid.org/0000-0002-1025-2012"},"institutions":[{"id":"https://openalex.org/I4210113369","display_name":"Microsoft Research Asia (China)","ror":"https://ror.org/0300m5276","country_code":"CN","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210113369"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianlong Fu","raw_affiliation_strings":["Microsoft Research Asia, Beijing , China"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Asia, Beijing , China","institution_ids":["https://openalex.org/I4210113369"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5030541731"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":1.4171,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.85302856,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"297","last_page":"305"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9749000072479248,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7313278913497925},{"id":"https://openalex.org/keywords/storytelling","display_name":"Storytelling","score":0.7118633985519409},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5908216238021851},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5007815361022949},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.45706453919410706},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4430108666419983},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.4369052052497864},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.41769009828567505},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.41182035207748413},{"id":"https://openalex.org/keywords/narrative","display_name":"Narrative","score":0.23362165689468384},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.10601216554641724}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7313278913497925},{"id":"https://openalex.org/C2776538412","wikidata":"https://www.wikidata.org/wiki/Q989963","display_name":"Storytelling","level":3,"score":0.7118633985519409},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5908216238021851},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5007815361022949},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.45706453919410706},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4430108666419983},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.4369052052497864},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.41769009828567505},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41182035207748413},{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.23362165689468384},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.10601216554641724},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3323873.3325050","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3323873.3325050","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2019 on International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.49000000953674316,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1514535095","https://openalex.org/W1895577753","https://openalex.org/W1895989618","https://openalex.org/W1897761818","https://openalex.org/W2066134726","https://openalex.org/W2075456404","https://openalex.org/W2099471712","https://openalex.org/W2101105183","https://openalex.org/W2112912048","https://openalex.org/W2119717200","https://openalex.org/W2125389028","https://openalex.org/W2183386595","https://openalex.org/W2188365844","https://openalex.org/W2302086703","https://openalex.org/W2528605210","https://openalex.org/W2549599535","https://openalex.org/W2552161745","https://openalex.org/W2559780844","https://openalex.org/W2740582239","https://openalex.org/W2745461083","https://openalex.org/W2768287968","https://openalex.org/W2798959609","https://openalex.org/W2888213795","https://openalex.org/W2893749619","https://openalex.org/W2904367110","https://openalex.org/W2963033554","https://openalex.org/W2963267809","https://openalex.org/W2963668753","https://openalex.org/W2963686907","https://openalex.org/W2963992143","https://openalex.org/W2964268978","https://openalex.org/W3037785019","https://openalex.org/W3104147459","https://openalex.org/W3106003309","https://openalex.org/W4289387529"],"related_works":["https://openalex.org/W2502115930","https://openalex.org/W4246396837","https://openalex.org/W2482350142","https://openalex.org/W3176240006","https://openalex.org/W3126451824","https://openalex.org/W1561927205","https://openalex.org/W3191453585","https://openalex.org/W4297672492","https://openalex.org/W2619203976","https://openalex.org/W2326151908"],"abstract_inverted_index":{"Automatic":[0],"story":[1],"generation":[2],"from":[3,19,34,61],"a":[4,109],"sequence":[5,37],"of":[6,38,99,111,115,182],"images,":[7],"i.e.,":[8],"visual":[9,103,148,190,200],"storytelling,":[10],"has":[11],"attracted":[12],"extensive":[13,213],"attention.":[14],"The":[15,105,180,204],"challenges":[16],"mainly":[17],"drive":[18],"modeling":[20,80],"rich":[21],"visually-inspired":[22],"human":[23,125],"emotions,":[24,84],"which":[25,119,147],"results":[26],"in":[27,102,146],"generating":[28,86],"diverse":[29],"yet":[30],"realistic":[31,188],"stories":[32,78,128,164],"even":[33],"the":[35,97,112,116,194,198],"same":[36],"images.":[39],"Existing":[40],"works":[41],"usually":[42],"adopt":[43],"sequence-based":[44],"generative":[45],"adversarial":[46,92,141],"networks":[47],"(GAN)":[48],"by":[49,79,131,138,171],"encoding":[50],"deterministic":[51],"image":[52,63,81],"content":[53,82,114],"(e.g.,":[54],"concept,":[55],"attribute),":[56],"while":[57],"neglecting":[58],"probabilistic":[59],"inference":[60],"an":[62],"over":[64],"emotion":[65,90,100,106,139,153,174,183],"space.":[66],"In":[67],"this":[68],"paper,":[69],"we":[70,95],"take":[71],"one":[72],"step":[73],"further":[74,136],"to":[75,123,162,189,207],"create":[76],"human-level":[77],"with":[83,143,212],"and":[85,135,152,187],"textual":[87],"paragraph":[88],"via":[89],"reinforced":[91,140],"learning.":[93],"Firstly,":[94],"introduce":[96],"concept":[98],"engaged":[101],"storytelling.":[104,191],"feature":[107],"is":[108,160],"representation":[110],"emotional":[113],"generated":[117,130,170],"story,":[118],"enables":[120],"our":[121,172],"model":[122,159,196],"capture":[124],"emotion.":[126],"Secondly,":[127],"are":[129,210],"recurrent":[132],"neural":[133],"network,":[134],"optimized":[137],"learning":[142],"three":[144],"critics,":[145],"relevance,":[149],"language":[150],"style,":[151],"consistency":[154],"can":[155],"be":[156],"ensured.":[157],"Our":[158],"able":[161],"generate":[163],"based":[165],"on":[166,197],"not":[167],"only":[168],"emotions":[169],"novel":[173],"generator,":[175],"but":[176],"also":[177],"customized":[178],"emotions.":[179],"introduction":[181],"brings":[184],"more":[185],"variety":[186],"We":[192],"evaluate":[193],"proposed":[195],"largest":[199],"storytelling":[201],"dataset":[202],"(VIST).":[203],"superior":[205],"performance":[206],"state-of-the-art":[208],"methods":[209],"shown":[211],"experiments.":[214]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
