{"id":"https://openalex.org/W4312825258","doi":"https://doi.org/10.1109/tpami.2022.3230934","title":"Knowledge-Enriched Attention Network With Group-Wise Semantic for Visual Storytelling","display_name":"Knowledge-Enriched Attention Network With Group-Wise Semantic for Visual Storytelling","publication_year":2022,"publication_date":"2022-12-21","ids":{"openalex":"https://openalex.org/W4312825258","doi":"https://doi.org/10.1109/tpami.2022.3230934","pmid":"https://pubmed.ncbi.nlm.nih.gov/37015429"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2022.3230934","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2022.3230934","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013006794","display_name":"Tengpeng Li","orcid":null},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Tengpeng Li","raw_affiliation_strings":["Department of Computer Science &#x0026; Technology, Tongji University, Shanghai, China","Frontiers Science Center for Intelligent Autonomous Systems, Shanghai, China","Key Laboratory of Embedded System and Service Computing (Ministry of Education), Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science &#x0026; Technology, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]},{"raw_affiliation_string":"Frontiers Science Center for Intelligent Autonomous Systems, Shanghai, China","institution_ids":[]},{"raw_affiliation_string":"Key Laboratory of Embedded System and Service Computing (Ministry of Education), Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058982350","display_name":"Hanli Wang","orcid":"https://orcid.org/0000-0002-9999-4871"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hanli Wang","raw_affiliation_strings":["Department of Computer Science &#x0026; Technology, Tongji University, Shanghai, China","Frontiers Science Center for Intelligent Autonomous Systems, Shanghai, China","Key Laboratory of Embedded System and Service Computing (Ministry of Education), Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science &#x0026; Technology, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]},{"raw_affiliation_string":"Frontiers Science Center for Intelligent Autonomous Systems, Shanghai, China","institution_ids":[]},{"raw_affiliation_string":"Key Laboratory of Embedded System and Service Computing (Ministry of Education), Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049557511","display_name":"Bin He","orcid":"https://orcid.org/0000-0003-3193-6269"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bin He","raw_affiliation_strings":["Frontiers Science Center for Intelligent Autonomous Systems, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Frontiers Science Center for Intelligent Autonomous Systems, Shanghai, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002277899","display_name":"Chang Wen Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Chang Wen Chen","raw_affiliation_strings":["Department of Computing, Hong Kong Polytechnic University, Hung Hom, Kowloon, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Computing, Hong Kong Polytechnic University, Hung Hom, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5013006794"],"corresponding_institution_ids":["https://openalex.org/I116953780"],"apc_list":null,"apc_paid":null,"fwci":1.3245,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.82009166,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"45","issue":"7","first_page":"8634","last_page":"8645"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7174688577651978},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.597143828868866},{"id":"https://openalex.org/keywords/group","display_name":"Group (periodic table)","score":0.545793354511261},{"id":"https://openalex.org/keywords/storytelling","display_name":"Storytelling","score":0.5316672325134277},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4553045630455017},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.4550808370113373},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3285595178604126},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3281935453414917},{"id":"https://openalex.org/keywords/narrative","display_name":"Narrative","score":0.16073492169380188}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7174688577651978},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.597143828868866},{"id":"https://openalex.org/C2781311116","wikidata":"https://www.wikidata.org/wiki/Q83306","display_name":"Group (periodic table)","level":2,"score":0.545793354511261},{"id":"https://openalex.org/C2776538412","wikidata":"https://www.wikidata.org/wiki/Q989963","display_name":"Storytelling","level":3,"score":0.5316672325134277},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4553045630455017},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.4550808370113373},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3285595178604126},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3281935453414917},{"id":"https://openalex.org/C199033989","wikidata":"https://www.wikidata.org/wiki/Q1318295","display_name":"Narrative","level":2,"score":0.16073492169380188},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2022.3230934","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2022.3230934","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:37015429","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37015429","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8899999856948853,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G5501368935","display_name":null,"funder_award_id":"61976159","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1522301498","https://openalex.org/W1956340063","https://openalex.org/W2108598243","https://openalex.org/W2123301721","https://openalex.org/W2154652894","https://openalex.org/W2194775991","https://openalex.org/W2251913848","https://openalex.org/W2277195237","https://openalex.org/W2295107390","https://openalex.org/W2559780844","https://openalex.org/W2561529111","https://openalex.org/W2567070169","https://openalex.org/W2579549467","https://openalex.org/W2914699769","https://openalex.org/W2953486038","https://openalex.org/W2963033554","https://openalex.org/W2963084599","https://openalex.org/W2963101956","https://openalex.org/W2963187786","https://openalex.org/W2963668753","https://openalex.org/W2963829244","https://openalex.org/W2963993699","https://openalex.org/W2964104941","https://openalex.org/W2964231884","https://openalex.org/W2966774251","https://openalex.org/W2986670728","https://openalex.org/W2996941455","https://openalex.org/W2998106530","https://openalex.org/W2998178282","https://openalex.org/W2998303222","https://openalex.org/W3034655362","https://openalex.org/W3035284526","https://openalex.org/W3087871082","https://openalex.org/W3095631487","https://openalex.org/W3100995281","https://openalex.org/W3107848485","https://openalex.org/W3128339783","https://openalex.org/W3174377922","https://openalex.org/W3176313262","https://openalex.org/W3176565349","https://openalex.org/W4385245566","https://openalex.org/W6631190155","https://openalex.org/W6678262379","https://openalex.org/W6682631176","https://openalex.org/W6731370813","https://openalex.org/W6739901393","https://openalex.org/W6784477534","https://openalex.org/W6898505805"],"related_works":["https://openalex.org/W2884441370","https://openalex.org/W1536421369","https://openalex.org/W2082193010","https://openalex.org/W4319988281","https://openalex.org/W2086118318","https://openalex.org/W2993120730","https://openalex.org/W1765898938","https://openalex.org/W2970945984","https://openalex.org/W2355818213","https://openalex.org/W4320006770"],"abstract_inverted_index":{"As":[0],"a":[1,19,70,97,117,129,145],"technically":[2],"challenging":[3],"topic,":[4],"visual":[5,181],"storytelling":[6,182],"aims":[7],"at":[8],"generating":[9],"an":[10,174],"imaginary":[11],"and":[12,29,63,87,111,125,159,168,187],"coherent":[13],"story":[14,148,170],"with":[15,75,133,151,184,201],"narrative":[16],"multi-sentences":[17],"from":[18,55,107],"group":[20],"of":[21,32,41,61,195,208],"relevant":[22],"images.":[23,46],"Existing":[24],"methods":[25],"often":[26],"generate":[27],"direct":[28],"rigid":[30],"descriptions":[31],"apparent":[33],"image-based":[34],"contents,":[35],"because":[36],"they":[37],"are":[38,85,114],"not":[39,51],"capable":[40],"exploring":[42],"implicit":[43,105],"information":[44],"beyond":[45],"Hence,":[47],"these":[48,68,112],"schemes":[49],"could":[50],"capture":[52],"consistent":[53,142],"dependencies":[54],"holistic":[56],"representation,":[57],"impairing":[58],"the":[59,140,161,180,192,196],"generation":[60,149,171],"reasonable":[62],"fluent":[64],"stories.":[65],"To":[66],"address":[67],"problems,":[69],"novel":[71,83],"knowledge-enriched":[72,98,162],"attention":[73,99,120,163],"network":[74,100],"group-wise":[76,130,165],"semantic":[77,131,166],"model":[78,150],"is":[79,101,136,154],"proposed.":[80],"Three":[81],"main":[82],"components":[84],"designed":[86,102],"supported":[88],"by":[89,116],"substantial":[90],"experiments":[91,178],"to":[92,103,122,138,156],"reveal":[93],"practical":[94],"advantages.":[95],"First,":[96],"extract":[104],"concepts":[106,113],"external":[108],"knowledge":[109],"system,":[110],"followed":[115],"cascade":[118],"cross-modal":[119],"mechanism":[121],"characterize":[123],"imaginative":[124],"concrete":[126],"representations.":[127],"Second,":[128],"module":[132,167],"second-order":[134],"pooling":[135],"developed":[137],"explore":[139],"globally":[141],"guidance.":[143],"Third,":[144],"unified":[146],"one-stage":[147],"encoder-decoder":[152],"structure":[153],"proposed":[155,197],"simultaneously":[157],"train":[158],"infer":[160],"network,":[164],"multi-modal":[169],"decoder":[172],"in":[173,214],"end-to-end":[175],"fashion.":[176],"Substantial":[177],"on":[179],"datasets":[183],"both":[185],"objective":[186],"subjective":[188],"evaluation":[189],"metrics":[190],"demonstrate":[191],"superior":[193],"performance":[194],"scheme":[198],"as":[199],"compared":[200],"other":[202],"state-of-the-art":[203],"methods.":[204],"The":[205],"source":[206],"code":[207],"this":[209],"work":[210],"can":[211],"be":[212],"found":[213],"https://mic.tongji.edu.cn.":[215]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
