{"id":"https://openalex.org/W4402683747","doi":"https://doi.org/10.18653/v1/2024.findings-acl.587","title":"Leveraging Entity Information for Cross-Modality Correlation Learning: The Entity-Guided Multimodal Summarization","display_name":"Leveraging Entity Information for Cross-Modality Correlation Learning: The Entity-Guided Multimodal Summarization","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4402683747","doi":"https://doi.org/10.18653/v1/2024.findings-acl.587"},"language":"en","primary_location":{"id":"doi:10.18653/v1/2024.findings-acl.587","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2024.findings-acl.587","pdf_url":"https://aclanthology.org/2024.findings-acl.587.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics ACL 2024","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://aclanthology.org/2024.findings-acl.587.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023184567","display_name":"Yanghai Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yanghai Zhang","raw_affiliation_strings":["State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100346529","display_name":"Ye Liu","orcid":"https://orcid.org/0000-0001-7237-7382"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ye Liu","raw_affiliation_strings":["State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101934104","display_name":"Shiwei Wu","orcid":"https://orcid.org/0000-0002-3206-6827"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiwei Wu","raw_affiliation_strings":["State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100324017","display_name":"Kai Zhang","orcid":"https://orcid.org/0000-0002-9609-7788"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Zhang","raw_affiliation_strings":["State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111258277","display_name":"Xukai Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xukai Liu","raw_affiliation_strings":["State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100453156","display_name":"Qi Liu","orcid":"https://orcid.org/0000-0001-6956-5550"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Liu","raw_affiliation_strings":["State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048237545","display_name":"Enhong Chen","orcid":"https://orcid.org/0000-0002-4835-4102"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Enhong Chen","raw_affiliation_strings":["State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Cognitive Intelligence , University of Science and Technology of China , Hefei , China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5023184567"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":0.3369,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.66219678,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"9851","last_page":"9862"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9793000221252441,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9779999852180481,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.8605430126190186},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7821429371833801},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.7621593475341797},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5300549864768982},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47156664729118347},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.42812132835388184},{"id":"https://openalex.org/keywords/correlation","display_name":"Correlation","score":0.4104384779930115},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07659706473350525}],"concepts":[{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.8605430126190186},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7821429371833801},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.7621593475341797},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5300549864768982},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47156664729118347},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.42812132835388184},{"id":"https://openalex.org/C117220453","wikidata":"https://www.wikidata.org/wiki/Q5172842","display_name":"Correlation","level":2,"score":0.4104384779930115},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07659706473350525},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/2024.findings-acl.587","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2024.findings-acl.587","pdf_url":"https://aclanthology.org/2024.findings-acl.587.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics ACL 2024","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/2024.findings-acl.587","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/2024.findings-acl.587","pdf_url":"https://aclanthology.org/2024.findings-acl.587.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Findings of the Association for Computational Linguistics ACL 2024","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2376276132","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G3085993365","display_name":null,"funder_award_id":"(Grant No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G37568934","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6013138505","display_name":null,"funder_award_id":"21501100","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6764517672","display_name":null,"funder_award_id":"U20A202","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6770163833","display_name":null,"funder_award_id":"2308085Q","funder_id":"https://openalex.org/F4320334897","funder_display_name":"Natural Science Foundation of Anhui Province"},{"id":"https://openalex.org/G6859851492","display_name":null,"funder_award_id":"U20A20229","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7726157001","display_name":null,"funder_award_id":"Grant No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8073943209","display_name":null,"funder_award_id":"U20A2022","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8385868538","display_name":null,"funder_award_id":"WK2150110034","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G8473338416","display_name":null,"funder_award_id":"2021YFF0901000","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G8951484681","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320334897","display_name":"Natural Science Foundation of Anhui Province","ror":null},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4402683747.pdf","grobid_xml":"https://content.openalex.org/works/W4402683747.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2366403280","https://openalex.org/W1495108544","https://openalex.org/W2091301346","https://openalex.org/W3148229873","https://openalex.org/W4389760904","https://openalex.org/W2150160875","https://openalex.org/W4242223894","https://openalex.org/W4306886878","https://openalex.org/W1517524280","https://openalex.org/W4323520239"],"abstract_inverted_index":{"The":[0],"rapid":[1],"increase":[2],"in":[3,9],"multimedia":[4],"data":[5,57,109],"has":[6],"spurred":[7],"advancements":[8],"Multimodal":[10,13,82],"Summarization":[11,83],"with":[12,94],"Output":[14],"(MSMO),":[15],"which":[16,140],"aims":[17],"to":[18,43,97,145],"produce":[19],"a":[20,40,51,124],"multimodal":[21,35,92],"summary":[22,113],"that":[23],"integrates":[24],"both":[25],"text":[26],"and":[27,37,68,100],"relevant":[28],"images.The":[29],"inherent":[30],"heterogeneity":[31],"of":[32,46,136],"content":[33],"within":[34],"inputs":[36],"outputs":[38],"presents":[39],"significant":[41],"challenge":[42],"the":[44,63,69,74,134,137,143],"execution":[45],"MSMO.Traditional":[47],"approaches":[48],"typically":[49],"adopt":[50],"holistic":[52],"perspective":[53],"on":[54,88,129],"coarse":[55],"image-text":[56],"or":[58],"individual":[59],"visual":[60,108],"objects,":[61],"overlooking":[62],"essential":[64],"connections":[65],"between":[66],"objects":[67],"entities":[70],"they":[71],"represent.To":[72],"integrate":[73],"fine-grained":[75],"entity":[76,147],"knowledge,":[77],"we":[78],"propose":[79],"an":[80],"Entity-Guided":[81],"model":[84],"(EGMS).Our":[85],"model,":[86],"building":[87],"BART,":[89],"utilizes":[90],"dual":[91],"encoders":[93],"shared":[95],"weights":[96],"process":[98],"text-image":[99],"entity-image":[101],"information":[102,148],"concurrently.A":[103],"gating":[104],"mechanism":[105],"then":[106],"combines":[107],"for":[110],"enhanced":[111],"textual":[112],"generation,":[114],"while":[115],"image":[116],"selection":[117],"is":[118],"refined":[119],"through":[120],"knowledge":[121],"distillation":[122],"from":[123],"pretrained":[125],"vision-language":[126],"model.Extensive":[127],"experiments":[128],"public":[130],"MSMO":[131,150],"dataset":[132],"validate":[133],"superiority":[135],"EGMS":[138],"method,":[139],"also":[141],"prove":[142],"necessity":[144],"incorporate":[146],"into":[149],"problem.":[151]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2025-10-10T00:00:00"}
