{"id":"https://openalex.org/W4406858541","doi":"https://doi.org/10.1109/apsipaasc63619.2025.10848846","title":"GMNER-LF: Generative Multi-modal Named Entity Recognition Based on LLM with Information Fusion","display_name":"GMNER-LF: Generative Multi-modal Named Entity Recognition Based on LLM with Information Fusion","publication_year":2024,"publication_date":"2024-12-03","ids":{"openalex":"https://openalex.org/W4406858541","doi":"https://doi.org/10.1109/apsipaasc63619.2025.10848846"},"language":"en","primary_location":{"id":"doi:10.1109/apsipaasc63619.2025.10848846","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc63619.2025.10848846","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003968318","display_name":"Hui-Yun Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huiyun Hu","raw_affiliation_strings":["State Grid Shandong Electric Power Company Dezhou Power Supply Company,Dezhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Grid Shandong Electric Power Company Dezhou Power Supply Company,Dezhou,China","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Junda Kong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Junda Kong","raw_affiliation_strings":["State Grid Shandong Electric Power Company Dezhou Power Supply Company,Dezhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Grid Shandong Electric Power Company Dezhou Power Supply Company,Dezhou,China","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Fei Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fei Wang","raw_affiliation_strings":["State Grid Shandong Electric Power Company Dezhou Power Supply Company,Dezhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Grid Shandong Electric Power Company Dezhou Power Supply Company,Dezhou,China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100552674","display_name":"Hongzhi Sun","orcid":"https://orcid.org/0009-0004-4484-4843"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hongzhi Sun","raw_affiliation_strings":["State Grid Shandong Electric Power Company Dezhou Power Supply Company,Dezhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Grid Shandong Electric Power Company Dezhou Power Supply Company,Dezhou,China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112127940","display_name":"Yang Ge","orcid":"https://orcid.org/0000-0001-6282-138X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang Ge","raw_affiliation_strings":["State Grid Shandong Electric Power Company Dezhou Power Supply Company,Dezhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Grid Shandong Electric Power Company Dezhou Power Supply Company,Dezhou,China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100771377","display_name":"Bo Xiao","orcid":"https://orcid.org/0000-0003-3392-3293"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Xiao","raw_affiliation_strings":["Beijing University of Posts and Telecommunications,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3055,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.68627137,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10679","display_name":"Service-Oriented Architecture and Web Services","score":0.9700999855995178,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7083162069320679},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.695048451423645},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.6859260201454163},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.5858818292617798},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5308996438980103},{"id":"https://openalex.org/keywords/information-fusion","display_name":"Information fusion","score":0.5112149715423584},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3775702714920044},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.09717732667922974}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7083162069320679},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.695048451423645},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.6859260201454163},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.5858818292617798},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5308996438980103},{"id":"https://openalex.org/C2982962833","wikidata":"https://www.wikidata.org/wiki/Q17092450","display_name":"Information fusion","level":2,"score":0.5112149715423584},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3775702714920044},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.09717732667922974},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipaasc63619.2025.10848846","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc63619.2025.10848846","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W2907492528","https://openalex.org/W3011594683","https://openalex.org/W3092692431","https://openalex.org/W3116194881","https://openalex.org/W4225757376","https://openalex.org/W4287854428","https://openalex.org/W4287887518","https://openalex.org/W4308608663","https://openalex.org/W4385571080","https://openalex.org/W4385573951","https://openalex.org/W4389519297","https://openalex.org/W4389520264","https://openalex.org/W4389523688","https://openalex.org/W4402684284","https://openalex.org/W6748687733","https://openalex.org/W6851819690"],"related_works":["https://openalex.org/W2380075625","https://openalex.org/W4390718435","https://openalex.org/W4390549206","https://openalex.org/W3137171911","https://openalex.org/W4379540039","https://openalex.org/W4237784285","https://openalex.org/W2374712251","https://openalex.org/W2355579697","https://openalex.org/W4360871138","https://openalex.org/W3208972923"],"abstract_inverted_index":{"Multi-modal":[0],"Named":[1,14],"Entity":[2,15],"Recognition":[3,16],"(MNER)":[4],"leverages":[5],"visual":[6],"information":[7,105,158],"to":[8,63,101,109,124],"enhance":[9],"the":[10,27,68,81,86,107,121,136,148,160,172],"effectiveness":[11],"of":[12,128,139,151],"text-only":[13],"(NER).":[17],"Currently,":[18],"many":[19],"methods":[20],"are":[21],"based":[22],"on":[23,178],"sequence":[24],"label,":[25],"but":[26,153],"model":[28],"architecture":[29],"is":[30,118],"relatively":[31],"complex.":[32],"Large":[33],"Language":[34],"Model":[35],"(LLM)":[36],"has":[37,175],"recently":[38],"demonstrated":[39],"powerful":[40],"generative":[41,55,170],"and":[42,96,130,133,181],"comprehension":[43],"abilities,":[44],"so":[45,79],"we":[46,58,71,90],"propose":[47],"GMNER-LF,":[48],"a":[49,76,92,98],"new":[50],"paradigm":[51],"for":[52,67],"MNER":[53],"with":[54,168],"method.":[56],"Firstly,":[57],"retrieve":[59],"relevant":[60],"image-text":[61],"pairs":[62],"provide":[64],"prior":[65],"knowledge":[66,138,150],"recognition.":[69],"Secondly,":[70],"construct":[72],"our":[73],"task":[74,78],"into":[75,120],"MRC":[77],"that":[80,166],"LLM":[82,122,129],"can":[83],"better":[84],"understand":[85],"problem.":[87],"In":[88],"addition,":[89],"design":[91],"multi-modal":[93,115,131],"fusion":[94,112,116,127],"module":[95,117],"add":[97],"gating":[99,161],"mechanism":[100],"help":[102],"filter":[103],"noise":[104],"in":[106],"image":[108],"obtain":[110],"high-quality":[111],"representations.":[113],"The":[114,141],"injected":[119],"block":[123],"achieve":[125],"deep":[126],"representations":[132],"fully":[134,146],"explore":[135],"internal":[137,149],"LLM.":[140],"proposed":[142,173],"method":[143,174],"not":[144],"only":[145],"explores":[147],"LLM,":[152],"also":[154],"filters":[155],"important":[156],"modal":[157],"through":[159],"mechanism.":[162],"Experimental":[163],"results":[164],"show":[165],"compared":[167],"other":[169],"methods,":[171],"improved":[176],"performance":[177],"both":[179],"Twitter-2015":[180],"Twitter-2017":[182],"datasets.":[183]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
