{"id":"https://openalex.org/W4387885774","doi":"https://doi.org/10.1109/tai.2023.3326416","title":"Text-Image Scene Graph Fusion for Multimodal Named Entity Recognition","display_name":"Text-Image Scene Graph Fusion for Multimodal Named Entity Recognition","publication_year":2023,"publication_date":"2023-10-23","ids":{"openalex":"https://openalex.org/W4387885774","doi":"https://doi.org/10.1109/tai.2023.3326416"},"language":"en","primary_location":{"id":"doi:10.1109/tai.2023.3326416","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2023.3326416","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113012130","display_name":"Jian Cheng","orcid":"https://orcid.org/0000-0002-9805-8870"},"institutions":[{"id":"https://openalex.org/I4210165649","display_name":"China Coal Research Institute (China)","ror":"https://ror.org/05dy2c135","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210165649"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jian Cheng","raw_affiliation_strings":["Research Institute of Mine Big Data, Chinese Institute of Coal Science, State Key Laboratory for Intelligent Coal Mining and Strata Control, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Research Institute of Mine Big Data, Chinese Institute of Coal Science, State Key Laboratory for Intelligent Coal Mining and Strata Control, Beijing, China","institution_ids":["https://openalex.org/I4210165649"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072081771","display_name":"Kaifang Long","orcid":"https://orcid.org/0000-0002-9460-0052"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaifang Long","raw_affiliation_strings":["College of Software, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"College of Software, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114859996","display_name":"Shuang Zhang","orcid":"https://orcid.org/0009-0004-3958-7213"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuang Zhang","raw_affiliation_strings":["College of Software, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"College of Software, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108950939","display_name":"Tian Zhang","orcid":"https://orcid.org/0000-0002-0538-1071"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tian Zhang","raw_affiliation_strings":["College of Software, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"College of Software, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068061222","display_name":"Lianbo Ma","orcid":"https://orcid.org/0000-0002-9969-211X"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lianbo Ma","raw_affiliation_strings":["College of Software, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"College of Software, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024454462","display_name":"Shi Cheng","orcid":"https://orcid.org/0000-0002-5129-995X"},"institutions":[{"id":"https://openalex.org/I88830068","display_name":"Shaanxi Normal University","ror":"https://ror.org/0170z8493","country_code":"CN","type":"education","lineage":["https://openalex.org/I88830068"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shi Cheng","raw_affiliation_strings":["College of Computer Science, Shaanxi Normal University, Xi&#x0027;an, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science, Shaanxi Normal University, Xi&#x0027;an, China","institution_ids":["https://openalex.org/I88830068"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058828628","display_name":"Yinan Guo","orcid":"https://orcid.org/0000-0002-4276-5410"},"institutions":[{"id":"https://openalex.org/I25757504","display_name":"China University of Mining and Technology","ror":"https://ror.org/01xt2dr21","country_code":"CN","type":"education","lineage":["https://openalex.org/I25757504"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yinan Guo","raw_affiliation_strings":["China University of Mining and Technology, Xuzhou, China"],"affiliations":[{"raw_affiliation_string":"China University of Mining and Technology, Xuzhou, China","institution_ids":["https://openalex.org/I25757504"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5113012130"],"corresponding_institution_ids":["https://openalex.org/I4210165649"],"apc_list":null,"apc_paid":null,"fwci":1.0832,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.79995292,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"5","issue":"6","first_page":"2828","last_page":"2839"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7827903032302856},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5698797702789307},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5321903228759766},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.510482907295227},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.48133978247642517},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.44974285364151},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.44238030910491943},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.410104364156723},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4023230969905853},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.11938077211380005},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.11437720060348511}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7827903032302856},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5698797702789307},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5321903228759766},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.510482907295227},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.48133978247642517},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.44974285364151},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.44238030910491943},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.410104364156723},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4023230969905853},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.11938077211380005},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.11437720060348511},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tai.2023.3326416","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2023.3326416","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":66,"referenced_works":["https://openalex.org/W67303140","https://openalex.org/W1940872118","https://openalex.org/W2077069816","https://openalex.org/W2097606805","https://openalex.org/W2116922044","https://openalex.org/W2117772341","https://openalex.org/W2141869602","https://openalex.org/W2250378130","https://openalex.org/W2251913848","https://openalex.org/W2296283641","https://openalex.org/W2506483933","https://openalex.org/W2579549467","https://openalex.org/W2745461083","https://openalex.org/W2788647998","https://openalex.org/W2798298921","https://openalex.org/W2890531016","https://openalex.org/W2896457183","https://openalex.org/W2901988662","https://openalex.org/W2950339735","https://openalex.org/W2953702735","https://openalex.org/W2962779575","https://openalex.org/W2962902328","https://openalex.org/W2962982907","https://openalex.org/W2963101956","https://openalex.org/W2963140597","https://openalex.org/W2963536419","https://openalex.org/W2963649796","https://openalex.org/W2963762755","https://openalex.org/W2966683369","https://openalex.org/W2970151005","https://openalex.org/W2970278082","https://openalex.org/W2998098272","https://openalex.org/W3003940182","https://openalex.org/W3010277541","https://openalex.org/W3034302623","https://openalex.org/W3034379414","https://openalex.org/W3035017890","https://openalex.org/W3035448883","https://openalex.org/W3092692431","https://openalex.org/W3093434718","https://openalex.org/W3102187622","https://openalex.org/W3117216739","https://openalex.org/W3127151332","https://openalex.org/W3176489198","https://openalex.org/W3176858586","https://openalex.org/W3199057778","https://openalex.org/W3213739863","https://openalex.org/W4212998232","https://openalex.org/W4224988036","https://openalex.org/W4225757376","https://openalex.org/W4287854428","https://openalex.org/W4293518017","https://openalex.org/W4304015092","https://openalex.org/W4304091743","https://openalex.org/W4312044727","https://openalex.org/W4321488427","https://openalex.org/W4382466550","https://openalex.org/W4382766254","https://openalex.org/W4385574193","https://openalex.org/W4388334650","https://openalex.org/W6602852861","https://openalex.org/W6640362995","https://openalex.org/W6757817989","https://openalex.org/W6842362430","https://openalex.org/W6843008972","https://openalex.org/W6854222420"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W17155033","https://openalex.org/W3207760230","https://openalex.org/W1496222301","https://openalex.org/W4312814274","https://openalex.org/W1590307681","https://openalex.org/W2536018345","https://openalex.org/W4285370786","https://openalex.org/W2296488620","https://openalex.org/W2358353312"],"abstract_inverted_index":{"With":[0],"the":[1,46,56,71,78,87,96,106,148,161,189,192,200,226,239,248],"popularity":[2],"and":[3,13,19,101,128,142,153,157,159,179,194,197,224,241],"widespread":[4],"use":[5,213],"of":[6,17,26,48,77,80,108,151,191,202,221,243],"social":[7,31],"media":[8,32],"platforms":[9],"such":[10],"as":[11],"Twitter":[12],"Facebook,":[14],"massive":[15],"amounts":[16],"text":[18,61,99,114,156,195],"image":[20,115,158,193],"information":[21,204],"posted":[22],"by":[23],"a":[24,42,113,122,129,167,217],"variety":[25],"users":[27],"have":[28,83],"flooded":[29],"these":[30],"platforms.":[33],"Thus,":[34],"multi-modal":[35,53,81,219],"named":[36,50,72,109],"entity":[37,73,227],"recognition":[38],"(MNER)":[39],"has":[40],"become":[41],"research":[43],"hotspot":[44],"for":[45,104,134,209,247],"task":[47],"extracting":[49],"entities":[51],"from":[52],"data.":[54],"Empirically,":[55],"visual":[57,102,203],"clues":[58],"unrelated":[59],"to":[60,93,146,187,198,215],"data":[62,82,100,196],"may":[63],"introduce":[64],"uncertain":[65],"or":[66],"even":[67],"negative":[68],"impacts":[69],"on":[70,234],"recognition.":[74],"The":[75],"considerations":[76],"relevance":[79],"been":[84],"ignored":[85],"in":[86,155],"previous":[88],"studies.":[89],"In":[90,171],"this":[91,172],"paper,":[92],"effectively":[94],"measure":[95],"relationship":[97],"between":[98],"cues":[103],"improving":[105],"accuracy":[107],"entities,":[110],"we":[111,137,174,212],"propose":[112],"scene":[116,144,163],"graph":[117],"fusion":[118,131],"(TISGF)":[119],"approach":[120],"with":[121],"text-image":[123,130],"similarity":[124,190],"assessment":[125],"module":[126,132],"(TISA)":[127],"(TIF)":[133],"MNER.":[135],"Specifically,":[136],"first":[138],"construct":[139],"two":[140,162,235],"(visual":[141],"textual)":[143],"graphs":[145,164],"exploit":[147],"joint":[149],"features":[150],"objects":[152],"relations":[154],"encode":[160],"separately":[165],"using":[166,229],"specific":[168],"encoder":[169],"pair.":[170],"way,":[173],"can":[175],"obtain":[176],"both":[177],"object-level":[178],"relationship-level":[180],"cross-modal":[181],"features.":[182],"Subsequently,":[183],"TISA":[184],"is":[185],"used":[186],"compute":[188],"determine":[199],"proportion":[201],"that":[205],"will":[206],"be":[207],"retained":[208],"fusion.":[210],"Finally,":[211],"TIF":[214],"achieve":[216],"unified":[218],"representation":[220],"each":[222],"word":[223],"predict":[225],"type":[228],"CRF.":[230],"Extensive":[231],"experiment":[232],"results":[233],"public":[236],"datasets":[237],"demonstrate":[238],"effectiveness":[240],"competitiveness":[242],"our":[244],"proposed":[245],"method":[246],"MNER":[249],"task.":[250]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":7}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
