{"id":"https://openalex.org/W4408355643","doi":"https://doi.org/10.1109/icassp49660.2025.10890454","title":"WMAJL: Watcher-Mediated Attention Joint Learning Model for Multimodal Relation Extraction","display_name":"WMAJL: Watcher-Mediated Attention Joint Learning Model for Multimodal Relation Extraction","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408355643","doi":"https://doi.org/10.1109/icassp49660.2025.10890454"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10890454","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890454","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071751357","display_name":"Yunrui Dong","orcid":null},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yunrui Dong","raw_affiliation_strings":["University of Electronic Science and Technology of China,School of Computer Science and Engineering,Chengdu,China,611731"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China,School of Computer Science and Engineering,Chengdu,China,611731","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081385896","display_name":"Guiduo Duan","orcid":"https://orcid.org/0000-0003-4448-6906"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guiduo Duan","raw_affiliation_strings":["University of Electronic Science and Technology of China,School of Computer Science and Engineering,Chengdu,China,611731"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China,School of Computer Science and Engineering,Chengdu,China,611731","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5104260111","display_name":"Tianxi Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I207528943","display_name":"Chengdu Medical College","ror":"https://ror.org/01c4jmp52","country_code":"CN","type":"healthcare","lineage":["https://openalex.org/I207528943"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianxi Huang","raw_affiliation_strings":["College of Humanities and General Education,Chengdu Textile College,Chengdu,China,611731"],"affiliations":[{"raw_affiliation_string":"College of Humanities and General Education,Chengdu Textile College,Chengdu,China,611731","institution_ids":["https://openalex.org/I207528943"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100778545","display_name":"Yunhao Li","orcid":"https://orcid.org/0000-0003-1704-3050"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunhao Li","raw_affiliation_strings":["University of Electronic Science and Technology of China,Laboratory of Intelligent Collaborative Computing,Chengdu,China,611731"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China,Laboratory of Intelligent Collaborative Computing,Chengdu,China,611731","institution_ids":["https://openalex.org/I150229711"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5071751357"],"corresponding_institution_ids":["https://openalex.org/I150229711"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.02096335,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9894999861717224,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9451000094413757,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7310891151428223},{"id":"https://openalex.org/keywords/joint","display_name":"Joint (building)","score":0.6477131247520447},{"id":"https://openalex.org/keywords/relationship-extraction","display_name":"Relationship extraction","score":0.5983983278274536},{"id":"https://openalex.org/keywords/relation","display_name":"Relation (database)","score":0.5698260068893433},{"id":"https://openalex.org/keywords/joint-attention","display_name":"Joint attention","score":0.48277416825294495},{"id":"https://openalex.org/keywords/extraction","display_name":"Extraction (chemistry)","score":0.44946035742759705},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4313841760158539},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.2580414414405823},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.11749127507209778},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10742917656898499},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.10505390167236328},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.041998207569122314}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7310891151428223},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.6477131247520447},{"id":"https://openalex.org/C153604712","wikidata":"https://www.wikidata.org/wiki/Q7310755","display_name":"Relationship extraction","level":3,"score":0.5983983278274536},{"id":"https://openalex.org/C25343380","wikidata":"https://www.wikidata.org/wiki/Q277521","display_name":"Relation (database)","level":2,"score":0.5698260068893433},{"id":"https://openalex.org/C137878579","wikidata":"https://www.wikidata.org/wiki/Q9636076","display_name":"Joint attention","level":3,"score":0.48277416825294495},{"id":"https://openalex.org/C4725764","wikidata":"https://www.wikidata.org/wiki/Q844704","display_name":"Extraction (chemistry)","level":2,"score":0.44946035742759705},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4313841760158539},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.2580414414405823},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.11749127507209778},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10742917656898499},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.10505390167236328},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.041998207569122314},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C138496976","wikidata":"https://www.wikidata.org/wiki/Q175002","display_name":"Developmental psychology","level":1,"score":0.0},{"id":"https://openalex.org/C170154142","wikidata":"https://www.wikidata.org/wiki/Q150737","display_name":"Architectural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C205778803","wikidata":"https://www.wikidata.org/wiki/Q38404","display_name":"Autism","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10890454","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890454","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322108","display_name":"Ministry of Science and Technology","ror":"https://ror.org/032e49973"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W143521272","https://openalex.org/W2053101950","https://openalex.org/W2053238041","https://openalex.org/W2146960529","https://openalex.org/W2194775991","https://openalex.org/W2474574787","https://openalex.org/W2798298921","https://openalex.org/W2964166731","https://openalex.org/W3011594683","https://openalex.org/W3035524453","https://openalex.org/W3114632476","https://openalex.org/W3166170409","https://openalex.org/W3207972321","https://openalex.org/W4229024390","https://openalex.org/W4287854428","https://openalex.org/W4390479123","https://openalex.org/W4391164085","https://openalex.org/W4399435816","https://openalex.org/W6640963894","https://openalex.org/W6732370935","https://openalex.org/W6752178629","https://openalex.org/W6755207826"],"related_works":["https://openalex.org/W2976808399","https://openalex.org/W2609844752","https://openalex.org/W2331316773","https://openalex.org/W4392969631","https://openalex.org/W4285246823","https://openalex.org/W4226278302","https://openalex.org/W4221160509","https://openalex.org/W2547211086","https://openalex.org/W2538200646","https://openalex.org/W4234497699"],"abstract_inverted_index":{"In":[0],"the":[1,10,21,37,74,101,108,138,158,206,228],"domain":[2],"of":[3,23,31,39,104,110,134,145,184,193,203],"Multimodal":[4],"Relation":[5],"Extraction":[6],"(MRE),":[7],"we":[8],"present":[9],"$\\color{Red}{\\text{W}}$atcher-$\\color{Red}{\\text{M}}$ediated":[11],"$\\color{Red}{\\text{A}}$ttention":[12],"$\\color{Red}{\\text{J}}$oint":[13],"$\\color{Red}{\\text{L}}$earning":[14],"Model":[15],"($\\color{Red}{\\text{WMAJL}}$),":[16],"a":[17,81,131,190,216],"novel":[18],"approach":[19],"addressing":[20],"challenges":[22],"modality":[24,56],"alignment":[25,57],"noise,":[26],"cross-modal":[27,87],"fusion":[28,88],"disparity,":[29],"preservation":[30],"textual":[32,95],"relative":[33,127],"position":[34,128],"information,":[35,129],"and":[36,50,64,96,119,214],"distinctiveness":[38],"classification":[40,171],"labels.":[41],"WMAJL":[42,146],"employs":[43],"an":[44],"integrative":[45],"framework":[46],"leveraging":[47],"contrastive":[48],"learning":[49],"variational":[51],"autoencoder":[52],"constraints":[53],"to":[54,73,160,189,226],"mitigate":[55],"noise":[58,68],"by":[59,89,154,174,198],"prioritizing":[60],"relevant":[61],"semantic":[62],"data":[63],"effectively":[65],"reducing":[66],"extraneous":[67],"that":[69,125],"does":[70],"not":[71],"contribute":[72],"task.":[75],"The":[76,181],"model\u2019s":[77],"innovative":[78],"architecture":[79],"includes":[80],"mediator":[82],"watcher,":[83],"which":[84,156],"facilitates":[85],"enhanced":[86],"enabling":[90],"nuanced":[91],"information":[92],"exchange":[93],"between":[94],"visual":[97],"modalities":[98],"while":[99],"preserving":[100],"unique":[102],"characteristics":[103],"each":[105],"modality.":[106],"Additionally,":[107],"design":[109],"auxiliary":[111],"tasks,":[112],"such":[113],"as":[114,196],"Named":[115],"Entity":[116],"Recognition":[117],"(NER),":[118],"output":[120],"supervision":[121],"constructs":[122],"loss":[123,151],"functions":[124],"preserve":[126],"ensuring":[130],"precise":[132],"depiction":[133],"entity":[135],"relationships":[136],"throughout":[137],"multilayer":[139],"encoding":[140],"processes.":[141],"A":[142],"key":[143],"differentiator":[144],"is":[147],"its":[148,199],"label-centric":[149],"self-information":[150],"technique,":[152],"inspired":[153],"InfoNCE,":[155],"trains":[157],"model":[159],"cluster":[161],"similar":[162],"relation":[163,179],"labels":[164],"in":[165],"semantically":[166],"coherent":[167],"areas,":[168],"thereby":[169],"optimizing":[170],"label":[172],"uniqueness":[173],"discerning":[175],"subtle":[176],"differences":[177],"among":[178],"types.":[180],"synergistic":[182],"application":[183],"these":[185],"strategies":[186],"has":[187],"led":[188],"significant":[191],"enhancement":[192],"WMAJL\u2019s":[194,224],"performance,":[195],"evidenced":[197],"state-of-the-art":[200],"F1":[201],"score":[202],"$\\color{Red}{84.93\\%}$":[204],"on":[205],"MNRE":[207],"dataset.":[208],"This":[209],"achievement":[210],"surpasses":[211],"existing":[212],"benchmarks":[213],"sets":[215],"new":[217],"standard":[218],"for":[219],"multimodal":[220],"knowledge":[221],"extraction,":[222],"underscoring":[223],"potential":[225],"revolutionize":[227],"MRE":[229],"landscape.":[230]},"counts_by_year":[],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
