{"id":"https://openalex.org/W4224313128","doi":"https://doi.org/10.1145/3485447.3511946","title":"Context-Enriched Learning Models for Aligning Biomedical Vocabularies at Scale in the UMLS Metathesaurus","display_name":"Context-Enriched Learning Models for Aligning Biomedical Vocabularies at Scale in the UMLS Metathesaurus","publication_year":2022,"publication_date":"2022-04-25","ids":{"openalex":"https://openalex.org/W4224313128","doi":"https://doi.org/10.1145/3485447.3511946","pmid":"https://pubmed.ncbi.nlm.nih.gov/36108322"},"language":"en","primary_location":{"id":"doi:10.1145/3485447.3511946","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3485447.3511946","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3485447.3511946","source":{"id":"https://openalex.org/S4363608783","display_name":"Proceedings of the ACM Web Conference 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2022","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3485447.3511946","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066629222","display_name":"Vinh Nguyen","orcid":null},"institutions":[{"id":"https://openalex.org/I2800548410","display_name":"United States National Library of Medicine","ror":"https://ror.org/0060t0j89","country_code":"US","type":"archive","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I2800548410"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Vinh Nguyen","raw_affiliation_strings":["National Library of Medicine, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Library of Medicine, USA","institution_ids":["https://openalex.org/I2800548410"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064336316","display_name":"Hong Yung Yip","orcid":"https://orcid.org/0000-0003-1393-7890"},"institutions":[{"id":"https://openalex.org/I155781252","display_name":"University of South Carolina","ror":"https://ror.org/02b6qw903","country_code":"US","type":"education","lineage":["https://openalex.org/I155781252"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hong Yung Yip","raw_affiliation_strings":["University of South Carolina, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of South Carolina, USA","institution_ids":["https://openalex.org/I155781252"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015619335","display_name":"Goonmeet Bajaj","orcid":"https://orcid.org/0000-0003-0182-9200"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Goonmeet Bajaj","raw_affiliation_strings":["The Ohio State University, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Ohio State University, USA","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026459564","display_name":"Thilini Wijesiriwardene","orcid":"https://orcid.org/0000-0001-8431-8443"},"institutions":[{"id":"https://openalex.org/I155781252","display_name":"University of South Carolina","ror":"https://ror.org/02b6qw903","country_code":"US","type":"education","lineage":["https://openalex.org/I155781252"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Thilini Wijesiriwardene","raw_affiliation_strings":["University of South Carolina, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of South Carolina, USA","institution_ids":["https://openalex.org/I155781252"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040670143","display_name":"Vishesh Javangula","orcid":"https://orcid.org/0000-0002-7034-3725"},"institutions":[{"id":"https://openalex.org/I193531525","display_name":"George Washington University","ror":"https://ror.org/00y4zzh67","country_code":"US","type":"education","lineage":["https://openalex.org/I193531525"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vishesh Javangula","raw_affiliation_strings":["George Washington University, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"George Washington University, USA","institution_ids":["https://openalex.org/I193531525"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100755351","display_name":"Srinivasan Parthasarathy","orcid":"https://orcid.org/0000-0002-6062-6449"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Srinivasan Parthasarathy","raw_affiliation_strings":["The Ohio State University, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Ohio State University, USA","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028772801","display_name":"Amit Sheth","orcid":null},"institutions":[{"id":"https://openalex.org/I155781252","display_name":"University of South Carolina","ror":"https://ror.org/02b6qw903","country_code":"US","type":"education","lineage":["https://openalex.org/I155781252"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Amit Sheth","raw_affiliation_strings":["University of South Carolina, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of South Carolina, USA","institution_ids":["https://openalex.org/I155781252"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073807945","display_name":"Olivier Bodenreider","orcid":"https://orcid.org/0000-0003-4769-4217"},"institutions":[{"id":"https://openalex.org/I2800548410","display_name":"United States National Library of Medicine","ror":"https://ror.org/0060t0j89","country_code":"US","type":"archive","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I2800548410"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Olivier Bodenreider","raw_affiliation_strings":["National Library of Medicine, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Library of Medicine, USA","institution_ids":["https://openalex.org/I2800548410"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5066629222"],"corresponding_institution_ids":["https://openalex.org/I2800548410"],"apc_list":null,"apc_paid":null,"fwci":0.7275,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.69761526,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":97},"biblio":{"volume":"2022","issue":null,"first_page":"1037","last_page":"1046"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/unified-medical-language-system","display_name":"Unified Medical Language System","score":0.9415000677108765},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8111047744750977},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6782304048538208},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6632764935493469},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6428161859512329},{"id":"https://openalex.org/keywords/word-embedding","display_name":"Word embedding","score":0.5633556842803955},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5292320251464844},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5207297801971436},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4876474142074585},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.46946799755096436},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.10506758093833923},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.08259165287017822}],"concepts":[{"id":"https://openalex.org/C69505689","wikidata":"https://www.wikidata.org/wiki/Q455338","display_name":"Unified Medical Language System","level":2,"score":0.9415000677108765},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8111047744750977},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6782304048538208},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6632764935493469},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6428161859512329},{"id":"https://openalex.org/C2777462759","wikidata":"https://www.wikidata.org/wiki/Q18395344","display_name":"Word embedding","level":3,"score":0.5633556842803955},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5292320251464844},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5207297801971436},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4876474142074585},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.46946799755096436},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.10506758093833923},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.08259165287017822},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3485447.3511946","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3485447.3511946","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3485447.3511946","source":{"id":"https://openalex.org/S4363608783","display_name":"Proceedings of the ACM Web Conference 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2022","raw_type":"proceedings-article"},{"id":"pmid:36108322","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/36108322","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ... International World-Wide Web Conference. International WWW Conference","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:9455675","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/9455675","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Proc Int World Wide Web Conf","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1145/3485447.3511946","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3485447.3511946","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3485447.3511946","source":{"id":"https://openalex.org/S4363608783","display_name":"Proceedings of the ACM Web Conference 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM Web Conference 2022","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8100000023841858}],"awards":[{"id":"https://openalex.org/G2173531888","display_name":null,"funder_award_id":"ZIA LM010017-01","funder_id":"https://openalex.org/F4320332161","funder_display_name":"National Institutes of Health"},{"id":"https://openalex.org/G3318334062","display_name":null,"funder_award_id":"CNS-2112471","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"},{"id":"https://openalex.org/F4320332382","display_name":"Oak Ridge Institute for Science and Education","ror":"https://ror.org/0526p1y61"},{"id":"https://openalex.org/F4320337372","display_name":"U.S. National Library of Medicine","ror":"https://ror.org/0060t0j89"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4224313128.pdf","grobid_xml":"https://content.openalex.org/works/W4224313128.grobid-xml"},"referenced_works_count":39,"referenced_works":["https://openalex.org/W102861580","https://openalex.org/W1566018662","https://openalex.org/W1822004795","https://openalex.org/W2010866855","https://openalex.org/W2083195256","https://openalex.org/W2087361167","https://openalex.org/W2101026445","https://openalex.org/W2118100588","https://openalex.org/W2165533158","https://openalex.org/W2184957013","https://openalex.org/W2251427843","https://openalex.org/W2283196293","https://openalex.org/W2406695577","https://openalex.org/W2508865106","https://openalex.org/W2551361256","https://openalex.org/W2759136286","https://openalex.org/W2774837955","https://openalex.org/W2887535136","https://openalex.org/W2889583850","https://openalex.org/W2903963001","https://openalex.org/W2907492528","https://openalex.org/W2911489562","https://openalex.org/W2944400536","https://openalex.org/W2949972983","https://openalex.org/W2963104256","https://openalex.org/W2964263523","https://openalex.org/W2971258845","https://openalex.org/W3003265726","https://openalex.org/W3012000912","https://openalex.org/W3046075728","https://openalex.org/W3090380219","https://openalex.org/W3092008332","https://openalex.org/W3099387504","https://openalex.org/W3122741928","https://openalex.org/W3153694186","https://openalex.org/W4210257598","https://openalex.org/W4226282904","https://openalex.org/W4281665639","https://openalex.org/W4285242074"],"related_works":["https://openalex.org/W1822792362","https://openalex.org/W1507779355","https://openalex.org/W4286432911","https://openalex.org/W2892839738","https://openalex.org/W4288278495","https://openalex.org/W2940007344","https://openalex.org/W2777111309","https://openalex.org/W4298857951","https://openalex.org/W2766727221","https://openalex.org/W2805170835"],"abstract_inverted_index":{"The":[0,300],"Unified":[1],"Medical":[2],"Language":[3],"System":[4],"(UMLS)":[5],"Metathesaurus":[6,35],"construction":[7,48],"process":[8],"mainly":[9],"relies":[10],"on":[11],"lexical":[12,64,275,306],"algorithms":[13],"and":[14,37,102,154,320],"manual":[15],"expert":[16],"curation":[17],"for":[18,56,107,230,296,317,325],"integrating":[19],"over":[20,214],"200":[21],"biomedical":[22],"vocabularies.":[23],"A":[24],"lexical-based":[25],"learning":[26,123],"model":[27],"(LexLM)":[28],"was":[29],"developed":[30],"to":[31,90,128],"predict":[32],"synonymy":[33,96],"among":[34],"terms":[36,272],"largely":[38],"outperforms":[39],"a":[40,207,260],"rule-based":[41],"approach":[42],"(RBA)":[43],"that":[44,238,268],"approximates":[45],"the":[46,51,54,67,71,81,91,108,129,131,168,172,177,182,186,189,192,212,215,231,239,243,269,297,331,338],"current":[47],"process.":[49],"However,":[50],"LexLM":[52,130],"has":[53],"potential":[55],"being":[57],"improved":[58],"further":[59],"because":[60],"it":[61],"only":[62],"uses":[63],"information":[65,88,135,336],"from":[66,181,211,279],"source":[68,95,98,103],"vocabularies,":[69],"while":[70],"RBA":[72],"also":[73,236,308],"takes":[74,247],"advantage":[75],"of":[76,83,86,121,133,188,199,201,271,305,333],"contextual":[77,87,134,281,335],"information.":[78],"We":[79,138,156,166,184],"investigate":[80],"role":[82],"multiple":[84,119],"types":[85,132,142,246],"available":[89],"UMLS":[92,109],"editors,":[93],"namely":[94,217,283],"(SS),":[97],"semantic":[99],"group":[100],"(SG),":[101],"hierarchical":[104],"relations":[105],"(HR),":[106],"vocabulary":[110],"alignment":[111],"(UVA)":[112],"problem.":[113,340],"In":[114],"this":[115],"paper,":[116],"we":[117],"develop":[118],"variants":[120,150,258],"context-enriched":[122,144],"models":[124],"(ConLMs)":[125],"by":[126,170],"adding":[127,280],"listed":[136],"above.":[137],"represent":[139],"these":[140,158],"context":[141,245,262],"in":[143,219,223,227,285,289,293,314,322,337],"knowledge":[145],"graphs":[146],"(ConKGs)":[147],"with":[148,176,197,259,273,302,312],"four":[149],"ConSS,":[151],"ConSG,":[152],"ConHR,":[153],"ConAll.":[155],"train":[157],"ConKG":[159,173],"embeddings":[160],"using":[161,191,334],"seven":[162],"KG":[163],"embedding":[164,174,179],"techniques.":[165],"create":[167],"ConLMs":[169,190,213],"concatenating":[171],"vectors":[175,180],"word":[178],"LexLM.":[183],"evaluate":[185],"performance":[187,209,310],"UVA":[193,339],"generalization":[194],"test":[195],"datasets":[196],"hundreds":[198],"millions":[200],"pairs.":[202],"Our":[203,234],"extensive":[204],"experiments":[205,235,266],"show":[206,237,267,309],"significant":[208],"improvement":[210,311],"LexLM,":[216],"+5.0%":[218],"precision":[220,286],"(93.75%),":[221],"+0.69%":[222],"recall":[224,290],"(93.23%),":[225,291],"+2.88%":[226],"F1":[228,294,315,323],"(93.49%)":[229],"best":[232,298],"ConLM.":[233,299],"ConAll":[240],"variant":[241],"including":[242],"three":[244],"more":[248],"time,":[249],"but":[250],"does":[251],"not":[252],"always":[253],"perform":[254],"better":[255],"than":[256],"other":[257],"single":[261],"type.":[263],"Finally,":[264],"our":[265],"pairs":[270,301],"high":[274],"similarity":[276,307,319],"benefit":[277],"most":[278],"information,":[282],"+6.56%":[284],"(94.97%),":[287],"+2.13%":[288],"+4.35%":[292],"(94.09%)":[295],"lower":[303],"degrees":[304],"+0.85%":[313],"(96%)":[316],"low":[318],"+1.31%":[321],"(96.34%)":[324],"no":[326],"similarity.":[327],"These":[328],"results":[329],"demonstrate":[330],"importance":[332]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3}],"updated_date":"2026-05-09T13:55:54.758798","created_date":"2025-10-10T00:00:00"}
