{"id":"https://openalex.org/W6930482628","doi":"https://doi.org/10.5281/zenodo.13119437","title":"Bio-ML: Machine Learning-Friendly Biomedical Datasets for Equivalence and Subsumption Ontology Matching","display_name":"Bio-ML: Machine Learning-Friendly Biomedical Datasets for Equivalence and Subsumption Ontology Matching","publication_year":2024,"publication_date":"2024-07-28","ids":{"openalex":"https://openalex.org/W6930482628","doi":"https://doi.org/10.5281/zenodo.13119437"},"language":"en","primary_location":{"id":"doi:10.5281/zenodo.13119437","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.13119437","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"type":"dataset","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.5281/zenodo.13119437","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Yuan He","orcid":"https://orcid.org/0000-0002-4486-1262"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Yuan He","raw_affiliation_strings":["University of Oxford"],"affiliations":[{"raw_affiliation_string":"University of Oxford","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jiaoyan Chen","orcid":"https://orcid.org/0000-0003-4643-6750"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jiaoyan Chen","raw_affiliation_strings":["University of Oxford"],"affiliations":[{"raw_affiliation_string":"University of Oxford","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Hang Dong","orcid":"https://orcid.org/0000-0001-6828-6891"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Hang Dong","raw_affiliation_strings":["University of Oxford"],"affiliations":[{"raw_affiliation_string":"University of Oxford","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Ernesto Jim\u00e9nez-Ruiz","orcid":"https://orcid.org/0000-0002-9083-4599"},"institutions":[{"id":"https://openalex.org/I180825142","display_name":"City, University of London","ror":"https://ror.org/04489at23","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I180825142"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ernesto Jim\u00e9nez-Ruiz","raw_affiliation_strings":["City, University of London"],"affiliations":[{"raw_affiliation_string":"City, University of London","institution_ids":["https://openalex.org/I180825142"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Ali Hadian","orcid":null},"institutions":[{"id":"https://openalex.org/I4210117523","display_name":"Samsung (United Kingdom)","ror":"https://ror.org/01w6gjq94","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210117523"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ali Hadian","raw_affiliation_strings":["Samsung Research UK"],"affiliations":[{"raw_affiliation_string":"Samsung Research UK","institution_ids":["https://openalex.org/I4210117523"]}]},{"author_position":"last","author":{"id":null,"display_name":"Ian Horrocks","orcid":"https://orcid.org/0000-0002-2685-7462"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Ian Horrocks","raw_affiliation_strings":["University of Oxford"],"affiliations":[{"raw_affiliation_string":"University of Oxford","institution_ids":["https://openalex.org/I40120149"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I40120149"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T11094","display_name":"Face Recognition and Perception","score":0.3732999861240387,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11094","display_name":"Face Recognition and Perception","score":0.3732999861240387,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10427","display_name":"Visual perception and processing mechanisms","score":0.2976999878883362,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11118","display_name":"Evolutionary Psychology and Human Behavior","score":0.03500000014901161,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/unified-medical-language-system","display_name":"Unified Medical Language System","score":0.805899977684021},{"id":"https://openalex.org/keywords/equivalence","display_name":"Equivalence (formal languages)","score":0.6281999945640564},{"id":"https://openalex.org/keywords/ontology","display_name":"Ontology","score":0.564300000667572},{"id":"https://openalex.org/keywords/ontology-alignment","display_name":"Ontology alignment","score":0.5123999714851379},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4560000002384186},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.36090001463890076},{"id":"https://openalex.org/keywords/uniprot","display_name":"UniProt","score":0.35249999165534973},{"id":"https://openalex.org/keywords/open-biomedical-ontologies","display_name":"Open Biomedical Ontologies","score":0.34360000491142273},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.3425999879837036}],"concepts":[{"id":"https://openalex.org/C69505689","wikidata":"https://www.wikidata.org/wiki/Q455338","display_name":"Unified Medical Language System","level":2,"score":0.805899977684021},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7840999960899353},{"id":"https://openalex.org/C2780069185","wikidata":"https://www.wikidata.org/wiki/Q7977945","display_name":"Equivalence (formal languages)","level":2,"score":0.6281999945640564},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6157000064849854},{"id":"https://openalex.org/C25810664","wikidata":"https://www.wikidata.org/wiki/Q44325","display_name":"Ontology","level":2,"score":0.564300000667572},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5357999801635742},{"id":"https://openalex.org/C98893333","wikidata":"https://www.wikidata.org/wiki/Q4339878","display_name":"Ontology alignment","level":4,"score":0.5123999714851379},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4560000002384186},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4542999863624573},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.36090001463890076},{"id":"https://openalex.org/C202264299","wikidata":"https://www.wikidata.org/wiki/Q905695","display_name":"UniProt","level":3,"score":0.35249999165534973},{"id":"https://openalex.org/C137982476","wikidata":"https://www.wikidata.org/wiki/Q7072326","display_name":"Open Biomedical Ontologies","level":5,"score":0.34360000491142273},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3425999879837036},{"id":"https://openalex.org/C37926939","wikidata":"https://www.wikidata.org/wiki/Q7449061","display_name":"Semantic equivalence","level":4,"score":0.33340001106262207},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.3228999972343445},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.31459999084472656},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.3095000088214874},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.2962999939918518},{"id":"https://openalex.org/C69075417","wikidata":"https://www.wikidata.org/wiki/Q515701","display_name":"Linked data","level":3,"score":0.28360000252723694},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.27639999985694885},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.2754000127315521},{"id":"https://openalex.org/C110903229","wikidata":"https://www.wikidata.org/wiki/Q7449064","display_name":"Semantic integration","level":4,"score":0.2728999853134155},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.2662000060081482},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.26339998841285706},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.2628999948501587},{"id":"https://openalex.org/C110615152","wikidata":"https://www.wikidata.org/wiki/Q1469824","display_name":"Controlled vocabulary","level":2,"score":0.2624000012874603}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5281/zenodo.13119437","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.13119437","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"doi:10.5281/zenodo.13119437","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.13119437","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0],"version":[1,297],"is":[2,20,34,117,124,148,155,303],"used":[3],"in":[4,295],"the":[5,9,12,17,21,103,131,162,168,246,257,270,280,300,304],"Bio-ML":[6,173,248,259],"track":[7,116,249],"of":[8,23,31,109,306],"OAEI":[10,18,247,301],"2024;":[11],"only":[13,293],"change":[14,294],"compared":[15,298],"to":[16,35,106,299],"2023":[19,302],"deletion":[22,108,305],"certain":[24,110,307],"training":[25,111,308],"subsumption":[26,39,112,142,184,309],"mappings.":[27,113,171],"Overview":[28],"The":[29,99,114,145,292],"purpose":[30],"these":[32],"datasets":[33,180],"support":[36],"equivalence":[37,137,182],"and":[38,50,133,164,167,183,189,192,195,198,201,224,227,230,267],"ontology":[40,45,185,220],"matching.":[41],"There":[42],"are":[43],"five":[44],"pairs":[46],"extracted":[47],"from":[48],"MONDO":[49],"UMLS:":[51],"Source":[52],"Task":[53],"Category":[54],"#SrcCls":[55],"#TgtCls":[56],"#Ref":[57,59],"(equiv)":[58],"(subs)":[60],"Mondo":[61,68],"OMIM-ORDO":[62],"Disease":[63,70],"9,648":[64],"9,275":[65],"3,721":[66],"103":[67],"NCIT-DOID":[69],"15,762":[71],"8,465":[72],"4,686":[73],"3,338":[74],"(-1)":[75,91],"UMLS":[76,84,92],"SNOMED-FMA":[77],"Body":[78],"34,418":[79],"88,955":[80],"7,256":[81],"5,453":[82],"(-53)":[83],"SNOMED-NCIT":[85,93],"Pharm":[86],"29,500":[87],"22,136":[88],"5,803":[89],"4,224":[90],"Neoplas":[94],"22,971":[95],"20,247":[96],"3,804":[97],"213":[98],"\"-\"":[100],"numbers":[101],"reflect":[102],"changes":[104],"due":[105],"lthe":[107],"main":[115],"available":[118,149],"at":[119,150,260,265,283,286],"\"bio-ml\",":[120],"where":[121,152],"each":[122,153],"pair":[123,154],"associated":[125,156],"with":[126,157],"a":[127,158],"task":[128,159],"folder,":[129,160],"containing":[130,161],"source":[132,163],"target":[134,165],"ontologies,":[135,166],"reference":[136,141],"mappings":[138,143,310],"(in":[139],"\"refs_equiv\"),":[140],"(\"refs_subs\").":[144],"special":[146],"sub-track":[147,282],"\"bio-llm\",":[151],"test":[169],"candidate":[170],"Citation":[172],"(Main":[174],"Track)":[175],"```@inproceedings{he2022machine,":[176],"title={Machine":[177],"learning-friendly":[178],"biomedical":[179],"for":[181,219,256,279],"matching},":[186],"author={He,":[187,222],"Yuan":[188,223],"Chen,":[190,225],"Jiaoyan":[191,226],"Dong,":[193,228],"Hang":[194,229],"Jim{\\'e}nez-Ruiz,":[196],"Ernesto":[197],"Hadian,":[199],"Ali":[200],"Horrocks,":[202,231],"Ian},":[203,232],"booktitle={International":[204],"Semantic":[205],"Web":[206],"Conference},":[207],"pages={575--591},":[208],"year={2022},":[209],"organization={Springer}":[210],"}```":[211,237],"Bio-LLM":[212,281],"(Sub-track)":[213],"```@article{he2023exploring,":[214],"title={Exploring":[215],"large":[216],"language":[217],"models":[218],"alignment},":[221],"journal={arXiv":[233],"preprint":[234],"arXiv:2309.07172},":[235],"year={2023}":[236],"Important":[238],"Links":[239],"See":[240,245,252,275],"detailed":[241],"documentation":[242],"at:":[243,250],"https://krr-oxford.github.io/DeepOnto/bio-ml.":[244],"https://www.cs.ox.ac.uk/isg/projects/ConCur/oaei/":[251],"our":[253,276],"resource":[254,272],"paper":[255,273,278],"original":[258],"arxiv":[261,284],"or":[262],"springer":[263],"(accepted":[264,285],"ISWC-2022":[266],"nominated":[268],"as":[269],"best":[271],"candidate).":[274],"poster":[277],"ISWC-2023":[287],"Posters":[288],"&":[289],"Demos).":[290],"Changelog":[291],"this":[296],"that":[311],"can":[312],"be":[313],"directly":[314],"exploited":[315],"through":[316],"deductive":[317],"reasoning.":[318]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
