{"id":"https://openalex.org/W4413879958","doi":"https://doi.org/10.1186/s13321-025-01086-1","title":"Box embeddings for extending ontologies: a data-driven and interpretable approach","display_name":"Box embeddings for extending ontologies: a data-driven and interpretable approach","publication_year":2025,"publication_date":"2025-09-01","ids":{"openalex":"https://openalex.org/W4413879958","doi":"https://doi.org/10.1186/s13321-025-01086-1","pmid":"https://pubmed.ncbi.nlm.nih.gov/40890838"},"language":"en","primary_location":{"id":"doi:10.1186/s13321-025-01086-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-025-01086-1","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-025-01086-1","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-025-01086-1","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071777525","display_name":"Adel Memariani","orcid":"https://orcid.org/0000-0002-8368-7658"},"institutions":[{"id":"https://openalex.org/I206945453","display_name":"Paderborn University","ror":"https://ror.org/058kzsd48","country_code":"DE","type":"education","lineage":["https://openalex.org/I206945453"]},{"id":"https://openalex.org/I4210152224","display_name":"Heinz Nixdorf Stiftung","ror":"https://ror.org/04j2tkk21","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I4210152224"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Adel Memariani","raw_affiliation_strings":["Data Science Group (DICE), Heinz Nixdorf Institute, Paderborn University, Warburger Str. 100, 33098, Paderborn, North Rhine-Westphalia, Germany. adel.memariani@uni-paderborn.de","Data Science Group (DICE), Heinz Nixdorf Institute, Paderborn University, Warburger Str. 100, 33098, Paderborn, North Rhine\u2013Westphalia, Germany"],"raw_orcid":"https://orcid.org/0000-0002-8368-7658","affiliations":[{"raw_affiliation_string":"Data Science Group (DICE), Heinz Nixdorf Institute, Paderborn University, Warburger Str. 100, 33098, Paderborn, North Rhine-Westphalia, Germany. adel.memariani@uni-paderborn.de","institution_ids":["https://openalex.org/I206945453"]},{"raw_affiliation_string":"Data Science Group (DICE), Heinz Nixdorf Institute, Paderborn University, Warburger Str. 100, 33098, Paderborn, North Rhine\u2013Westphalia, Germany","institution_ids":["https://openalex.org/I206945453","https://openalex.org/I4210152224"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084910607","display_name":"Martin Glauer","orcid":"https://orcid.org/0000-0001-6772-1943"},"institutions":[{"id":"https://openalex.org/I95793202","display_name":"Otto-von-Guericke-Universit\u00e4t Magdeburg","ror":"https://ror.org/00ggpsq73","country_code":"DE","type":"education","lineage":["https://openalex.org/I95793202"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Martin Glauer","raw_affiliation_strings":["Institute for Intelligent Cooperating Systems, Otto von Guericke University, Universit\u00e4tsplatz 2, 39106, Magdeburg, Saxony-Anhalt, Germany"],"raw_orcid":"https://orcid.org/0000-0001-6772-1943","affiliations":[{"raw_affiliation_string":"Institute for Intelligent Cooperating Systems, Otto von Guericke University, Universit\u00e4tsplatz 2, 39106, Magdeburg, Saxony-Anhalt, Germany","institution_ids":["https://openalex.org/I95793202"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040189126","display_name":"Simon Fl\u00fcgel","orcid":"https://orcid.org/0000-0003-3754-9016"},"institutions":[{"id":"https://openalex.org/I170658231","display_name":"Osnabr\u00fcck University","ror":"https://ror.org/04qmmjx98","country_code":"DE","type":"education","lineage":["https://openalex.org/I170658231"]},{"id":"https://openalex.org/I4210159638","display_name":"Hochschule Osnabr\u00fcck","ror":"https://ror.org/059vymd37","country_code":"DE","type":"education","lineage":["https://openalex.org/I4210159638"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Simon Fl\u00fcgel","raw_affiliation_strings":["Institute for computer science, Osnabr\u00fcck University, Friedrich-Janssen-Str. 1, 49076, Osnabr\u00fcck, Lower Saxony, Germany"],"raw_orcid":"https://orcid.org/0000-0003-3754-9016","affiliations":[{"raw_affiliation_string":"Institute for computer science, Osnabr\u00fcck University, Friedrich-Janssen-Str. 1, 49076, Osnabr\u00fcck, Lower Saxony, Germany","institution_ids":["https://openalex.org/I170658231","https://openalex.org/I4210159638"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080272127","display_name":"Fabian Neuhaus","orcid":"https://orcid.org/0000-0002-1058-3102"},"institutions":[{"id":"https://openalex.org/I95793202","display_name":"Otto-von-Guericke-Universit\u00e4t Magdeburg","ror":"https://ror.org/00ggpsq73","country_code":"DE","type":"education","lineage":["https://openalex.org/I95793202"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Fabian Neuhaus","raw_affiliation_strings":["Institute for Intelligent Cooperating Systems, Otto von Guericke University, Universit\u00e4tsplatz 2, 39106, Magdeburg, Saxony-Anhalt, Germany"],"raw_orcid":"https://orcid.org/0000-0002-1058-3102","affiliations":[{"raw_affiliation_string":"Institute for Intelligent Cooperating Systems, Otto von Guericke University, Universit\u00e4tsplatz 2, 39106, Magdeburg, Saxony-Anhalt, Germany","institution_ids":["https://openalex.org/I95793202"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044072805","display_name":"Janna Hastings","orcid":"https://orcid.org/0000-0002-3469-4923"},"institutions":[{"id":"https://openalex.org/I202697423","display_name":"University of Zurich","ror":"https://ror.org/02crff812","country_code":"CH","type":"education","lineage":["https://openalex.org/I202697423"]},{"id":"https://openalex.org/I202963720","display_name":"University of St.Gallen","ror":"https://ror.org/0561a3s31","country_code":"CH","type":"education","lineage":["https://openalex.org/I202963720"]},{"id":"https://openalex.org/I4210145378","display_name":"University of Applied Sciences St. Gallen","ror":"https://ror.org/049bwzr51","country_code":"CH","type":"education","lineage":["https://openalex.org/I4210129390","https://openalex.org/I4210145378"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Janna Hastings","raw_affiliation_strings":["Institute for Implementation Science in Health Care (IfIS), Faculty of Medicine, University of Zurich, Universit\u00e4tsstrasse 84, 8006, Z\u00fcrich, Switzerland","School of Medicine, University of St. Gallen, (HSG), St. JakobStrasse 21, 9000, Gallen, Switzerland"],"raw_orcid":"https://orcid.org/0000-0002-3469-4923","affiliations":[{"raw_affiliation_string":"Institute for Implementation Science in Health Care (IfIS), Faculty of Medicine, University of Zurich, Universit\u00e4tsstrasse 84, 8006, Z\u00fcrich, Switzerland","institution_ids":["https://openalex.org/I202697423"]},{"raw_affiliation_string":"School of Medicine, University of St. Gallen, (HSG), St. JakobStrasse 21, 9000, Gallen, Switzerland","institution_ids":["https://openalex.org/I202963720","https://openalex.org/I4210145378"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040001719","display_name":"Till Mossakowski","orcid":"https://orcid.org/0000-0002-8938-5204"},"institutions":[{"id":"https://openalex.org/I170658231","display_name":"Osnabr\u00fcck University","ror":"https://ror.org/04qmmjx98","country_code":"DE","type":"education","lineage":["https://openalex.org/I170658231"]},{"id":"https://openalex.org/I4210159638","display_name":"Hochschule Osnabr\u00fcck","ror":"https://ror.org/059vymd37","country_code":"DE","type":"education","lineage":["https://openalex.org/I4210159638"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Till Mossakowski","raw_affiliation_strings":["Institute for computer science, Osnabr\u00fcck University, Friedrich-Janssen-Str. 1, 49076, Osnabr\u00fcck, Lower Saxony, Germany"],"raw_orcid":"https://orcid.org/0000-0002-8938-5204","affiliations":[{"raw_affiliation_string":"Institute for computer science, Osnabr\u00fcck University, Friedrich-Janssen-Str. 1, 49076, Osnabr\u00fcck, Lower Saxony, Germany","institution_ids":["https://openalex.org/I170658231","https://openalex.org/I4210159638"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5071777525"],"corresponding_institution_ids":["https://openalex.org/I206945453","https://openalex.org/I4210152224"],"apc_list":{"value":1290,"currency":"GBP","value_usd":1582},"apc_paid":{"value":1290,"currency":"GBP","value_usd":1582},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.11454275,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"17","issue":"1","first_page":"138","last_page":"138"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6994017958641052},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.45221391320228577},{"id":"https://openalex.org/keywords/ontology","display_name":"Ontology","score":0.4293038845062256},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4245806634426117},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4070797264575958}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6994017958641052},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.45221391320228577},{"id":"https://openalex.org/C25810664","wikidata":"https://www.wikidata.org/wiki/Q44325","display_name":"Ontology","level":2,"score":0.4293038845062256},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4245806634426117},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4070797264575958},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1186/s13321-025-01086-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-025-01086-1","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-025-01086-1","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},{"id":"pmid:40890838","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40890838","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of cheminformatics","raw_type":null},{"id":"pmh:oai:doaj.org/article:c960ba8db97342f28e15a7fa9f011362","is_oa":true,"landing_page_url":"https://doaj.org/article/c960ba8db97342f28e15a7fa9f011362","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Journal of Cheminformatics, Vol 17, Iss 1, Pp 1-18 (2025)","raw_type":"article"},{"id":"pmh:oai:europepmc.org:11213750","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/12403937","pdf_url":null,"source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Text"},{"id":"pmh:oai:pubmedcentral.nih.gov:12403937","is_oa":true,"landing_page_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC12403937/","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"J Cheminform","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/s13321-025-01086-1","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13321-025-01086-1","pdf_url":"https://jcheminf.biomedcentral.com/counter/pdf/10.1186/s13321-025-01086-1","source":{"id":"https://openalex.org/S180838163","display_name":"Journal of Cheminformatics","issn_l":"1758-2946","issn":["1758-2946"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Cheminformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320324816","display_name":"Universit\u00e4t Paderborn","ror":"https://ror.org/058kzsd48"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4413879958.pdf","grobid_xml":"https://content.openalex.org/works/W4413879958.grobid-xml"},"referenced_works_count":30,"referenced_works":["https://openalex.org/W1494581921","https://openalex.org/W1935434993","https://openalex.org/W1975147762","https://openalex.org/W2103017472","https://openalex.org/W2114940395","https://openalex.org/W2548357532","https://openalex.org/W2564425030","https://openalex.org/W2615066396","https://openalex.org/W2798442412","https://openalex.org/W2962891712","https://openalex.org/W2962992134","https://openalex.org/W2963085936","https://openalex.org/W2963691377","https://openalex.org/W2964330146","https://openalex.org/W2965778154","https://openalex.org/W3113096756","https://openalex.org/W3132675136","https://openalex.org/W3167617922","https://openalex.org/W3168355451","https://openalex.org/W3214163703","https://openalex.org/W4224326644","https://openalex.org/W4225687252","https://openalex.org/W4298625426","https://openalex.org/W4307468223","https://openalex.org/W4309066180","https://openalex.org/W4312602175","https://openalex.org/W4367047185","https://openalex.org/W4385584357","https://openalex.org/W4393190704","https://openalex.org/W4396736534"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Deriving":[0],"symbolic":[1],"knowledge":[2,150],"from":[3],"trained":[4],"deep":[5],"learning":[6],"models":[7],"is":[8,26,147,186],"challenging":[9],"due":[10],"to":[11,22,27,51,111,133],"the":[12,33,39,63,67,97,135,143,153,172,194],"lack":[13],"of":[14,93,99,108,138,155,216],"transparency":[15],"in":[16,122,142,152,181],"such":[17,45],"models.":[18],"A":[19],"promising":[20],"approach":[21,201],"address":[23],"this":[24,185],"issue":[25],"couple":[28],"a":[29,59,73,94,100,210],"semantic":[30],"structure":[31,61],"with":[32,171],"model":[34,40,128,162],"outputs":[35,65,208],"and":[36,113,212,218],"thereby":[37],"make":[38],"interpretable.":[41],"In":[42,70],"prediction":[43],"tasks":[44],"as":[46],"multi-label":[47,123,182],"classification,":[48],"labels":[49],"tend":[50],"form":[52],"hierarchical":[53,165],"relationships.":[54],"Therefore,":[55],"we":[56,104],"propose":[57],"enforcing":[58],"taxonomical":[60],"on":[62],"model's":[64],"throughout":[66],"training":[68,195],"phase.":[69],"vector":[71],"space,":[72],"taxonomy":[74,192],"can":[75],"be":[76],"represented":[77],"using":[78],"axis-aligned":[79],"hyper-rectangles,":[80],"or":[81,86],"boxes,":[82],"which":[83,146],"may":[84],"overlap":[85],"nest":[87],"within":[88],"one":[89],"another.":[90],"The":[91],"boundaries":[92],"box":[95],"determine":[96],"extent":[98],"particular":[101],"category.":[102],"Thus,":[103],"used":[105],"box-shaped":[106],"embeddings":[107],"ontology":[109],"classes":[110],"learn":[112],"transparently":[114],"represent":[115],"logical":[116],"relationships":[117,166],"that":[118,160],"are":[119],"only":[120],"implicit":[121,164],"datasets.":[124],"We":[125,158],"assessed":[126],"our":[127,161],"by":[129,205],"measuring":[130],"its":[131],"ability":[132],"approximate":[134],"full":[136],"set":[137],"inferred":[139],"subclass":[140],"relations":[141],"ChEBI":[144],"ontology,":[145],"an":[148,190],"important":[149],"base":[151],"field":[154],"life":[156],"science.":[157],"demonstrate":[159],"captures":[163],"among":[167],"labels,":[168],"ensuring":[169],"consistency":[170],"underlying":[173],"ontological":[174],"conceptualization,":[175],"while":[176],"also":[177],"achieving":[178],"state-of-the-art":[179],"performance":[180],"classification.":[183],"Notably,":[184],"accomplished":[187],"without":[188],"requiring":[189],"explicit":[191],"during":[193],"process.":[196],"SCIENTIFIC":[197],"CONTRIBUTION:":[198],"Our":[199],"proposed":[200],"advances":[202],"chemical":[203],"classification":[204],"enabling":[206],"interpretable":[207],"through":[209],"structured":[211],"geometrically":[213],"expressive":[214],"representation":[215],"molecules":[217],"their":[219],"classes.":[220]},"counts_by_year":[],"updated_date":"2026-04-18T05:59:34.339393","created_date":"2025-10-10T00:00:00"}
