{"id":"https://openalex.org/W4225939827","doi":"https://doi.org/10.1145/3486622.3493941","title":"Unsupervised Tree Extraction in Embedding Spaces for Taxonomy Induction","display_name":"Unsupervised Tree Extraction in Embedding Spaces for Taxonomy Induction","publication_year":2021,"publication_date":"2021-12-14","ids":{"openalex":"https://openalex.org/W4225939827","doi":"https://doi.org/10.1145/3486622.3493941"},"language":"en","primary_location":{"id":"doi:10.1145/3486622.3493941","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3486622.3493941","pdf_url":null,"source":{"id":"https://openalex.org/S4363608074","display_name":"IEEE/WIC/ACM International Conference on Web Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/WIC/ACM International Conference on Web Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hal.science/hal-03494697","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034915019","display_name":"Fran\u00e7ois Torregrossa","orcid":"https://orcid.org/0000-0003-3900-2196"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I2802519937","display_name":"Institut de Recherche en Informatique et Syst\u00e8mes Al\u00e9atoires","ror":"https://ror.org/00myn0z94","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I205703379","https://openalex.org/I2802204017","https://openalex.org/I2802519937","https://openalex.org/I28221208","https://openalex.org/I4210127572","https://openalex.org/I4210159245","https://openalex.org/I56067802"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Fran\u00e7ois Torregrossa","raw_affiliation_strings":["CNRS, IRISA, France and SoLocal, France","Solocal (115 Boulevard Albert 1er, 35200 Rennes - France)","LinkMedia - Creating and exploiting explicit links between multimedia fragments (Campus de Beaulieu 35042 Rennes cedex - France)"],"affiliations":[{"raw_affiliation_string":"CNRS, IRISA, France and SoLocal, France","institution_ids":["https://openalex.org/I2802519937","https://openalex.org/I1294671590"]},{"raw_affiliation_string":"Solocal (115 Boulevard Albert 1er, 35200 Rennes - France)","institution_ids":[]},{"raw_affiliation_string":"LinkMedia - Creating and exploiting explicit links between multimedia fragments (Campus de Beaulieu 35042 Rennes cedex - France)","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024542662","display_name":"Robin Allesiardo","orcid":"https://orcid.org/0000-0001-5767-1188"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Robin Allesiardo","raw_affiliation_strings":["SoLocal, France"],"affiliations":[{"raw_affiliation_string":"SoLocal, France","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036636249","display_name":"Vincent Claveau","orcid":null},"institutions":[{"id":"https://openalex.org/I2802519937","display_name":"Institut de Recherche en Informatique et Syst\u00e8mes Al\u00e9atoires","ror":"https://ror.org/00myn0z94","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I205703379","https://openalex.org/I2802204017","https://openalex.org/I2802519937","https://openalex.org/I28221208","https://openalex.org/I4210127572","https://openalex.org/I4210159245","https://openalex.org/I56067802"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Vincent Claveau","raw_affiliation_strings":["CNRS, IRISA, France","LinkMedia - Creating and exploiting explicit links between multimedia fragments (Campus de Beaulieu 35042 Rennes cedex - France)"],"affiliations":[{"raw_affiliation_string":"CNRS, IRISA, France","institution_ids":["https://openalex.org/I2802519937","https://openalex.org/I1294671590"]},{"raw_affiliation_string":"LinkMedia - Creating and exploiting explicit links between multimedia fragments (Campus de Beaulieu 35042 Rennes cedex - France)","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008190208","display_name":"Guillaume Gravier","orcid":"https://orcid.org/0000-0002-2266-5682"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I2802519937","display_name":"Institut de Recherche en Informatique et Syst\u00e8mes Al\u00e9atoires","ror":"https://ror.org/00myn0z94","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I205703379","https://openalex.org/I2802204017","https://openalex.org/I2802519937","https://openalex.org/I28221208","https://openalex.org/I4210127572","https://openalex.org/I4210159245","https://openalex.org/I56067802"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Guillaume Gravier","raw_affiliation_strings":["CNRS, IRISA, France","LinkMedia - Creating and exploiting explicit links between multimedia fragments (Campus de Beaulieu 35042 Rennes cedex - France)"],"affiliations":[{"raw_affiliation_string":"CNRS, IRISA, France","institution_ids":["https://openalex.org/I2802519937","https://openalex.org/I1294671590"]},{"raw_affiliation_string":"LinkMedia - Creating and exploiting explicit links between multimedia fragments (Campus de Beaulieu 35042 Rennes cedex - France)","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5034915019"],"corresponding_institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I2802519937"],"apc_list":null,"apc_paid":null,"fwci":0.2513,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.54888764,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"302","last_page":"309"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.658704400062561},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5576547384262085},{"id":"https://openalex.org/keywords/taxonomy","display_name":"Taxonomy (biology)","score":0.5362491011619568},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4782796800136566},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.4452546238899231},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.20129001140594482},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.08613595366477966},{"id":"https://openalex.org/keywords/botany","display_name":"Botany","score":0.07996618747711182}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.658704400062561},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5576547384262085},{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.5362491011619568},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4782796800136566},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.4452546238899231},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.20129001140594482},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.08613595366477966},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.07996618747711182},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3486622.3493941","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3486622.3493941","pdf_url":null,"source":{"id":"https://openalex.org/S4363608074","display_name":"IEEE/WIC/ACM International Conference on Web Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/WIC/ACM International Conference on Web Intelligence","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-03494697v1","is_oa":true,"landing_page_url":"https://hal.science/hal-03494697","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"WI-IAT 2021 - 20th IEEE/WIC/ACM International Conference on Web Intelligence and Intelligent Agent Technology, Dec 2021, Melbourne, Australia. pp.1-8, &#x27E8;10.1145/3486622.3493941&#x27E9;","raw_type":"Conference papers"}],"best_oa_location":{"id":"pmh:oai:HAL:hal-03494697v1","is_oa":true,"landing_page_url":"https://hal.science/hal-03494697","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"WI-IAT 2021 - 20th IEEE/WIC/ACM International Conference on Web Intelligence and Intelligent Agent Technology, Dec 2021, Melbourne, Australia. pp.1-8, &#x27E8;10.1145/3486622.3493941&#x27E9;","raw_type":"Conference papers"},"sustainable_development_goals":[{"score":0.44999998807907104,"display_name":"Zero hunger","id":"https://metadata.un.org/sdg/2"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1966907789","https://openalex.org/W1996551363","https://openalex.org/W2068737686","https://openalex.org/W2081580037","https://openalex.org/W2100132811","https://openalex.org/W2142498761","https://openalex.org/W2465217376","https://openalex.org/W2468208907","https://openalex.org/W2471992743","https://openalex.org/W2760204057","https://openalex.org/W2948646817","https://openalex.org/W2962814626","https://openalex.org/W2962909572","https://openalex.org/W2962992134","https://openalex.org/W2963173796","https://openalex.org/W3034444248","https://openalex.org/W3167126457","https://openalex.org/W4244182232","https://openalex.org/W4245795068","https://openalex.org/W4253001967"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2081900870","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W4402327032"],"abstract_inverted_index":{"Exposing":[0],"latent":[1],"structure":[2],"(graph,":[3],"tree...)":[4],"of":[5,16,146],"data":[6,23],"is":[7,93],"a":[8],"major":[9],"challenge":[10],"to":[11,41,80,89,102,153],"deal":[12],"with":[13,49],"the":[14,50,81,144,154],"web":[15],"data.":[17,58],"Today\u2019s":[18],"embedding":[19,104,109],"techniques":[20],"incorporate":[21],"any":[22,103],"source":[24],"(noisy":[25],"graphs,":[26],"item":[27],"similarities,":[28],"plain":[29],"text)":[30],"into":[31],"continuous":[32],"vector":[33],"spaces":[34],"that":[35,143],"are":[36,47,150],"typically":[37],"used":[38],"as":[39,97],"input":[40],"classifier.":[42],"In":[43],"this":[44],"work,":[45],"we":[46,127],"dealing":[48],"opposite":[51],"task:":[52],"finding":[53],"structures":[54,73,145],"(taxonomies)":[55],"from":[56],"embedded":[57],"We":[59],"provide":[60],"an":[61],"original":[62],"unsupervised":[63],"methodology":[64],"for":[65,71,132],"taxonomy":[66,133],"induction":[67],"by":[68],"directly":[69],"searching":[70],"graph":[72,136],"preserving":[74],"pairwise":[75],"distances":[76],"between":[77],"items.":[78],"Contrary":[79],"state-of-the-art":[82],"(SOTA),":[83],"our":[84,119,147],"approach":[85,120],"does":[86],"not":[87],"require":[88],"train":[90],"classifiers;":[91],"it":[92,98],"also":[94],"more":[95],"versatile":[96],"can":[99],"be":[100],"applied":[101],"(eg.":[105],"word":[106],"embedding,":[107],"similarity":[108],"like":[110],"space-time":[111],"local":[112],"embedding...).":[113],"On":[114],"standard":[115],"benchmarks":[116],"and":[117,139],"metrics,":[118],"yields":[121],"SOTA":[122,157],"performance.":[123],"As":[124],"another":[125],"contribution,":[126],"propose":[128],"better":[129],"evaluation":[130],"metrics":[131],"induction,":[134],"leveraging":[135],"kernel":[137],"similarities":[138],"edit":[140],"distance,":[141],"showing":[142],"predicted":[148],"taxonomies":[149],"significantly":[151],"closer":[152],"ground-truth":[155],"than":[156],"solutions.":[158]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
