{"id":"https://openalex.org/W4382201771","doi":"https://doi.org/10.1145/3582768.3582807","title":"Building term hierarchies using graph-based clustering","display_name":"Building term hierarchies using graph-based clustering","publication_year":2022,"publication_date":"2022-12-16","ids":{"openalex":"https://openalex.org/W4382201771","doi":"https://doi.org/10.1145/3582768.3582807"},"language":"en","primary_location":{"id":"doi:10.1145/3582768.3582807","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3582768.3582807","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 6th International Conference on Natural Language Processing and Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055965962","display_name":"Mark Hloch","orcid":"https://orcid.org/0000-0002-3436-1029"},"institutions":[{"id":"https://openalex.org/I4210113269","display_name":"Hochschule Niederrhein","ror":"https://ror.org/027b9qx26","country_code":"DE","type":"education","lineage":["https://openalex.org/I4210113269"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Mark Hloch","raw_affiliation_strings":["Faculty of Electrical Engineering and Computer Science, Hochschule Niederrhein - University of Applied Sciences, Germany"],"raw_orcid":"https://orcid.org/0000-0002-3436-1029","affiliations":[{"raw_affiliation_string":"Faculty of Electrical Engineering and Computer Science, Hochschule Niederrhein - University of Applied Sciences, Germany","institution_ids":["https://openalex.org/I4210113269"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092276014","display_name":"Markus Van Meegen","orcid":"https://orcid.org/0000-0003-2977-8556"},"institutions":[{"id":"https://openalex.org/I4210113269","display_name":"Hochschule Niederrhein","ror":"https://ror.org/027b9qx26","country_code":"DE","type":"education","lineage":["https://openalex.org/I4210113269"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Markus Van Meegen","raw_affiliation_strings":["Faculty of Electrical Engineering and Computer Science, Hochschule Niederrhein - University of Applied Sciences, Germany"],"raw_orcid":"https://orcid.org/0000-0003-2977-8556","affiliations":[{"raw_affiliation_string":"Faculty of Electrical Engineering and Computer Science, Hochschule Niederrhein - University of Applied Sciences, Germany","institution_ids":["https://openalex.org/I4210113269"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078419084","display_name":"Mario Kubek","orcid":"https://orcid.org/0000-0003-2641-2065"},"institutions":[{"id":"https://openalex.org/I181565077","display_name":"Georgia State University","ror":"https://ror.org/03qt6ba18","country_code":"US","type":"education","lineage":["https://openalex.org/I181565077"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mario Kubek","raw_affiliation_strings":["Department of Computer Science, Georgia State University, USA"],"raw_orcid":"https://orcid.org/0000-0003-2641-2065","affiliations":[{"raw_affiliation_string":"Department of Computer Science, Georgia State University, USA","institution_ids":["https://openalex.org/I181565077"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003105685","display_name":"Herwig Unger","orcid":"https://orcid.org/0000-0002-8818-3600"},"institutions":[{"id":"https://openalex.org/I120691247","display_name":"FernUniversit\u00e4t in Hagen","ror":"https://ror.org/04tkkr536","country_code":"DE","type":"education","lineage":["https://openalex.org/I120691247"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Herwig Unger","raw_affiliation_strings":["Chair of Computer Engineering, University in Hagen, Germany"],"raw_orcid":"https://orcid.org/0000-0002-8818-3600","affiliations":[{"raw_affiliation_string":"Chair of Computer Engineering, University in Hagen, Germany","institution_ids":["https://openalex.org/I120691247"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5055965962"],"corresponding_institution_ids":["https://openalex.org/I4210113269"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.18260063,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"49","last_page":"56"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9883999824523926,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7662478685379028},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.741641104221344},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.586033821105957},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5248494148254395},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.5125644207000732},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.4805586636066437},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.47918689250946045},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.47394755482673645},{"id":"https://openalex.org/keywords/clustering-coefficient","display_name":"Clustering coefficient","score":0.44159069657325745},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2731574475765228}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7662478685379028},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.741641104221344},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.586033821105957},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5248494148254395},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.5125644207000732},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.4805586636066437},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.47918689250946045},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.47394755482673645},{"id":"https://openalex.org/C22047676","wikidata":"https://www.wikidata.org/wiki/Q898680","display_name":"Clustering coefficient","level":3,"score":0.44159069657325745},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2731574475765228},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3582768.3582807","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3582768.3582807","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 6th International Conference on Natural Language Processing and Information Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.699999988079071,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1614298861","https://openalex.org/W1985258161","https://openalex.org/W1987302197","https://openalex.org/W1987869189","https://openalex.org/W2033403400","https://openalex.org/W2127218421","https://openalex.org/W2153579005","https://openalex.org/W2250539671","https://openalex.org/W2482589566","https://openalex.org/W2896457183","https://openalex.org/W3115522112","https://openalex.org/W3115995735","https://openalex.org/W4213009331","https://openalex.org/W4240908132","https://openalex.org/W4294170691","https://openalex.org/W6640911648","https://openalex.org/W6670271065","https://openalex.org/W6719054054"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2935909890","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W1531601525","https://openalex.org/W3200375535"],"abstract_inverted_index":{"Classical":[0],"tasks":[1],"of":[2,26,32,59,63,83,107,127,136,150,162,167],"a":[3,33,56,80,105,128,152],"librarian,":[4],"such":[5],"as":[6],"screening":[7],"and":[8,45,68],"categorizing":[9],"new":[10,96,153],"documents":[11],"based":[12,132],"on":[13,133,144],"their":[14],"content,":[15],"are":[16],"increasingly":[17],"replaced":[18],"by":[19,40,123],"search":[20,43],"engines":[21,44],"or":[22],"through":[23],"the":[24,60,92,134,137,141,145,168],"use":[25],"cataloging":[27],"software.":[28],"A":[29],"first":[30],"overview":[31],"corpus":[34],"topical":[35],"orientation":[36],"can":[37],"be":[38,66],"achieved":[39],"combining":[41],"graph-based":[42,88,109],"clustering":[46,50,89,110,117],"methods.":[47],"Existing":[48],"classical":[49],"methods,":[51],"however,":[52],"often":[53],"require":[54],"an":[55],"priori":[57],"specification":[58],"desired":[61],"number":[62],"clusters":[64,161],"to":[65],"output":[67],"do":[69],"not":[70],"consider":[71],"term":[72,93,121,160],"relationships":[73,149],"in":[74],"graphs,":[75],"which":[76],"is":[77,155,174],"deficient":[78],"from":[79],"practical":[81],"point":[82],"view.":[84],"Therefore,":[85],"fully":[86],"unsupervised":[87],"approaches":[90],"at":[91],"level":[94],"offer":[95],"possibilities":[97],"that":[98],"mitigate":[99],"these":[100],"shortcomings.":[101],"Within":[102],"this":[103],"work,":[104],"set":[106],"novel":[108],"algorithms":[111],"have":[112],"been":[113],"developed.":[114],"The":[115,165],"hierarchical":[116],"algorithm":[118],"(HCA)":[119],"forms":[120],"hierarchies":[122],"iteratively":[124],"isolating":[125],"nodes":[126],"given":[129],"co-occurrence":[130,146],"graph":[131,147,154],"evaluation":[135],"edge":[138],"weight":[139],"between":[140],"nodes.":[142],"Based":[143],"inherent":[148],"terms,":[151],"built":[156],"agglomerative":[157],"forming":[158],"individual":[159],"related":[163],"terms.":[164],"feasibility":[166],"outlined":[169],"methods":[170],"for":[171],"text":[172],"analysis":[173],"shown.":[175]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
