{"id":"https://openalex.org/W4385292525","doi":"https://doi.org/10.48550/arxiv.2307.13417","title":"Towards Resolving Word Ambiguity with Word Embeddings","display_name":"Towards Resolving Word Ambiguity with Word Embeddings","publication_year":2023,"publication_date":"2023-07-25","ids":{"openalex":"https://openalex.org/W4385292525","doi":"https://doi.org/10.48550/arxiv.2307.13417"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2307.13417","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.13417","pdf_url":"https://arxiv.org/pdf/2307.13417","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2307.13417","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092550302","display_name":"Matthias Thurnbauer","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Thurnbauer, Matthias","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044144468","display_name":"J. Reisinger","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Reisinger, Johannes","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088166206","display_name":"Christoph Goller","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goller, Christoph","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5019597653","display_name":"Andreas Fischer","orcid":"https://orcid.org/0000-0003-0069-3436"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fischer, Andreas","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5092550302"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.8583253622055054},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7881219387054443},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.7536474466323853},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6274328231811523},{"id":"https://openalex.org/keywords/dbscan","display_name":"DBSCAN","score":0.5930986404418945},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.508988618850708},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5035869479179382},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4553745687007904},{"id":"https://openalex.org/keywords/semantic-space","display_name":"Semantic space","score":0.427903950214386},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3732476234436035},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11842185258865356},{"id":"https://openalex.org/keywords/fuzzy-clustering","display_name":"Fuzzy clustering","score":0.07235580682754517}],"concepts":[{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.8583253622055054},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7881219387054443},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.7536474466323853},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6274328231811523},{"id":"https://openalex.org/C46576248","wikidata":"https://www.wikidata.org/wiki/Q1114630","display_name":"DBSCAN","level":5,"score":0.5930986404418945},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.508988618850708},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5035869479179382},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4553745687007904},{"id":"https://openalex.org/C2986420190","wikidata":"https://www.wikidata.org/wiki/Q39045939","display_name":"Semantic space","level":2,"score":0.427903950214386},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3732476234436035},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11842185258865356},{"id":"https://openalex.org/C17212007","wikidata":"https://www.wikidata.org/wiki/Q5511111","display_name":"Fuzzy clustering","level":3,"score":0.07235580682754517},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C104047586","wikidata":"https://www.wikidata.org/wiki/Q5033439","display_name":"Canopy clustering algorithm","level":4,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2307.13417","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.13417","pdf_url":"https://arxiv.org/pdf/2307.13417","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"doi:10.48550/arxiv.2307.13417","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2307.13417","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2307.13417","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.13417","pdf_url":"https://arxiv.org/pdf/2307.13417","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"sustainable_development_goals":[{"score":0.5199999809265137,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3163639875","https://openalex.org/W2353179089","https://openalex.org/W2364999035","https://openalex.org/W4226497289","https://openalex.org/W2966681114","https://openalex.org/W4386078164","https://openalex.org/W2923538289","https://openalex.org/W2353125546","https://openalex.org/W2369356834","https://openalex.org/W2771808941"],"abstract_inverted_index":{"Ambiguity":[0],"is":[1,9,58],"ubiquitous":[2],"in":[3,12,60,72],"natural":[4],"language.":[5],"Resolving":[6],"ambiguous":[7,47,100],"meanings":[8,127],"especially":[10],"important":[11],"information":[13],"retrieval":[14],"tasks.":[15],"While":[16],"word":[17,35],"embeddings":[18,79],"carry":[19],"semantic":[20],"information,":[21],"they":[22,41],"fail":[23],"to":[24,33,45,94,114,124],"handle":[25,34],"ambiguity":[26,36],"well.":[27],"Transformer":[28],"models":[29,57],"have":[30],"been":[31],"shown":[32],"for":[37,50],"complex":[38],"queries,":[39],"but":[40],"cannot":[42],"be":[43,81],"used":[44],"identify":[46,99],"words,":[48],"e.g.":[49],"a":[51,129],"1-word":[52],"query.":[53],"Furthermore,":[54],"training":[55,67],"these":[56],"costly":[59],"terms":[61],"of":[62,106,128],"time,":[63],"hardware":[64,85],"resources,":[65],"and":[66,102,121],"data,":[68],"prohibiting":[69],"their":[70,104],"use":[71],"specialized":[73],"environments":[74],"with":[75],"sensitive":[76],"data.":[77],"Word":[78],"can":[80,98],"trained":[82],"using":[83],"moderate":[84],"resources.":[86],"This":[87],"paper":[88],"shows":[89],"that":[90],"applying":[91],"DBSCAN":[92,110],"clustering":[93],"the":[95,125],"latent":[96],"space":[97],"words":[101],"evaluate":[103],"level":[105],"ambiguity.":[107],"An":[108],"automatic":[109],"parameter":[111],"selection":[112],"leads":[113],"high-quality":[115],"clusters,":[116],"which":[117],"are":[118],"semantically":[119],"coherent":[120],"correspond":[122],"well":[123],"perceived":[126],"given":[130],"word.":[131]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
