{"id":"https://openalex.org/W2948075061","doi":"https://doi.org/10.18653/v1/p19-1574","title":"Probing for Semantic Classes: Diagnosing the Meaning Content of Word Embeddings","display_name":"Probing for Semantic Classes: Diagnosing the Meaning Content of Word Embeddings","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2948075061","doi":"https://doi.org/10.18653/v1/p19-1574","mag":"2948075061"},"language":"en","primary_location":{"id":"doi:10.18653/v1/p19-1574","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1574","pdf_url":"https://www.aclweb.org/anthology/P19-1574.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/P19-1574.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031030600","display_name":"Yadollah Yaghoobzadeh","orcid":"https://orcid.org/0000-0003-0646-0852"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Yadollah Yaghoobzadeh","raw_affiliation_strings":["Microsoft Research Montral","(Microsoft)"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Montral","institution_ids":["https://openalex.org/I4210164937"]},{"raw_affiliation_string":"(Microsoft)","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082874907","display_name":"Katharina Kann","orcid":null},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Katharina Kann","raw_affiliation_strings":["Center for Data Science, New York University"],"affiliations":[{"raw_affiliation_string":"Center for Data Science, New York University","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114018312","display_name":"Timothy J. Hazen","orcid":"https://orcid.org/0009-0006-1413-9590"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"T. J. Hazen","raw_affiliation_strings":["Microsoft Research Montral"],"affiliations":[{"raw_affiliation_string":"Microsoft Research Montral","institution_ids":["https://openalex.org/I4210164937"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047151336","display_name":"Eneko Agirre","orcid":"https://orcid.org/0000-0002-0195-4899"},"institutions":[{"id":"https://openalex.org/I169108374","display_name":"University of the Basque Country","ror":"https://ror.org/000xsnr85","country_code":"ES","type":"education","lineage":["https://openalex.org/I169108374"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Eneko Agirre","raw_affiliation_strings":["IXA NLP Group, University of the Basque Country"],"affiliations":[{"raw_affiliation_string":"IXA NLP Group, University of the Basque Country","institution_ids":["https://openalex.org/I169108374"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071144367","display_name":"Hinrich Sch\u00fctze","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hinrich Sch\u00fctze","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5031030600"],"corresponding_institution_ids":["https://openalex.org/I4210164937"],"apc_list":null,"apc_paid":null,"fwci":0.289,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.6548509,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"5740","last_page":"5753"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.7817007303237915},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.714777946472168},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.708349347114563},{"id":"https://openalex.org/keywords/conflation","display_name":"Conflation","score":0.6997118592262268},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6624854207038879},{"id":"https://openalex.org/keywords/word-embedding","display_name":"Word embedding","score":0.6226365566253662},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5973197817802429},{"id":"https://openalex.org/keywords/vector-space","display_name":"Vector space","score":0.5457959175109863},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5425854325294495},{"id":"https://openalex.org/keywords/semantic-space","display_name":"Semantic space","score":0.4770599901676178},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4290751814842224},{"id":"https://openalex.org/keywords/distributional-semantics","display_name":"Distributional semantics","score":0.4205384850502014},{"id":"https://openalex.org/keywords/meaning","display_name":"Meaning (existential)","score":0.4200670123100281},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.4150620698928833},{"id":"https://openalex.org/keywords/word-sense-disambiguation","display_name":"Word-sense disambiguation","score":0.41028133034706116},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.33280786871910095},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.2508271336555481},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.24714237451553345},{"id":"https://openalex.org/keywords/wordnet","display_name":"WordNet","score":0.17336416244506836},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.12755820155143738}],"concepts":[{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.7817007303237915},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.714777946472168},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.708349347114563},{"id":"https://openalex.org/C130440534","wikidata":"https://www.wikidata.org/wiki/Q14946528","display_name":"Conflation","level":2,"score":0.6997118592262268},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6624854207038879},{"id":"https://openalex.org/C2777462759","wikidata":"https://www.wikidata.org/wiki/Q18395344","display_name":"Word embedding","level":3,"score":0.6226365566253662},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5973197817802429},{"id":"https://openalex.org/C13336665","wikidata":"https://www.wikidata.org/wiki/Q125977","display_name":"Vector space","level":2,"score":0.5457959175109863},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5425854325294495},{"id":"https://openalex.org/C2986420190","wikidata":"https://www.wikidata.org/wiki/Q39045939","display_name":"Semantic space","level":2,"score":0.4770599901676178},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4290751814842224},{"id":"https://openalex.org/C2778828372","wikidata":"https://www.wikidata.org/wiki/Q5283209","display_name":"Distributional semantics","level":3,"score":0.4205384850502014},{"id":"https://openalex.org/C2780876879","wikidata":"https://www.wikidata.org/wiki/Q3054749","display_name":"Meaning (existential)","level":2,"score":0.4200670123100281},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.4150620698928833},{"id":"https://openalex.org/C51646954","wikidata":"https://www.wikidata.org/wiki/Q48522","display_name":"Word-sense disambiguation","level":3,"score":0.41028133034706116},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.33280786871910095},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.2508271336555481},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.24714237451553345},{"id":"https://openalex.org/C157659113","wikidata":"https://www.wikidata.org/wiki/Q533822","display_name":"WordNet","level":2,"score":0.17336416244506836},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.12755820155143738},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C542102704","wikidata":"https://www.wikidata.org/wiki/Q183257","display_name":"Psychotherapist","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":6,"locations":[{"id":"doi:10.18653/v1/p19-1574","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1574","pdf_url":"https://www.aclweb.org/anthology/P19-1574.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1906.03608","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1906.03608","pdf_url":"https://arxiv.org/pdf/1906.03608","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:2948075061","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1906.03608","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:epub.ub.uni-muenchen.de:72190","is_oa":true,"landing_page_url":"http://nbn-resolving.de/urn:nbn:de:bvb:19-epub-72190-4","pdf_url":null,"source":{"id":"https://openalex.org/S4306401845","display_name":"Open access LMU (Ludwid Maxmilian's Universitat Munchen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I8204097","host_organization_name":"Ludwig-Maximilians-Universit\u00e4t M\u00fcnchen","host_organization_lineage":["https://openalex.org/I8204097"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Konferenz"},{"id":"doi:10.48550/arxiv.1906.03608","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1906.03608","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"doi:10.5282/ubm/epub.72190","is_oa":true,"landing_page_url":"https://doi.org/10.5282/ubm/epub.72190","pdf_url":null,"source":{"id":"https://openalex.org/S7407052039","display_name":"Universit\u00e4tsbibliothek der LMU","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.18653/v1/p19-1574","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1574","pdf_url":"https://www.aclweb.org/anthology/P19-1574.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.75,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320308943","display_name":"Microsoft Research","ror":"https://ror.org/00d0nc645"},{"id":"https://openalex.org/F4320321919","display_name":"Euskal Herriko Unibertsitatea","ror":"https://ror.org/000xsnr85"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2948075061.pdf","grobid_xml":"https://content.openalex.org/works/W2948075061.grobid-xml"},"referenced_works_count":52,"referenced_works":["https://openalex.org/W125820043","https://openalex.org/W1010415138","https://openalex.org/W1614298861","https://openalex.org/W1980776243","https://openalex.org/W2026185168","https://openalex.org/W2040004971","https://openalex.org/W2051390224","https://openalex.org/W2065030658","https://openalex.org/W2065157922","https://openalex.org/W2091117392","https://openalex.org/W2101234009","https://openalex.org/W2114524997","https://openalex.org/W2116715664","https://openalex.org/W2130337399","https://openalex.org/W2131357087","https://openalex.org/W2149671658","https://openalex.org/W2160660844","https://openalex.org/W2162456950","https://openalex.org/W2163455955","https://openalex.org/W2164019165","https://openalex.org/W2171082019","https://openalex.org/W2250539671","https://openalex.org/W2296194829","https://openalex.org/W2406945108","https://openalex.org/W2436001372","https://openalex.org/W2507974895","https://openalex.org/W2511478665","https://openalex.org/W2512498397","https://openalex.org/W2519468206","https://openalex.org/W2587764909","https://openalex.org/W2622670270","https://openalex.org/W2780932362","https://openalex.org/W2790235966","https://openalex.org/W2798287132","https://openalex.org/W2889647547","https://openalex.org/W2891958973","https://openalex.org/W2953369973","https://openalex.org/W2962713724","https://openalex.org/W2962739339","https://openalex.org/W2962926715","https://openalex.org/W2963341956","https://openalex.org/W2963430224","https://openalex.org/W2963639656","https://openalex.org/W2963672540","https://openalex.org/W2963677631","https://openalex.org/W2963756346","https://openalex.org/W2963850840","https://openalex.org/W2964204621","https://openalex.org/W2964210975","https://openalex.org/W2964303159","https://openalex.org/W3098861490","https://openalex.org/W3101950626"],"related_works":["https://openalex.org/W2981499762","https://openalex.org/W2989798563","https://openalex.org/W3202858538","https://openalex.org/W2252085576","https://openalex.org/W2794132063","https://openalex.org/W2614551030","https://openalex.org/W2941076272","https://openalex.org/W2108061274","https://openalex.org/W3135353212","https://openalex.org/W2558421169","https://openalex.org/W2889801236","https://openalex.org/W2798542442","https://openalex.org/W2809234507","https://openalex.org/W2963033440","https://openalex.org/W2579644692","https://openalex.org/W3132982245","https://openalex.org/W2262907013","https://openalex.org/W2804313859","https://openalex.org/W2787788033","https://openalex.org/W2986907052"],"abstract_inverted_index":{"Word":[0],"embeddings":[1,17,84,95],"typically":[2],"represent":[3],"different":[4,62],"meanings":[5],"of":[6,16,18,28],"a":[7,10,47,106,113,128],"word":[8,37,56,59,83,129],"in":[9,112,147],"single":[11],"conflated":[12],"vector.":[13],"Empirical":[14],"analysis":[15],"ambiguous":[19],"words":[20,63],"is":[21,70,108,119,130],"currently":[22],"limited":[23],"by":[24,33,66,93],"the":[25,34,71,90,117],"small":[26],"size":[27],"manually":[29],"annotated":[30],"resources":[31],"and":[32,55,88],"fact":[35],"that":[36],"senses":[38,60,142],"are":[39,64,143],"treated":[40],"as":[41],"unrelated":[42],"individual":[43],"concepts.":[44],"We":[45],"present":[46],"large":[48],"dataset":[49],"based":[50,134],"on":[51,136,156,163],"manual":[52],"Wikipedia":[53],"annotations":[54],"senses,":[57],"where":[58],"from":[61],"related":[65],"semantic":[67,86,97],"classes.":[68,98],"This":[69],"basis":[72],"for":[73,77,85],"novel":[74],"diagnostic":[75],"tests":[76],"an":[78,157],"embedding's":[79],"content:":[80],"we":[81],"probe":[82],"classes":[87],"analyze":[89],"embedding":[91,115],"space":[92],"classifying":[94],"into":[96],"Our":[99],"main":[100],"findings":[101],"are:":[102],"(i)":[103],"Information":[104],"about":[105],"sense":[107,118],"generally":[109],"represented":[110,146],"well":[111,145],"single-vector":[114,148],"-if":[116],"frequent.":[120],"(ii)":[121],"A":[122],"classifier":[123],"can":[124],"accurately":[125],"predict":[126],"whether":[127],"single-sense":[131],"or":[132],"multi-sense,":[133],"only":[135],"its":[137],"embedding.":[138],"(iii)":[139],"Although":[140],"rare":[141],"not":[144,152],"embeddings,":[149],"this":[150],"does":[151],"have":[153],"negative":[154],"impact":[155],"NLP":[158],"application":[159],"whose":[160],"performance":[161],"depends":[162],"frequent":[164],"senses.":[165]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
