{"id":"https://openalex.org/W2518048962","doi":"https://doi.org/10.18653/v1/w16-1623","title":"Using Embedding Masks for Word Categorization","display_name":"Using Embedding Masks for Word Categorization","publication_year":2016,"publication_date":"2016-01-01","ids":{"openalex":"https://openalex.org/W2518048962","doi":"https://doi.org/10.18653/v1/w16-1623","mag":"2518048962"},"language":"en","primary_location":{"id":"doi:10.18653/v1/w16-1623","is_oa":true,"landing_page_url":"http://doi.org/10.18653/v1/w16-1623","pdf_url":"https://doi.org/10.18653/v1/w16-1623","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st Workshop on Representation Learning for NLP","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.18653/v1/w16-1623","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073856277","display_name":"\u015etefan Ru\u015fe\u0163i","orcid":"https://orcid.org/0000-0002-0380-6814"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Stefan Ruseti","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077365712","display_name":"Traian Rebedea","orcid":"https://orcid.org/0000-0002-7255-5537"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Traian Rebedea","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5077419846","display_name":"\u0218tefan Tr\u0103u\u0219an-Matu","orcid":"https://orcid.org/0000-0001-8082-8497"},"institutions":[{"id":"https://openalex.org/I61641377","display_name":"Universitatea Na\u021bional\u0103 de \u0218tiin\u021b\u0103 \u0219i Tehnologie Politehnica Bucure\u0219ti","ror":"https://ror.org/0558j5q12","country_code":"RO","type":"education","lineage":["https://openalex.org/I61641377"]}],"countries":["RO"],"is_corresponding":false,"raw_author_name":"Stefan Trausan-Matu","raw_affiliation_strings":["\u201cPolitehnica\u201c University of Bucharest"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"\u201cPolitehnica\u201c University of Bucharest","institution_ids":["https://openalex.org/I61641377"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5073856277"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.8834,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.84490261,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"201","last_page":"205"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/categorization","display_name":"Categorization","score":0.7508805990219116},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.7324038147926331},{"id":"https://openalex.org/keywords/word-embedding","display_name":"Word embedding","score":0.7246368527412415},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.7158187627792358},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7038165330886841},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6969035267829895},{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.6755058765411377},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.636830747127533},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.6313341856002808},{"id":"https://openalex.org/keywords/vector-space","display_name":"Vector space","score":0.598840594291687},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5685802698135376},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.5096800327301025},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.4381505250930786},{"id":"https://openalex.org/keywords/series","display_name":"Series (stratigraphy)","score":0.4361400306224823},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.41415613889694214},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.23546653985977173},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2087649703025818},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.15703365206718445},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.13012629747390747}],"concepts":[{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.7508805990219116},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.7324038147926331},{"id":"https://openalex.org/C2777462759","wikidata":"https://www.wikidata.org/wiki/Q18395344","display_name":"Word embedding","level":3,"score":0.7246368527412415},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.7158187627792358},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7038165330886841},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6969035267829895},{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.6755058765411377},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.636830747127533},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.6313341856002808},{"id":"https://openalex.org/C13336665","wikidata":"https://www.wikidata.org/wiki/Q125977","display_name":"Vector space","level":2,"score":0.598840594291687},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5685802698135376},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.5096800327301025},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.4381505250930786},{"id":"https://openalex.org/C143724316","wikidata":"https://www.wikidata.org/wiki/Q312468","display_name":"Series (stratigraphy)","level":2,"score":0.4361400306224823},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.41415613889694214},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.23546653985977173},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2087649703025818},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.15703365206718445},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.13012629747390747},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/w16-1623","is_oa":true,"landing_page_url":"http://doi.org/10.18653/v1/w16-1623","pdf_url":"https://doi.org/10.18653/v1/w16-1623","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st Workshop on Representation Learning for NLP","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/w16-1623","is_oa":true,"landing_page_url":"http://doi.org/10.18653/v1/w16-1623","pdf_url":"https://doi.org/10.18653/v1/w16-1623","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st Workshop on Representation Learning for NLP","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.8100000023841858,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W1503259811","https://openalex.org/W1614298861","https://openalex.org/W1880262756","https://openalex.org/W1983578042","https://openalex.org/W2081580037","https://openalex.org/W2108919995","https://openalex.org/W2125031621","https://openalex.org/W2141599568","https://openalex.org/W2162456950","https://openalex.org/W2250539671","https://openalex.org/W2251123913","https://openalex.org/W2964232431"],"related_works":["https://openalex.org/W2165912799","https://openalex.org/W2735662278","https://openalex.org/W2382615723","https://openalex.org/W4311804456","https://openalex.org/W1987484445","https://openalex.org/W2623658258","https://openalex.org/W2798669739","https://openalex.org/W2953242939","https://openalex.org/W2612746495","https://openalex.org/W4292355215"],"abstract_inverted_index":{"Word":[0],"embeddings":[1,37,48,68],"are":[2],"widely":[3],"used":[4,34],"nowadays":[5],"for":[6,83,122],"many":[7],"NLP":[8],"tasks.":[9],"They":[10],"reduce":[11],"the":[12,15,26,36,110,114],"dimensionality":[13],"of":[14,28,40,92,97],"vocabulary":[16],"space,":[17],"but":[18],"most":[19],"importantly":[20],"they":[21],"should":[22],"capture":[23],"(part":[24],"of)":[25],"meaning":[27],"words.":[29],"The":[30],"new":[31,64],"vector":[32,52],"space":[33],"by":[35,74],"allows":[38],"computation":[39],"semantic":[41],"distances":[42],"between":[43],"words,":[44],"while":[45],"some":[46],"word":[47,67],"also":[49],"permit":[50],"simple":[51],"operations":[53],"(e.g.":[54],"summation,":[55],"difference)":[56],"resembling":[57],"analogical":[58],"reasoning.":[59],"This":[60],"paper":[61,115],"proposes":[62],"a":[63,90],"operation":[65],"on":[66,100],"aimed":[69],"to":[70,95],"capturing":[71],"categorical":[72],"information":[73],"first":[75],"learning":[76],"and":[77],"then":[78],"applying":[79],"an":[80],"embedding":[81,119],"mask":[82],"each":[84,123],"analyzed":[85],"category.":[86,124],"Thus,":[87],"we":[88],"conducted":[89],"series":[91],"experiments":[93],"related":[94],"categorization":[96],"words":[98],"based":[99],"their":[101],"embeddings.":[102],"Several":[103],"classical":[104],"approaches":[105],"were":[106],"compared":[107],"together":[108],"with":[109],"one":[111],"introduced":[112],"in":[113],"which":[116],"uses":[117],"different":[118],"masks":[120],"learnt":[121]},"counts_by_year":[{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2026-05-19T21:40:30.786675","created_date":"2025-10-10T00:00:00"}
