{"id":"https://openalex.org/W2941819978","doi":"https://doi.org/10.18653/v1/p19-1300","title":"Unsupervised Multilingual Word Embedding with Limited Resources using Neural Language Models","display_name":"Unsupervised Multilingual Word Embedding with Limited Resources using Neural Language Models","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2941819978","doi":"https://doi.org/10.18653/v1/p19-1300","mag":"2941819978"},"language":"en","primary_location":{"id":"doi:10.18653/v1/p19-1300","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1300","pdf_url":"https://www.aclweb.org/anthology/P19-1300.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/P19-1300.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057566812","display_name":"Takashi Wada","orcid":"https://orcid.org/0009-0006-1586-7530"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Takashi Wada","raw_affiliation_strings":["Nara Institute of Science and Technology"],"affiliations":[{"raw_affiliation_string":"Nara Institute of Science and Technology","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034538103","display_name":"Tomoharu Iwata","orcid":"https://orcid.org/0000-0003-4425-1971"},"institutions":[{"id":"https://openalex.org/I4210126580","display_name":"RIKEN Center for Advanced Intelligence Project","ror":"https://ror.org/03ckxwf91","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210126580"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tomoharu Iwata","raw_affiliation_strings":["NTT Communication Science Laboratories","RIKEN Center for Advanced Intelligence Project (AIP)"],"affiliations":[{"raw_affiliation_string":"NTT Communication Science Laboratories","institution_ids":[]},{"raw_affiliation_string":"RIKEN Center for Advanced Intelligence Project (AIP)","institution_ids":["https://openalex.org/I4210126580"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5072032804","display_name":"Y\u016bji Matsumoto","orcid":"https://orcid.org/0000-0003-4946-9574"},"institutions":[{"id":"https://openalex.org/I4210126580","display_name":"RIKEN Center for Advanced Intelligence Project","ror":"https://ror.org/03ckxwf91","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210126580"]},{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yuji Matsumoto","raw_affiliation_strings":["Nara Institute of Science and Technology","RIKEN Center for Advanced Intelligence Project (AIP)"],"affiliations":[{"raw_affiliation_string":"Nara Institute of Science and Technology","institution_ids":["https://openalex.org/I75917431"]},{"raw_affiliation_string":"RIKEN Center for Advanced Intelligence Project (AIP)","institution_ids":["https://openalex.org/I4210126580"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5057566812"],"corresponding_institution_ids":["https://openalex.org/I75917431"],"apc_list":null,"apc_paid":null,"fwci":2.4562,"has_fulltext":true,"cited_by_count":28,"citation_normalized_percentile":{"value":0.91578972,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"3113","last_page":"3124"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8351471424102783},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.7493882179260254},{"id":"https://openalex.org/keywords/word-embedding","display_name":"Word embedding","score":0.6576792597770691},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6508689522743225},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6486701965332031},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6079666614532471},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5273799896240234},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.5241793990135193},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5028049945831299},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.47780805826187134},{"id":"https://openalex.org/keywords/unsupervised-learning","display_name":"Unsupervised learning","score":0.4358426630496979},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4203197956085205},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.15976649522781372},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10607528686523438}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8351471424102783},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.7493882179260254},{"id":"https://openalex.org/C2777462759","wikidata":"https://www.wikidata.org/wiki/Q18395344","display_name":"Word embedding","level":3,"score":0.6576792597770691},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6508689522743225},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6486701965332031},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6079666614532471},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5273799896240234},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.5241793990135193},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5028049945831299},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.47780805826187134},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.4358426630496979},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4203197956085205},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.15976649522781372},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10607528686523438},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.18653/v1/p19-1300","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1300","pdf_url":"https://www.aclweb.org/anthology/P19-1300.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},{"id":"pmh:oai:library.naist.jp:10061/13250","is_oa":false,"landing_page_url":"http://hdl.handle.net/10061/13250","pdf_url":null,"source":{"id":"https://openalex.org/S4377196843","display_name":"NAIST Digital Library (Nara Institute of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I75917431","host_organization_name":"Nara Institute of Science and Technology","host_organization_lineage":["https://openalex.org/I75917431"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Thesis or Dissertation"}],"best_oa_location":{"id":"doi:10.18653/v1/p19-1300","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1300","pdf_url":"https://www.aclweb.org/anthology/P19-1300.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"No poverty","id":"https://metadata.un.org/sdg/1","score":0.4300000071525574}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2941819978.pdf","grobid_xml":"https://content.openalex.org/works/W2941819978.grobid-xml"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W22168010","https://openalex.org/W114517082","https://openalex.org/W179875071","https://openalex.org/W1614298861","https://openalex.org/W1815076433","https://openalex.org/W2007780422","https://openalex.org/W2095705004","https://openalex.org/W2099471712","https://openalex.org/W2118090838","https://openalex.org/W2126725946","https://openalex.org/W2171082019","https://openalex.org/W2187089797","https://openalex.org/W2294774419","https://openalex.org/W2467585580","https://openalex.org/W2594021297","https://openalex.org/W2740132093","https://openalex.org/W2741986357","https://openalex.org/W2760424551","https://openalex.org/W2788353357","https://openalex.org/W2807669488","https://openalex.org/W2888536529","https://openalex.org/W2889894161","https://openalex.org/W2899486018","https://openalex.org/W2952190837","https://openalex.org/W2962739339","https://openalex.org/W2963047628","https://openalex.org/W2963118869","https://openalex.org/W2963467085","https://openalex.org/W2964266061","https://openalex.org/W4234117503","https://openalex.org/W4293763774","https://openalex.org/W4299579390","https://openalex.org/W4320013936"],"related_works":["https://openalex.org/W4288407670","https://openalex.org/W947140380","https://openalex.org/W2911655849","https://openalex.org/W4286432911","https://openalex.org/W4230884544","https://openalex.org/W4245453790","https://openalex.org/W3194985222","https://openalex.org/W3216571906","https://openalex.org/W4214830338","https://openalex.org/W2518587255"],"abstract_inverted_index":{"Recently,":[0],"a":[1,30,77,99],"variety":[2],"of":[3,14,66,102,114,133,143,156,201],"unsupervised":[4,79,191,207],"methods":[5,26,68,195,208],"have":[6,179],"been":[7,49],"proposed":[8,122],"that":[9,37,51,83],"map":[10],"pre-trained":[11],"word":[12,39,154,176],"embeddings":[13,40,155,166],"different":[15,118,157],"languages":[16,145,158],"into":[17,146],"the":[18,35,64,112,134,147,160,183],"same":[19,148,161],"space":[20],"without":[21,167],"any":[22,168],"parallel":[23,169],"data.":[24],"These":[25],"aim":[27],"to":[28],"find":[29],"linear":[31],"transformation":[32],"based":[33],"on":[34,57,87,175,182],"assumption":[36,53,89],"monolingual":[38,103,115],"are":[41,108,117],"approximately":[42],"isomorphic":[43],"between":[44],"languages.":[45,120,213],"However,":[46],"it":[47],"has":[48],"demonstrated":[50,180],"this":[52,73],"holds":[54],"true":[55],"only":[56,98],"specific":[58],"conditions,":[59],"and":[60,90,140,163,192],"with":[61,197],"limited":[62],"resources,":[63],"performance":[65],"these":[67],"decreases":[69],"drastically.":[70],"To":[71],"overcome":[72],"problem,":[74],"we":[75,125],"propose":[76],"new":[78],"multilingual":[80,165],"embedding":[81],"method":[82],"does":[84],"not":[85],"rely":[86],"such":[88],"performs":[91],"well":[92],"under":[93],"resource-poor":[94],"scenarios,":[95],"namely":[96],"when":[97,111],"small":[100],"amount":[101],"data":[104,116,170],"(i.e.,":[105],"50k":[106],"sentences)":[107],"available,":[109],"or":[110,171],"domains":[113],"across":[119,212],"Our":[121,173,203,214],"model,":[123],"which":[124],"call":[126],"'Multilingual":[127],"Neural":[128],"Language":[129],"Models',":[130],"shares":[131],"some":[132],"network":[135],"parameters":[136],"among":[137],"multiple":[138,144],"languages,":[139],"encodes":[141],"sentences":[142],"space.":[149],"The":[150],"model":[151,187,204],"jointly":[152],"learns":[153],"in":[159],"space,":[162],"generates":[164],"pre-training.":[172],"experiments":[174],"alignment":[177],"tasks":[178],"that,":[181],"low-resource":[184],"condition,":[185],"our":[186],"substantially":[188],"outperforms":[189,206],"existing":[190],"even":[193],"supervised":[194],"trained":[196],"500":[198],"bilingual":[199],"pairs":[200],"words.":[202],"also":[205],"given":[209],"different-domain":[210],"corpora":[211],"code":[215],"is":[216],"publicly":[217],"available":[218],"1":[219],".":[220]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
