{"id":"https://openalex.org/W3203813575","doi":"https://doi.org/10.1109/access.2021.3118093","title":"Inferring Multilingual Domain-Specific Word Embeddings From Large Document Corpora","display_name":"Inferring Multilingual Domain-Specific Word Embeddings From Large Document Corpora","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3203813575","doi":"https://doi.org/10.1109/access.2021.3118093","mag":"3203813575"},"language":"en","primary_location":{"id":"doi:10.1109/access.2021.3118093","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3118093","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09559966.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09559966.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001746215","display_name":"Luca Cagliero","orcid":"https://orcid.org/0000-0002-7185-5247"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Politecnico di Torino","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Luca Cagliero","raw_affiliation_strings":["Politecnico di Torino, Corso Duca degli Abruzzi, 24 10129 Turin (Italy). (e-mail: luca.cagliero@polito.it)","Politecnico di Torino, Corso Duca degli Abruzzi, 24 10129 Turin (Italy"],"raw_orcid":"https://orcid.org/0000-0002-7185-5247","affiliations":[{"raw_affiliation_string":"Politecnico di Torino, Corso Duca degli Abruzzi, 24 10129 Turin (Italy). (e-mail: luca.cagliero@polito.it)","institution_ids":["https://openalex.org/I177477856"]},{"raw_affiliation_string":"Politecnico di Torino, Corso Duca degli Abruzzi, 24 10129 Turin (Italy","institution_ids":["https://openalex.org/I177477856"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078641012","display_name":"Moreno La Quatra","orcid":"https://orcid.org/0000-0001-8838-064X"},"institutions":[{"id":"https://openalex.org/I177477856","display_name":"Politecnico di Torino","ror":"https://ror.org/00bgk9508","country_code":"IT","type":"education","lineage":["https://openalex.org/I177477856"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Moreno La Quatra","raw_affiliation_strings":["Politecnico di Torino, Corso Duca degli Abruzzi, 24 10129 Turin (Italy)","Politecnico di Torino, Corso Duca degli Abruzzi, 24 10129 Turin (Italy"],"raw_orcid":"https://orcid.org/0000-0001-8838-064X","affiliations":[{"raw_affiliation_string":"Politecnico di Torino, Corso Duca degli Abruzzi, 24 10129 Turin (Italy)","institution_ids":["https://openalex.org/I177477856"]},{"raw_affiliation_string":"Politecnico di Torino, Corso Duca degli Abruzzi, 24 10129 Turin (Italy","institution_ids":["https://openalex.org/I177477856"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5001746215"],"corresponding_institution_ids":["https://openalex.org/I177477856"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.6996,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.76739456,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"9","issue":null,"first_page":"137309","last_page":"137321"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8939480781555176},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.7296050190925598},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6942757368087769},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.6261957883834839},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5983534455299377},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.527600109577179},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5265179872512817},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4917941391468048},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.42600953578948975},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.41485488414764404},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.0761706531047821},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.07231888175010681}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8939480781555176},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.7296050190925598},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6942757368087769},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.6261957883834839},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5983534455299377},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.527600109577179},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5265179872512817},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4917941391468048},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.42600953578948975},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.41485488414764404},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0761706531047821},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.07231888175010681},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/access.2021.3118093","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3118093","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09559966.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:f343696f39844982bf9a466cdac10f91","is_oa":true,"landing_page_url":"https://doaj.org/article/f343696f39844982bf9a466cdac10f91","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 9, Pp 137309-137321 (2021)","raw_type":"article"},{"id":"pmh:oai:zenodo.org:140651","is_oa":true,"landing_page_url":"https://www.openaccessrepository.it/record/140651","pdf_url":null,"source":{"id":"https://openalex.org/S4306402478","display_name":"INFM-OAR (INFN Catania)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210116497","host_organization_name":"Istituto Nazionale di Fisica Nucleare, Sezione di Catania","host_organization_lineage":["https://openalex.org/I4210116497"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"doi:10.1109/access.2021.3118093","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3118093","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09559966.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.7400000095367432,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320313985","display_name":"Politecnico di Torino","ror":"https://ror.org/00bgk9508"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3203813575.pdf","grobid_xml":"https://content.openalex.org/works/W3203813575.grobid-xml"},"referenced_works_count":69,"referenced_works":["https://openalex.org/W168564468","https://openalex.org/W1523296404","https://openalex.org/W1697700638","https://openalex.org/W1970161214","https://openalex.org/W2088212442","https://openalex.org/W2101234009","https://openalex.org/W2153579005","https://openalex.org/W2163426343","https://openalex.org/W2248676660","https://openalex.org/W2250539671","https://openalex.org/W2404244834","https://openalex.org/W2493916176","https://openalex.org/W2530085701","https://openalex.org/W2752172973","https://openalex.org/W2791766977","https://openalex.org/W2803176955","https://openalex.org/W2804580284","https://openalex.org/W2807399069","https://openalex.org/W2882319491","https://openalex.org/W2891896107","https://openalex.org/W2896457183","https://openalex.org/W2897103370","https://openalex.org/W2899286282","https://openalex.org/W2909182718","https://openalex.org/W2913433659","https://openalex.org/W2921634120","https://openalex.org/W2962739339","https://openalex.org/W2962755455","https://openalex.org/W2962844668","https://openalex.org/W2962887999","https://openalex.org/W2962936818","https://openalex.org/W2963216505","https://openalex.org/W2963341956","https://openalex.org/W2963472233","https://openalex.org/W2963667932","https://openalex.org/W2964325543","https://openalex.org/W2964921277","https://openalex.org/W2970597249","https://openalex.org/W2983766176","https://openalex.org/W2998704965","https://openalex.org/W3001434439","https://openalex.org/W3034378323","https://openalex.org/W3035009610","https://openalex.org/W3080236009","https://openalex.org/W3090350559","https://openalex.org/W3102264439","https://openalex.org/W3107826490","https://openalex.org/W3117605583","https://openalex.org/W3122135088","https://openalex.org/W3132982245","https://openalex.org/W4232619139","https://openalex.org/W4288620981","https://openalex.org/W4294170691","https://openalex.org/W4297801177","https://openalex.org/W4299579390","https://openalex.org/W4302571896","https://openalex.org/W6637707414","https://openalex.org/W6675354045","https://openalex.org/W6680532216","https://openalex.org/W6682691769","https://openalex.org/W6743384090","https://openalex.org/W6744957266","https://openalex.org/W6748304040","https://openalex.org/W6752242417","https://openalex.org/W6752325554","https://openalex.org/W6755207826","https://openalex.org/W6758543384","https://openalex.org/W6763701032","https://openalex.org/W6789032802"],"related_works":["https://openalex.org/W2378211422","https://openalex.org/W2745001401","https://openalex.org/W4321353415","https://openalex.org/W2130974462","https://openalex.org/W972276598","https://openalex.org/W4246352526","https://openalex.org/W2028665553","https://openalex.org/W4230315250","https://openalex.org/W2086519370","https://openalex.org/W2944691285"],"abstract_inverted_index":{"The":[0,110,161,193],"use":[1],"of":[2,6,97,138,152,159,163,200],"distributed":[3],"vector":[4,18,150],"representations":[5],"words":[7,124],"in":[8,45,142],"Natural":[9],"Language":[10],"Processing":[11],"has":[12,190],"become":[13],"established.":[14],"To":[15,179],"tailor":[16,148],"general-purpose":[17,99],"spaces":[19],"to":[20,40,63,83,134,144,147,156],"the":[21,41,75,95,98,129,135,139,149,153,157,164,174,196,201],"context":[22],"under":[23],"analysis,":[24],"several":[25,46],"domain":[26,158],"adaptation":[27],"techniques":[28],"have":[29],"been":[30,191],"proposed.":[31],"They":[32],"all":[33],"require":[34],"sufficiently":[35],"large":[36,51],"document":[37,54],"corpora":[38,55],"tailored":[39],"target":[42,92,154],"domains.":[43],"However,":[44],"cross-lingual":[47],"NLP":[48],"domains":[49],"both":[50],"enough":[52],"domain-specific":[53,58,87,101,123],"and":[56,100,125,198],"pre-trained":[57],"word":[59,88,136,176],"vectors":[60,137],"are":[61],"hard":[62],"find":[64],"for":[65,90,104],"languages":[66],"other":[67],"than":[68],"English.":[69],"This":[70],"paper":[71],"aims":[72],"at":[73],"tackling":[74],"aforesaid":[76],"issue.":[77],"It":[78],"proposes":[79],"a":[80,91,105,116,182],"new":[81,183],"methodology":[82],"automatically":[84,121],"infer":[85],"aligned":[86],"embeddings":[89],"language":[93,107,141,155],"on":[94,115],"basis":[96],"models":[102],"available":[103],"source":[106,140],"(typically,":[108],"English).":[109],"proposed":[111,165,202],"inference":[112],"method":[113,166],"relies":[114],"two-step":[117],"process,":[118],"which":[119],"first":[120],"identifies":[122],"then":[126],"opportunistically":[127],"reuses":[128],"non-linear":[130],"space":[131,151],"transformations":[132],"applied":[133],"order":[143],"learn":[145],"how":[146],"interest.":[160],"performance":[162],"was":[167],"validated":[168],"via":[169],"extrinsic":[170],"evaluation":[171],"by":[172],"addressing":[173],"established":[175],"retrieval":[177],"task.":[178],"this":[180],"aim,":[181],"benchmark":[184],"multilingual":[185],"dataset,":[186],"derived":[187],"from":[188],"Wikipedia,":[189],"released.":[192],"results":[194],"confirmed":[195],"effectiveness":[197],"usability":[199],"approach.":[203]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2021-10-11T00:00:00"}
