{"id":"https://openalex.org/W2970635698","doi":"https://doi.org/10.18653/v1/w19-5117","title":"Neural Lemmatization of Multiword Expressions","display_name":"Neural Lemmatization of Multiword Expressions","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2970635698","doi":"https://doi.org/10.18653/v1/w19-5117","mag":"2970635698"},"language":"en","primary_location":{"id":"doi:10.18653/v1/w19-5117","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w19-5117","pdf_url":"https://www.aclweb.org/anthology/W19-5117.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Joint Workshop on Multiword Expressions and WordNet (MWE-WN 2019)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/W19-5117.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026579029","display_name":"Marine Schmitt","orcid":null},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I4210121906","display_name":"Analyse et Traitement Informatique de la Langue Fran\u00e7aise","ror":"https://ror.org/02cy9g557","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I4210121906","https://openalex.org/I4210150854","https://openalex.org/I90183372"]},{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Marine Schmitt","raw_affiliation_strings":["Universit de Lorraine & CNRS ATILF F-54000 Nancy, France","ATILF - Analyse et Traitement Informatique de la Langue Fran\u00e7aise (Universit\u00e9 de Lorraine, 44 Av de la Lib\u00e9ration, BP 30687 54063 Nancy Cedex - France)"],"affiliations":[{"raw_affiliation_string":"Universit de Lorraine & CNRS ATILF F-54000 Nancy, France","institution_ids":["https://openalex.org/I90183372","https://openalex.org/I1294671590","https://openalex.org/I4210121906"]},{"raw_affiliation_string":"ATILF - Analyse et Traitement Informatique de la Langue Fran\u00e7aise (Universit\u00e9 de Lorraine, 44 Av de la Lib\u00e9ration, BP 30687 54063 Nancy Cedex - France)","institution_ids":["https://openalex.org/I90183372","https://openalex.org/I4210121906"]}]},{"author_position":"last","author":{"id":null,"display_name":"Mathieu Constant","orcid":null},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I4210121906","display_name":"Analyse et Traitement Informatique de la Langue Fran\u00e7aise","ror":"https://ror.org/02cy9g557","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I4210121906","https://openalex.org/I4210150854","https://openalex.org/I90183372"]},{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Mathieu Constant","raw_affiliation_strings":["Universit de Lorraine & CNRS ATILF F-54000 Nancy, France","ATILF - Analyse et Traitement Informatique de la Langue Fran\u00e7aise (Universit\u00e9 de Lorraine, 44 Av de la Lib\u00e9ration, BP 30687 54063 Nancy Cedex - France)"],"affiliations":[{"raw_affiliation_string":"Universit de Lorraine & CNRS ATILF F-54000 Nancy, France","institution_ids":["https://openalex.org/I90183372","https://openalex.org/I1294671590","https://openalex.org/I4210121906"]},{"raw_affiliation_string":"ATILF - Analyse et Traitement Informatique de la Langue Fran\u00e7aise (Universit\u00e9 de Lorraine, 44 Av de la Lib\u00e9ration, BP 30687 54063 Nancy Cedex - France)","institution_ids":["https://openalex.org/I90183372","https://openalex.org/I4210121906"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5026579029"],"corresponding_institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I4210121906","https://openalex.org/I90183372"],"apc_list":null,"apc_paid":null,"fwci":0.289,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.66845203,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"142","last_page":"148"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/lemmatisation","display_name":"Lemmatisation","score":0.9049814343452454},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8210904598236084},{"id":"https://openalex.org/keywords/lemma","display_name":"Lemma (botany)","score":0.7223376631736755},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6661556363105774},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6260359883308411},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.6177011132240295},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5966468453407288},{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.5920811891555786},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.5043483972549438},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.48247721791267395},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.41628652811050415},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3963729739189148},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3903505802154541},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.23772504925727844},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10475856065750122}],"concepts":[{"id":"https://openalex.org/C161831844","wikidata":"https://www.wikidata.org/wiki/Q2554325","display_name":"Lemmatisation","level":2,"score":0.9049814343452454},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8210904598236084},{"id":"https://openalex.org/C2777759810","wikidata":"https://www.wikidata.org/wiki/Q149316","display_name":"Lemma (botany)","level":3,"score":0.7223376631736755},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6661556363105774},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6260359883308411},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.6177011132240295},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5966468453407288},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.5920811891555786},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.5043483972549438},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.48247721791267395},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.41628652811050415},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3963729739189148},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3903505802154541},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.23772504925727844},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10475856065750122},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C46757340","wikidata":"https://www.wikidata.org/wiki/Q43238","display_name":"Poaceae","level":2,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.18653/v1/w19-5117","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w19-5117","pdf_url":"https://www.aclweb.org/anthology/W19-5117.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Joint Workshop on Multiword Expressions and WordNet (MWE-WN 2019)","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-03229308v1","is_oa":true,"landing_page_url":"https://hal.science/hal-03229308","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Proceedings of the Joint Workshop on Multiword Expressions and WordNet (MWE-WN 2019), Aug 2019, Florence, Italy. pp.142-148, &#x27E8;10.18653/v1/W19-5117&#x27E9;","raw_type":"Conference papers"}],"best_oa_location":{"id":"doi:10.18653/v1/w19-5117","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/w19-5117","pdf_url":"https://www.aclweb.org/anthology/W19-5117.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Joint Workshop on Multiword Expressions and WordNet (MWE-WN 2019)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.5099999904632568,"id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G2503264477","display_name":null,"funder_award_id":"ANR-14-CERA-0001","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G5348246107","display_name":null,"funder_award_id":"ANR-15-IDEX-0","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G7166692799","display_name":null,"funder_award_id":"ANR-15-I","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G8254623148","display_name":null,"funder_award_id":"ANR-15-IDEX-04-LUE","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G8918884702","display_name":null,"funder_award_id":"15-IDEX-04-LUE","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"}],"funders":[{"id":"https://openalex.org/F4320320883","display_name":"Agence Nationale de la Recherche","ror":"https://ror.org/00rbzpz17"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2970635698.pdf","grobid_xml":"https://content.openalex.org/works/W2970635698.grobid-xml"},"referenced_works_count":31,"referenced_works":["https://openalex.org/W1498763386","https://openalex.org/W1582588624","https://openalex.org/W1865928303","https://openalex.org/W2049018290","https://openalex.org/W2051846017","https://openalex.org/W2057138859","https://openalex.org/W2098908879","https://openalex.org/W2114121678","https://openalex.org/W2115673450","https://openalex.org/W2133564696","https://openalex.org/W2143391265","https://openalex.org/W2159083246","https://openalex.org/W2159714709","https://openalex.org/W2251102497","https://openalex.org/W2251386579","https://openalex.org/W2251864848","https://openalex.org/W2577871717","https://openalex.org/W2616272086","https://openalex.org/W2664496537","https://openalex.org/W2735555159","https://openalex.org/W2741029840","https://openalex.org/W2772814603","https://openalex.org/W2804387108","https://openalex.org/W2840687837","https://openalex.org/W2888274736","https://openalex.org/W2902945038","https://openalex.org/W2964308564","https://openalex.org/W3096630569","https://openalex.org/W4285038102","https://openalex.org/W4293361313","https://openalex.org/W4301691548"],"related_works":["https://openalex.org/W2887281027","https://openalex.org/W4288429387","https://openalex.org/W1552656226","https://openalex.org/W1561563106","https://openalex.org/W2116831595","https://openalex.org/W2884860922","https://openalex.org/W3042025871","https://openalex.org/W2226076398","https://openalex.org/W2251336637","https://openalex.org/W1562768541"],"abstract_inverted_index":{"This":[0],"article":[1],"focuses":[2],"on":[3,28,38,42,90],"the":[4,25,29,33,44,48,58,62,76,80,86],"lemmatization":[5],"of":[6,32,47,61,74,79,85],"multiword":[7],"expressions":[8],"(MWEs).":[9],"We":[10],"propose":[11],"a":[12,91],"deep":[13],"encoder-decoder":[14],"architecture":[15],"generating":[16,75],"for":[17,82,101,112],"every":[18],"MWE":[19,63,87],"word":[20,59,84],"its":[21],"corresponding":[22,77],"part":[23,78],"in":[24,72],"lemma,":[26],"based":[27,41,89],"internal":[30],"context":[31],"MWE.":[34],"The":[35,70],"encoder":[36],"relies":[37],"recurrent":[39,95],"networks":[40],"(1)":[43],"character":[45],"sequence":[46,60],"individual":[49],"words":[50],"to":[51,64],"capture":[52,65],"their":[53],"morphological":[54],"properties,":[55],"and":[56,67,105,107],"(2)":[57],"lexical":[66],"syntactic":[68],"properties.":[69],"decoder":[71],"charge":[73],"lemma":[81],"each":[83],"is":[88,99],"classical":[92],"character-level":[93],"attention-based":[94],"model.":[96],"Our":[97],"model":[98],"evaluated":[100],"Italian,":[102],"French,":[103],"Polish":[104],"Portuguese":[106],"shows":[108],"good":[109],"performances":[110],"except":[111],"Polish.":[113]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-16T08:26:57.006410","created_date":"2025-10-10T00:00:00"}
