{"id":"https://openalex.org/W2962915948","doi":"https://doi.org/10.18653/v1/p19-1125","title":"Imitation Learning for Non-Autoregressive Neural Machine Translation","display_name":"Imitation Learning for Non-Autoregressive Neural Machine Translation","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2962915948","doi":"https://doi.org/10.18653/v1/p19-1125","mag":"2962915948"},"language":"en","primary_location":{"id":"doi:10.18653/v1/p19-1125","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1125","pdf_url":"https://www.aclweb.org/anthology/P19-1125.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/P19-1125.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000258378","display_name":"Bingzhen Wei","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Bingzhen Wei","raw_affiliation_strings":["MOE Key Lab of Computational Linguistics, School of EECS, Peking University"],"affiliations":[{"raw_affiliation_string":"MOE Key Lab of Computational Linguistics, School of EECS, Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043256966","display_name":"Mingxuan Wang","orcid":"https://orcid.org/0000-0002-2858-6512"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mingxuan Wang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022574607","display_name":"Hao Zhou","orcid":"https://orcid.org/0000-0002-0173-0393"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hao Zhou","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100612233","display_name":"Junyang Lin","orcid":"https://orcid.org/0000-0001-9931-383X"},"institutions":[{"id":"https://openalex.org/I111483173","display_name":"King University","ror":"https://ror.org/01evb6z23","country_code":"US","type":"education","lineage":["https://openalex.org/I111483173"]},{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN","US"],"is_corresponding":false,"raw_author_name":"Junyang Lin","raw_affiliation_strings":["MOE Key Lab of Computational Linguistics, School of EECS, Peking University","School of Foreign Languages, Peking University"],"affiliations":[{"raw_affiliation_string":"MOE Key Lab of Computational Linguistics, School of EECS, Peking University","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Foreign Languages, Peking University","institution_ids":["https://openalex.org/I111483173","https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101441137","display_name":"Xu Sun","orcid":"https://orcid.org/0000-0001-8241-9320"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]},{"id":"https://openalex.org/I4210096250","display_name":"Beijing Institute of Big Data Research","ror":"https://ror.org/00s1sz824","country_code":"CN","type":"facility","lineage":["https://openalex.org/I20231570","https://openalex.org/I37796252","https://openalex.org/I4210096250"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xu Sun","raw_affiliation_strings":["Deep Learning Lab, Beijing Institute of Big Data Research, Peking University","MOE Key Lab of Computational Linguistics, School of EECS, Peking University"],"affiliations":[{"raw_affiliation_string":"Deep Learning Lab, Beijing Institute of Big Data Research, Peking University","institution_ids":["https://openalex.org/I4210096250","https://openalex.org/I20231570"]},{"raw_affiliation_string":"MOE Key Lab of Computational Linguistics, School of EECS, Peking University","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5000258378"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":7.22003404,"has_fulltext":true,"cited_by_count":74,"citation_normalized_percentile":{"value":0.97335165,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1304","last_page":"1312"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.84388267993927},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8280807137489319},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.7779077887535095},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.7255255579948425},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6970710754394531},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.629368007183075},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.5456108450889587},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5323140025138855},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4285699129104614},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.41502711176872253},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4063856601715088},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.1293032467365265},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.10530805587768555},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08791062235832214}],"concepts":[{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.84388267993927},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8280807137489319},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.7779077887535095},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.7255255579948425},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6970710754394531},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.629368007183075},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.5456108450889587},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5323140025138855},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4285699129104614},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.41502711176872253},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4063856601715088},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.1293032467365265},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.10530805587768555},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08791062235832214},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/p19-1125","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1125","pdf_url":"https://www.aclweb.org/anthology/P19-1125.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/p19-1125","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p19-1125","pdf_url":"https://www.aclweb.org/anthology/P19-1125.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.5600000023841858,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2962915948.pdf","grobid_xml":"https://content.openalex.org/works/W2962915948.grobid-xml"},"referenced_works_count":26,"referenced_works":["https://openalex.org/W1757796397","https://openalex.org/W1916559533","https://openalex.org/W2064675550","https://openalex.org/W2072128103","https://openalex.org/W2130942839","https://openalex.org/W2145339207","https://openalex.org/W2153653739","https://openalex.org/W2157331557","https://openalex.org/W2518578398","https://openalex.org/W2595715041","https://openalex.org/W2767206889","https://openalex.org/W2789543585","https://openalex.org/W2890501761","https://openalex.org/W2892213699","https://openalex.org/W2962784628","https://openalex.org/W2962969034","https://openalex.org/W2963403868","https://openalex.org/W2963434219","https://openalex.org/W2963536265","https://openalex.org/W2963736842","https://openalex.org/W2964074409","https://openalex.org/W3211848854","https://openalex.org/W4231109964","https://openalex.org/W4241645538","https://openalex.org/W4298857966","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2935909890","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W1531601525","https://openalex.org/W2883671469"],"abstract_inverted_index":{"Non-autoregressive":[0],"translation":[1,49,54,85],"models":[2],"(NAT)":[3],"have":[4],"achieved":[5],"impressive":[6],"inference":[7,99],"speedup.":[8],"A":[9],"potential":[10],"issue":[11],"of":[12,105],"the":[13,20,47,65,79,84,89,103],"existing":[14],"NAT":[15],"algorithms,":[16],"however,":[17],"is":[18,22],"that":[19],"decoding":[21],"conducted":[23],"in":[24,96],"parallel,":[25],"without":[26],"directly":[27],"considering":[28],"previous":[29],"context.":[30],"In":[31],"this":[32],"paper,":[33],"we":[34,101],"propose":[35],"an":[36],"imitation":[37],"learning":[38],"framework":[39],"for":[40],"non-autoregressive":[41],"machine":[42],"translation,":[43],"which":[44],"still":[45],"enjoys":[46],"fast":[48],"speed":[50],"but":[51],"gives":[52],"comparable":[53,87],"performance":[55,104],"compared":[56],"to":[57,88],"its":[58],"auto-regressive":[59],"counterpart.":[60],"We":[61],"conduct":[62],"experiments":[63],"on":[64,108,114],"IWSLT16,":[66],"WMT14":[67],"and":[68,111],"WMT16":[69,109],"datasets.":[70],"Our":[71],"proposed":[72],"model":[73],"achieves":[74],"a":[75],"significant":[76],"speedup":[77],"over":[78],"autoregressive":[80,90],"models,":[81],"while":[82],"keeping":[83],"quality":[86],"models.":[91],"By":[92],"sampling":[93],"sentence":[94],"length":[95],"parallel":[97],"at":[98],"time,":[100],"achieve":[102],"31.85":[106],"BLEU":[107,113],"Ro\u2192En":[110],"30.68":[112],"IWSLT16":[115],"En\u2192De.":[116]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":16},{"year":2022,"cited_by_count":10},{"year":2021,"cited_by_count":19},{"year":2020,"cited_by_count":15},{"year":2019,"cited_by_count":3}],"updated_date":"2026-02-05T00:54:17.221276","created_date":"2025-10-10T00:00:00"}
