{"id":"https://openalex.org/W2799923439","doi":"https://doi.org/10.18653/v1/p18-4022","title":"RETURNN as a Generic Flexible Neural Toolkit with Application to Translation and Speech Recognition","display_name":"RETURNN as a Generic Flexible Neural Toolkit with Application to Translation and Speech Recognition","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2799923439","doi":"https://doi.org/10.18653/v1/p18-4022","mag":"2799923439"},"language":"en","primary_location":{"id":"doi:10.18653/v1/p18-4022","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p18-4022","pdf_url":"https://www.aclweb.org/anthology/P18-4022.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of ACL 2018, System Demonstrations","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/P18-4022.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059521407","display_name":"Albert Zeyer","orcid":"https://orcid.org/0000-0002-6655-671X"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Albert Zeyer","raw_affiliation_strings":["NNAISENSE, Switzerland,","Human Language Technology and Pattern Recognition Group RWTH Aachen University, Aachen, Germany,","www.apptek.com/,","AppTek, USA, http://"],"affiliations":[{"raw_affiliation_string":"NNAISENSE, Switzerland,","institution_ids":[]},{"raw_affiliation_string":"Human Language Technology and Pattern Recognition Group RWTH Aachen University, Aachen, Germany,","institution_ids":["https://openalex.org/I887968799"]},{"raw_affiliation_string":"www.apptek.com/,","institution_ids":[]},{"raw_affiliation_string":"AppTek, USA, http://","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081695539","display_name":"Tamer Alkhouli","orcid":null},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Tamer Alkhouli","raw_affiliation_strings":["Human Language Technology and Pattern Recognition Group RWTH Aachen University, Aachen, Germany,","www.apptek.com/,","AppTek, USA, http://"],"affiliations":[{"raw_affiliation_string":"Human Language Technology and Pattern Recognition Group RWTH Aachen University, Aachen, Germany,","institution_ids":["https://openalex.org/I887968799"]},{"raw_affiliation_string":"www.apptek.com/,","institution_ids":[]},{"raw_affiliation_string":"AppTek, USA, http://","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112501010","display_name":"Hermann Ney","orcid":null},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Hermann Ney","raw_affiliation_strings":["Human Language Technology and Pattern Recognition Group RWTH Aachen University, Aachen, Germany,","AppTek, USA, http://","www.apptek.com/,"],"affiliations":[{"raw_affiliation_string":"Human Language Technology and Pattern Recognition Group RWTH Aachen University, Aachen, Germany,","institution_ids":["https://openalex.org/I887968799"]},{"raw_affiliation_string":"AppTek, USA, http://","institution_ids":[]},{"raw_affiliation_string":"www.apptek.com/,","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5059521407"],"corresponding_institution_ids":["https://openalex.org/I887968799"],"apc_list":null,"apc_paid":null,"fwci":9.8149,"has_fulltext":true,"cited_by_count":77,"citation_normalized_percentile":{"value":0.98362665,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"128","last_page":"133"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8709719181060791},{"id":"https://openalex.org/keywords/generality","display_name":"Generality","score":0.69828200340271},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.6521064043045044},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6117600798606873},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.56849205493927},{"id":"https://openalex.org/keywords/translation","display_name":"Translation (biology)","score":0.5626557469367981},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.5532363653182983},{"id":"https://openalex.org/keywords/machine-translation","display_name":"Machine translation","score":0.5372189879417419},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5330656170845032},{"id":"https://openalex.org/keywords/beam-search","display_name":"Beam search","score":0.5082663893699646},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.43713024258613586},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.4239041805267334},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.4215604364871979},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.37254178524017334},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.13716661930084229},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.11498740315437317},{"id":"https://openalex.org/keywords/search-algorithm","display_name":"Search algorithm","score":0.11055505275726318}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8709719181060791},{"id":"https://openalex.org/C2780767217","wikidata":"https://www.wikidata.org/wiki/Q5532421","display_name":"Generality","level":2,"score":0.69828200340271},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.6521064043045044},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6117600798606873},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.56849205493927},{"id":"https://openalex.org/C149364088","wikidata":"https://www.wikidata.org/wiki/Q185917","display_name":"Translation (biology)","level":4,"score":0.5626557469367981},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.5532363653182983},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.5372189879417419},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5330656170845032},{"id":"https://openalex.org/C19889080","wikidata":"https://www.wikidata.org/wiki/Q2835852","display_name":"Beam search","level":3,"score":0.5082663893699646},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.43713024258613586},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.4239041805267334},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.4215604364871979},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.37254178524017334},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.13716661930084229},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.11498740315437317},{"id":"https://openalex.org/C125583679","wikidata":"https://www.wikidata.org/wiki/Q755673","display_name":"Search algorithm","level":2,"score":0.11055505275726318},{"id":"https://openalex.org/C105580179","wikidata":"https://www.wikidata.org/wiki/Q188928","display_name":"Messenger RNA","level":3,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C542102704","wikidata":"https://www.wikidata.org/wiki/Q183257","display_name":"Psychotherapist","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.18653/v1/p18-4022","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p18-4022","pdf_url":"https://www.aclweb.org/anthology/P18-4022.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of ACL 2018, System Demonstrations","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1805.05225","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1805.05225","pdf_url":"https://arxiv.org/pdf/1805.05225","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.18653/v1/p18-4022","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p18-4022","pdf_url":"https://www.aclweb.org/anthology/P18-4022.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of ACL 2018, System Demonstrations","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.4000000059604645}],"awards":[{"id":"https://openalex.org/G4956428346","display_name":null,"funder_award_id":"Horizon 2020 research and innovatio","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G5036817778","display_name":null,"funder_award_id":"European Union's Horizon 2020 research and innov","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G5106512922","display_name":null,"funder_award_id":"Deutsche Forschungsgemeinschaft (DFG","funder_id":"https://openalex.org/F4320320879","funder_display_name":"Deutsche Forschungsgemeinschaft"},{"id":"https://openalex.org/G7366229540","display_name":"A Sequence Classification Framework for Human Language Technology","funder_award_id":"694537","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G7842005466","display_name":null,"funder_award_id":"Horizon 2020","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8633428685","display_name":null,"funder_award_id":"European Union's Horizon 2020 research and innovat","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320320879","display_name":"Deutsche Forschungsgemeinschaft","ror":"https://ror.org/018mejw64"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2799923439.pdf","grobid_xml":"https://content.openalex.org/works/W2799923439.grobid-xml"},"referenced_works_count":46,"referenced_works":["https://openalex.org/W648786980","https://openalex.org/W1522301498","https://openalex.org/W1922655562","https://openalex.org/W2133564696","https://openalex.org/W2137550424","https://openalex.org/W2183341477","https://openalex.org/W2186615578","https://openalex.org/W2384495648","https://openalex.org/W2408504891","https://openalex.org/W2410539690","https://openalex.org/W2471933213","https://openalex.org/W2527845440","https://openalex.org/W2573601984","https://openalex.org/W2575312266","https://openalex.org/W2594229957","https://openalex.org/W2604132379","https://openalex.org/W2606134370","https://openalex.org/W2626778328","https://openalex.org/W2685242699","https://openalex.org/W2738440736","https://openalex.org/W2743473392","https://openalex.org/W2748816379","https://openalex.org/W2755954992","https://openalex.org/W2758605572","https://openalex.org/W2773723600","https://openalex.org/W2778814079","https://openalex.org/W2884561390","https://openalex.org/W2916986993","https://openalex.org/W2950304420","https://openalex.org/W2952688536","https://openalex.org/W2962728618","https://openalex.org/W2962784628","https://openalex.org/W2963260202","https://openalex.org/W2963266252","https://openalex.org/W2963351448","https://openalex.org/W2963403868","https://openalex.org/W2963418779","https://openalex.org/W2963747784","https://openalex.org/W2964121744","https://openalex.org/W2964190861","https://openalex.org/W2964308564","https://openalex.org/W3082674894","https://openalex.org/W4297683868","https://openalex.org/W4297747548","https://openalex.org/W4297825688","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W2045049461","https://openalex.org/W1978893398","https://openalex.org/W2201908702","https://openalex.org/W4381094582","https://openalex.org/W2369625323","https://openalex.org/W2364579609","https://openalex.org/W1977906818","https://openalex.org/W1522139108","https://openalex.org/W2353528968","https://openalex.org/W3204412157"],"abstract_inverted_index":{"We":[0,29,65,77],"compare":[1],"the":[2,71,87],"fast":[3,17,23,96],"training":[4,62],"and":[5,21,46,105],"decoding":[6],"speed":[7],"of":[8,10,92,116],"RETURNN":[9,93],"attention":[11,38],"models":[12,39,68],"for":[13,36,83],"translation,":[14],"due":[15],"to":[16,49,100,109],"CUDA":[18],"LSTM":[19],"kernels,":[20],"a":[22,32,95,113],"pure":[24],"Tensor-Flow":[25],"beam":[26],"search":[27],"decoder.":[28],"show":[30],"that":[31],"layer-wise":[33],"pretraining":[34],"scheme":[35],"recurrent":[37,52],"gives":[40],"over":[41],"1%":[42],"BLEU":[43,61],"improvement":[44],"absolute":[45],"it":[47,111],"allows":[48,94,108],"train":[50],"deeper":[51],"encoder":[53],"networks.":[54],"Promising":[55],"preliminary":[56],"results":[57,82],"on":[58,70,86,112],"max.":[59],"expected":[60],"are":[63],"presented.":[64],"obtain":[66],"state-of-the-art":[67],"trained":[69],"WMT":[72],"2017":[73],"GermanEnglish":[74],"translation":[75],"task.":[76,89],"also":[78],"present":[79],"end-to-end":[80],"model":[81],"speech":[84],"recognition":[85],"Switchboard":[88],"The":[90],"flexibility":[91],"research":[97],"feedback":[98],"loop":[99],"experiment":[101],"with":[102],"alternative":[103],"architectures,":[104],"its":[106],"generality":[107],"use":[110],"wide":[114],"range":[115],"applications.":[117]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":18},{"year":2020,"cited_by_count":20},{"year":2019,"cited_by_count":18},{"year":2018,"cited_by_count":2}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2018-05-17T00:00:00"}
