{"id":"https://openalex.org/W2577366047","doi":"https://doi.org/10.21437/interspeech.2017-343","title":"Towards Better Decoding and Language Model Integration in Sequence to Sequence Models","display_name":"Towards Better Decoding and Language Model Integration in Sequence to Sequence Models","publication_year":2017,"publication_date":"2017-08-16","ids":{"openalex":"https://openalex.org/W2577366047","doi":"https://doi.org/10.21437/interspeech.2017-343","mag":"2577366047"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2017-343","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2017-343","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2017","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5000408865","display_name":"Jan Chorowski","orcid":"https://orcid.org/0000-0002-1570-7610"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jan Chorowski","raw_affiliation_strings":["Google Brain Google Inc. Mountain View, CA 94043, USA"],"affiliations":[{"raw_affiliation_string":"Google Brain Google Inc. Mountain View, CA 94043, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112445699","display_name":"Navdeep Jaitly","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Navdeep Jaitly","raw_affiliation_strings":["Google Brain Google Inc. Mountain View, CA 94043, USA"],"affiliations":[{"raw_affiliation_string":"Google Brain Google Inc. Mountain View, CA 94043, USA","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5000408865"],"corresponding_institution_ids":["https://openalex.org/I1291425158"],"apc_list":null,"apc_paid":null,"fwci":34.7325,"has_fulltext":false,"cited_by_count":330,"citation_normalized_percentile":{"value":0.99743281,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"523","last_page":"527"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.7851332426071167},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.7291349768638611},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7106620073318481},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.49595198035240173},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.48783209919929504},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43162208795547485},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.21627700328826904},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.06043422222137451}],"concepts":[{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.7851332426071167},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.7291349768638611},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7106620073318481},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.49595198035240173},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.48783209919929504},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43162208795547485},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.21627700328826904},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.06043422222137451},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2017-343","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2017-343","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2017","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.44999998807907104,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W854541894","https://openalex.org/W1522301498","https://openalex.org/W1524333225","https://openalex.org/W1582482241","https://openalex.org/W1736701665","https://openalex.org/W1855892484","https://openalex.org/W1902237438","https://openalex.org/W1915251500","https://openalex.org/W1922655562","https://openalex.org/W1993411524","https://openalex.org/W2024539680","https://openalex.org/W2102113734","https://openalex.org/W2109886035","https://openalex.org/W2130942839","https://openalex.org/W2133564696","https://openalex.org/W2160815625","https://openalex.org/W2163605009","https://openalex.org/W2183341477","https://openalex.org/W2193413348","https://openalex.org/W2271840356","https://openalex.org/W2345474290","https://openalex.org/W2361821140","https://openalex.org/W2525778437","https://openalex.org/W2530876040","https://openalex.org/W2952288254","https://openalex.org/W2952746495","https://openalex.org/W2962792802","https://openalex.org/W2963158258","https://openalex.org/W2963260202","https://openalex.org/W2963572611","https://openalex.org/W2963620441","https://openalex.org/W2964043796","https://openalex.org/W4255949318","https://openalex.org/W4297798436"],"related_works":["https://openalex.org/W3203142394","https://openalex.org/W4302615923","https://openalex.org/W2351061015","https://openalex.org/W4220731478","https://openalex.org/W2017509870","https://openalex.org/W4360952157","https://openalex.org/W2153647085","https://openalex.org/W2383083288","https://openalex.org/W2161474341","https://openalex.org/W3192589309"],"abstract_inverted_index":{"The":[0],"recently":[1],"proposed":[2],"Sequence-to-Sequence":[3],"(seq2seq)":[4],"framework":[5],"advocates":[6],"replacing":[7],"complex":[8],"data":[9],"processing":[10],"pipelines,":[11],"such":[12],"as":[13],"an":[14,27,34],"entire":[15],"automatic":[16],"speech":[17,37],"recognition":[18,38],"system,":[19],"with":[20,94],"a":[21,54,95],"single":[22],"neural":[23],"network":[24],"trained":[25],"in":[26,50],"end-to-end":[28],"fashion.In":[29],"this":[30],"contribution,":[31],"we":[32,88,99],"analyse":[33],"attention-based":[35],"seq2seq":[36],"system":[39],"that":[40],"directly":[41],"transcribes":[42],"recordings":[43],"into":[44],"characters.We":[45],"observe":[46],"two":[47],"shortcomings:":[48],"overconfidence":[49],"its":[51],"predictions":[52],"and":[53],"tendency":[55],"to":[56,68],"produce":[57],"incomplete":[58],"transcriptions":[59],"when":[60],"language":[61,86,97],"models":[62,87],"are":[63],"used.We":[64],"propose":[65],"practical":[66],"solutions":[67],"both":[69],"problems":[70],"achieving":[71],"competitive":[72],"speaker":[73],"independent":[74],"word":[75],"error":[76],"rates":[77],"on":[78],"the":[79],"Wall":[80],"Street":[81],"Journal":[82],"dataset:":[83],"without":[84],"separate":[85],"reach":[89,100],"10.6%":[90],"WER,":[91],"while":[92],"together":[93],"trigram":[96],"model,":[98],"6.7%":[101],"WER.":[102]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":14},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":38},{"year":2022,"cited_by_count":24},{"year":2021,"cited_by_count":74},{"year":2020,"cited_by_count":80},{"year":2019,"cited_by_count":45},{"year":2018,"cited_by_count":34},{"year":2017,"cited_by_count":7}],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2025-10-10T00:00:00"}
