{"id":"https://openalex.org/W1982774639","doi":"https://doi.org/10.1109/jstsp.2014.2364559","title":"A Real-Time End-to-End Multilingual Speech Recognition Architecture","display_name":"A Real-Time End-to-End Multilingual Speech Recognition Architecture","publication_year":2014,"publication_date":"2014-10-23","ids":{"openalex":"https://openalex.org/W1982774639","doi":"https://doi.org/10.1109/jstsp.2014.2364559","mag":"1982774639"},"language":"en","primary_location":{"id":"doi:10.1109/jstsp.2014.2364559","is_oa":true,"landing_page_url":"https://doi.org/10.1109/jstsp.2014.2364559","pdf_url":"https://ieeexplore.ieee.org/ielx7/4200690/7105973/06935076.pdf","source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://ieeexplore.ieee.org/ielx7/4200690/7105973/06935076.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089369295","display_name":"Javier G\u00f3nzalez-Dom\u00ednguez","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I63634437","display_name":"Universidad Aut\u00f3noma de Madrid","ror":"https://ror.org/01cby8j38","country_code":"ES","type":"education","lineage":["https://openalex.org/I63634437"]}],"countries":["ES","US"],"is_corresponding":false,"raw_author_name":"Javier Gonzalez-Dominguez","raw_affiliation_strings":["ATVS Biometric Recognition Group, Madrid, Spain","Google Inc., Universidad Autonoma de Madrid, Madrid"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"ATVS Biometric Recognition Group, Madrid, Spain","institution_ids":[]},{"raw_affiliation_string":"Google Inc., Universidad Autonoma de Madrid, Madrid","institution_ids":["https://openalex.org/I63634437","https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055160122","display_name":"David Eustis","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David Eustis","raw_affiliation_strings":["Google Inc, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Inc, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050898122","display_name":"Ignacio L\u00f3pez Moreno","orcid":"https://orcid.org/0000-0002-0900-3473"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ignacio Lopez-Moreno","raw_affiliation_strings":["Google Inc, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Inc, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079708487","display_name":"Andrew Senior","orcid":"https://orcid.org/0000-0002-2401-5691"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrew Senior","raw_affiliation_strings":["Google Inc, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Inc, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110711540","display_name":"Fran\u00e7oise Beaufays","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Francoise Beaufays","raw_affiliation_strings":["Google Inc, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Inc, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103874391","display_name":"Pedro J. Moreno","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pedro J. Moreno","raw_affiliation_strings":["Google Inc, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Google Inc, USA","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.652,"has_fulltext":true,"cited_by_count":52,"citation_normalized_percentile":{"value":0.94814554,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"9","issue":"4","first_page":"749","last_page":"759"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8675335645675659},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6148785352706909},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.613968014717102},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.5601617097854614},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.5562713146209717},{"id":"https://openalex.org/keywords/spoken-language","display_name":"Spoken language","score":0.5149708390235901},{"id":"https://openalex.org/keywords/end-user","display_name":"End user","score":0.4482630491256714},{"id":"https://openalex.org/keywords/low-latency","display_name":"Low latency (capital markets)","score":0.4366295635700226},{"id":"https://openalex.org/keywords/obstacle","display_name":"Obstacle","score":0.41058894991874695},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3860224783420563},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36254483461380005},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.11002650856971741},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.08255976438522339},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.07779783010482788}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8675335645675659},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6148785352706909},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.613968014717102},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.5601617097854614},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.5562713146209717},{"id":"https://openalex.org/C2776230583","wikidata":"https://www.wikidata.org/wiki/Q1322198","display_name":"Spoken language","level":2,"score":0.5149708390235901},{"id":"https://openalex.org/C91262260","wikidata":"https://www.wikidata.org/wiki/Q528074","display_name":"End user","level":2,"score":0.4482630491256714},{"id":"https://openalex.org/C46637626","wikidata":"https://www.wikidata.org/wiki/Q6693015","display_name":"Low latency (capital markets)","level":2,"score":0.4366295635700226},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.41058894991874695},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3860224783420563},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36254483461380005},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.11002650856971741},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.08255976438522339},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.07779783010482788},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/jstsp.2014.2364559","is_oa":true,"landing_page_url":"https://doi.org/10.1109/jstsp.2014.2364559","pdf_url":"https://ieeexplore.ieee.org/ielx7/4200690/7105973/06935076.pdf","source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1109/jstsp.2014.2364559","is_oa":true,"landing_page_url":"https://doi.org/10.1109/jstsp.2014.2364559","pdf_url":"https://ieeexplore.ieee.org/ielx7/4200690/7105973/06935076.pdf","source":{"id":"https://openalex.org/S42167783","display_name":"IEEE Journal of Selected Topics in Signal Processing","issn_l":"1932-4553","issn":["1932-4553","1941-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Journal of Selected Topics in Signal Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.550000011920929}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W1982774639.pdf","grobid_xml":"https://content.openalex.org/works/W1982774639.grobid-xml"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W77790951","https://openalex.org/W587794757","https://openalex.org/W1236994949","https://openalex.org/W1516433687","https://openalex.org/W1529116532","https://openalex.org/W1537735731","https://openalex.org/W1978660892","https://openalex.org/W1993882792","https://openalex.org/W1994631938","https://openalex.org/W2017269134","https://openalex.org/W2035846950","https://openalex.org/W2056119007","https://openalex.org/W2072128103","https://openalex.org/W2078953162","https://openalex.org/W2093866254","https://openalex.org/W2108582047","https://openalex.org/W2108978495","https://openalex.org/W2132424367","https://openalex.org/W2139081859","https://openalex.org/W2150769028","https://openalex.org/W2154607443","https://openalex.org/W2160815625","https://openalex.org/W2168231600","https://openalex.org/W2294962864","https://openalex.org/W2340176088","https://openalex.org/W2604272474","https://openalex.org/W3123753580","https://openalex.org/W4214739450","https://openalex.org/W6617368339","https://openalex.org/W6628027437","https://openalex.org/W6631959037","https://openalex.org/W6676404333","https://openalex.org/W6697031438","https://openalex.org/W6703974891","https://openalex.org/W6910631608"],"related_works":["https://openalex.org/W3205411230","https://openalex.org/W4286899009","https://openalex.org/W3163341049","https://openalex.org/W9168048","https://openalex.org/W4300849822","https://openalex.org/W4376480820","https://openalex.org/W3155891479","https://openalex.org/W3029351463","https://openalex.org/W2885352820","https://openalex.org/W4296591952"],"abstract_inverted_index":{"Automatic":[0],"speech":[1,40],"recognition":[2,119],"(ASR)":[3],"systems":[4],"are":[5,69],"used":[6],"daily":[7],"by":[8],"millions":[9],"of":[10,38,46,62,98,112],"people":[11],"worldwide":[12],"to":[13,21,55,71,94,116],"dictate":[14],"messages,":[15],"control":[16],"devices,":[17],"initiate":[18],"searches":[19],"or":[20],"facilitate":[22],"data":[23],"input":[24],"in":[25,31,66,105],"small":[26],"devices.":[27],"The":[28],"user":[29],"experience":[30],"these":[32],"scenarios":[33],"depends":[34],"on":[35,43],"the":[36,39,44,47,59],"quality":[37],"transcriptions":[41],"and":[42,87,108,121],"responsiveness":[45],"system.":[48,128],"For":[49],"multilingual":[50],"users,":[51],"a":[52,72,109,126],"further":[53],"obstacle":[54],"natural":[56],"interaction":[57],"is":[58],"monolingual":[60,127],"character":[61],"many":[63],"ASR":[64,84],"systems,":[65],"which":[67],"users":[68,93],"constrained":[70],"single":[73],"preset":[74],"language.":[75],"In":[76],"this":[77],"work,":[78],"we":[79],"present":[80],"an":[81],"end-to-end":[82],"multi-language":[83],"architecture,":[85],"developed":[86],"deployed":[88],"at":[89],"Google,":[90],"that":[91],"allows":[92],"select":[95],"arbitrary":[96],"combinations":[97],"spoken":[99],"languages.":[100],"We":[101],"leverage":[102],"recent":[103],"advances":[104],"language":[106,114],"identification":[107],"novel":[110],"method":[111],"real-time":[113],"selection":[115],"achieve":[117],"similar":[118],"accuracy":[120],"nearly-identical":[122],"latency":[123],"characteristics":[124],"as":[125]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":9},{"year":2018,"cited_by_count":6},{"year":2017,"cited_by_count":7},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
