{"id":"https://openalex.org/W1984541135","doi":"https://doi.org/10.1109/icassp.2013.6639345","title":"Recent advances in deep learning for speech research at Microsoft","display_name":"Recent advances in deep learning for speech research at Microsoft","publication_year":2013,"publication_date":"2013-05-01","ids":{"openalex":"https://openalex.org/W1984541135","doi":"https://doi.org/10.1109/icassp.2013.6639345","mag":"1984541135"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2013.6639345","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2013.6639345","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100671324","display_name":"Li Deng","orcid":"https://orcid.org/0000-0002-1014-0790"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Li Deng","raw_affiliation_strings":["Microsoft Corporation, Redmond, WA, USA","Microsoft Corporation Redmond,WA,USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation Redmond,WA,USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100365053","display_name":"Jinyu Li","orcid":"https://orcid.org/0000-0002-1089-9748"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jinyu Li","raw_affiliation_strings":["Microsoft Corporation, Redmond, WA, USA","Microsoft Corporation Redmond,WA,USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation Redmond,WA,USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045413298","display_name":"Jui-Ting Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jui-Ting Huang","raw_affiliation_strings":["Microsoft Corporation, Redmond, WA, USA","Microsoft Corporation Redmond,WA,USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation Redmond,WA,USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103119755","display_name":"Kaisheng Yao","orcid":"https://orcid.org/0000-0002-8949-9367"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kaisheng Yao","raw_affiliation_strings":["Microsoft Corporation, Redmond, WA, USA","Microsoft Corporation Redmond,WA,USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation Redmond,WA,USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034476404","display_name":"Dong Yu","orcid":"https://orcid.org/0000-0003-0520-6844"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dong Yu","raw_affiliation_strings":["Microsoft Corporation, Redmond, WA, USA","Microsoft Corporation Redmond,WA,USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation Redmond,WA,USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072932051","display_name":"Frank Seide","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Frank Seide","raw_affiliation_strings":["Microsoft Corporation, Redmond, WA, USA","Microsoft Corporation Redmond,WA,USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation Redmond,WA,USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041313589","display_name":"Michael L. Seltzer","orcid":"https://orcid.org/0000-0003-3474-2451"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael Seltzer","raw_affiliation_strings":["Microsoft Corporation, Redmond, WA, USA","Microsoft Corporation Redmond,WA,USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation Redmond,WA,USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064903487","display_name":"Geoff Zweig","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Geoff Zweig","raw_affiliation_strings":["Microsoft Corporation, Redmond, WA, USA","Microsoft Corporation Redmond,WA,USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation Redmond,WA,USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101727205","display_name":"Xiaodong He","orcid":"https://orcid.org/0000-0002-9463-9168"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaodong He","raw_affiliation_strings":["Microsoft Corporation, Redmond, WA, USA","Microsoft Corporation Redmond,WA,USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation Redmond,WA,USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103246485","display_name":"J. D. Williams","orcid":"https://orcid.org/0000-0003-2460-9673"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jason Williams","raw_affiliation_strings":["Microsoft Corporation, Redmond, WA, USA","Microsoft Corporation Redmond,WA,USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation Redmond,WA,USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101928537","display_name":"Yifan Gong","orcid":"https://orcid.org/0000-0002-3912-097X"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yifan Gong","raw_affiliation_strings":["Microsoft Corporation, Redmond, WA, USA","Microsoft Corporation Redmond,WA,USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation Redmond,WA,USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111957484","display_name":"Alex Acero","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alex Acero","raw_affiliation_strings":["Microsoft Corporation, Redmond, WA, USA","Microsoft Corporation Redmond,WA,USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Microsoft Corporation Redmond,WA,USA","institution_ids":["https://openalex.org/I1290206253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5100671324"],"corresponding_institution_ids":["https://openalex.org/I1290206253"],"apc_list":null,"apc_paid":null,"fwci":88.468,"has_fulltext":false,"cited_by_count":804,"citation_normalized_percentile":{"value":0.99958606,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"8604","last_page":"8608"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8160018920898438},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5986735820770264},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5939184427261353},{"id":"https://openalex.org/keywords/strengths-and-weaknesses","display_name":"Strengths and weaknesses","score":0.5807219743728638},{"id":"https://openalex.org/keywords/mainstream","display_name":"Mainstream","score":0.4917064309120178},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46441003680229187},{"id":"https://openalex.org/keywords/speech-technology","display_name":"Speech technology","score":0.4430136978626251},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.433695912361145},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.38979262113571167},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3406432271003723},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.334242582321167},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.09170663356781006}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8160018920898438},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5986735820770264},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5939184427261353},{"id":"https://openalex.org/C63882131","wikidata":"https://www.wikidata.org/wiki/Q17122954","display_name":"Strengths and weaknesses","level":2,"score":0.5807219743728638},{"id":"https://openalex.org/C2777617010","wikidata":"https://www.wikidata.org/wiki/Q18957","display_name":"Mainstream","level":2,"score":0.4917064309120178},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46441003680229187},{"id":"https://openalex.org/C504749915","wikidata":"https://www.wikidata.org/wiki/Q9010971","display_name":"Speech technology","level":3,"score":0.4430136978626251},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.433695912361145},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.38979262113571167},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3406432271003723},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.334242582321167},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.09170663356781006},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C27206212","wikidata":"https://www.wikidata.org/wiki/Q34178","display_name":"Theology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icassp.2013.6639345","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2013.6639345","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE International Conference on Acoustics, Speech and Signal Processing","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.306.5800","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.306.5800","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://research.microsoft.com/pubs/188864/ICASSP-2013-OverviewMSRDeepLearning.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.6600000262260437}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":71,"referenced_works":["https://openalex.org/W47568227","https://openalex.org/W84880661","https://openalex.org/W179875071","https://openalex.org/W217970951","https://openalex.org/W319941341","https://openalex.org/W1218987319","https://openalex.org/W1537275613","https://openalex.org/W1904365287","https://openalex.org/W1978516841","https://openalex.org/W1978660892","https://openalex.org/W1987238397","https://openalex.org/W1989549063","https://openalex.org/W1994935303","https://openalex.org/W1999965501","https://openalex.org/W2013598660","https://openalex.org/W2025198378","https://openalex.org/W2026445738","https://openalex.org/W2028825255","https://openalex.org/W2036242736","https://openalex.org/W2062164080","https://openalex.org/W2069999512","https://openalex.org/W2074818733","https://openalex.org/W2087006792","https://openalex.org/W2093028810","https://openalex.org/W2095168618","https://openalex.org/W2106347453","https://openalex.org/W2108563286","https://openalex.org/W2108597378","https://openalex.org/W2108817613","https://openalex.org/W2111539083","https://openalex.org/W2112739286","https://openalex.org/W2112984492","https://openalex.org/W2114486181","https://openalex.org/W2118497033","https://openalex.org/W2120209245","https://openalex.org/W2125964738","https://openalex.org/W2130414229","https://openalex.org/W2137782235","https://openalex.org/W2138742901","https://openalex.org/W2139113820","https://openalex.org/W2139622435","https://openalex.org/W2141778357","https://openalex.org/W2147768505","https://openalex.org/W2149600041","https://openalex.org/W2155273149","https://openalex.org/W2160620631","https://openalex.org/W2160815625","https://openalex.org/W2161742217","https://openalex.org/W2162042984","https://openalex.org/W2163922914","https://openalex.org/W2168013545","https://openalex.org/W2168231600","https://openalex.org/W2171723947","https://openalex.org/W2171928131","https://openalex.org/W2184045248","https://openalex.org/W2184188583","https://openalex.org/W2394932179","https://openalex.org/W2403195671","https://openalex.org/W2405047074","https://openalex.org/W2407441242","https://openalex.org/W6601939441","https://openalex.org/W6603374476","https://openalex.org/W6608710415","https://openalex.org/W6653897473","https://openalex.org/W6656619859","https://openalex.org/W6679053740","https://openalex.org/W6680634817","https://openalex.org/W6684010798","https://openalex.org/W6684859321","https://openalex.org/W6685285290","https://openalex.org/W6686207219"],"related_works":["https://openalex.org/W2099475353","https://openalex.org/W1966028611","https://openalex.org/W2568050604","https://openalex.org/W2048673468","https://openalex.org/W3107456284","https://openalex.org/W642007152","https://openalex.org/W3110551121","https://openalex.org/W2105439218","https://openalex.org/W2145680368","https://openalex.org/W4250500033"],"abstract_inverted_index":{"Deep":[0],"learning":[1,50],"is":[2],"becoming":[3],"a":[4],"mainstream":[5],"technology":[6],"for":[7],"speech":[8,25,69,75],"recognition":[9,76],"at":[10],"industrial":[11],"scale.":[12],"In":[13],"this":[14,30,54],"paper,":[15],"we":[16],"provide":[17],"an":[18],"overview":[19,55],"of":[20,46,97,106],"the":[21,41,47,57,64,93,98,102],"work":[22],"by":[23],"Microsoft":[24],"researchers":[26],"since":[27],"2009":[28],"in":[29,101],"area,":[31],"focusing":[32],"on":[33],"more":[34],"recent":[35],"advances":[36],"which":[37],"shed":[38],"light":[39],"to":[40,63,67,89],"basic":[42],"capabilities":[43],"and":[44,59,77,84,91,95,109],"limitations":[45],"current":[48],"deep":[49],"technology.":[51],"We":[52],"organize":[53],"along":[56],"feature-domain":[58],"model-domain":[60],"dimensions":[61],"according":[62],"conventional":[65],"approach":[66],"analyzing":[68],"systems.":[70],"Selected":[71],"experimental":[72],"results,":[73],"including":[74],"related":[78],"applications":[79],"such":[80],"as":[81],"spoken":[82],"dialogue":[83],"language":[85],"modeling,":[86],"are":[87,113],"presented":[88],"demonstrate":[90],"analyze":[92],"strengths":[94],"weaknesses":[96],"techniques":[99,108],"described":[100],"paper.":[103],"Potential":[104],"improvement":[105],"these":[107],"future":[110],"research":[111],"directions":[112],"discussed.":[114]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":17},{"year":2024,"cited_by_count":19},{"year":2023,"cited_by_count":71},{"year":2022,"cited_by_count":56},{"year":2021,"cited_by_count":68},{"year":2020,"cited_by_count":94},{"year":2019,"cited_by_count":117},{"year":2018,"cited_by_count":106},{"year":2017,"cited_by_count":75},{"year":2016,"cited_by_count":57},{"year":2015,"cited_by_count":66},{"year":2014,"cited_by_count":43},{"year":2013,"cited_by_count":13},{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
