{"id":"https://openalex.org/W2500968368","doi":"https://doi.org/10.21437/odyssey.2016-13","title":"Investigation of Senone-based Long-Short Term Memory RNNs for Spoken Language Recognition","display_name":"Investigation of Senone-based Long-Short Term Memory RNNs for Spoken Language Recognition","publication_year":2016,"publication_date":"2016-06-21","ids":{"openalex":"https://openalex.org/W2500968368","doi":"https://doi.org/10.21437/odyssey.2016-13","mag":"2500968368"},"language":"en","primary_location":{"id":"doi:10.21437/odyssey.2016-13","is_oa":true,"landing_page_url":"https://doi.org/10.21437/odyssey.2016-13","pdf_url":"https://www.isca-archive.org/odyssey_2016/tian16_odyssey.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Speaker and Language Recognition Workshop (Odyssey 2016)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.isca-archive.org/odyssey_2016/tian16_odyssey.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100571324","display_name":"Yao Tian","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yao Tian","raw_affiliation_strings":["National Laboratory for Information Science and Technology, Department of Electronic Engineering, Tsinghua University, Beijing 100084, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory for Information Science and Technology, Department of Electronic Engineering, Tsinghua University, Beijing 100084, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049944728","display_name":"Liang He","orcid":"https://orcid.org/0000-0003-4076-7479"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang He","raw_affiliation_strings":["National Laboratory for Information Science and Technology, Department of Electronic Engineering, Tsinghua University, Beijing 100084, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory for Information Science and Technology, Department of Electronic Engineering, Tsinghua University, Beijing 100084, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100330560","display_name":"Yi Liu","orcid":"https://orcid.org/0000-0002-6741-6815"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Liu","raw_affiliation_strings":["National Laboratory for Information Science and Technology, Department of Electronic Engineering, Tsinghua University, Beijing 100084, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory for Information Science and Technology, Department of Electronic Engineering, Tsinghua University, Beijing 100084, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100409741","display_name":"Jia Liu","orcid":"https://orcid.org/0000-0003-0383-0934"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jia Liu","raw_affiliation_strings":["National Laboratory for Information Science and Technology, Department of Electronic Engineering, Tsinghua University, Beijing 100084, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory for Information Science and Technology, Department of Electronic Engineering, Tsinghua University, Beijing 100084, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100571324"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":4.4361,"has_fulltext":true,"cited_by_count":17,"citation_normalized_percentile":{"value":0.95055498,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"89","last_page":"93"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9905999898910522,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spoken-language","display_name":"Spoken language","score":0.7577202916145325},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.751431941986084},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.690832257270813},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5540581345558167},{"id":"https://openalex.org/keywords/long-short-term-memory","display_name":"Long short term memory","score":0.5454895496368408},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5304426550865173},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47310495376586914},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.40967002511024475},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.08187082409858704}],"concepts":[{"id":"https://openalex.org/C2776230583","wikidata":"https://www.wikidata.org/wiki/Q1322198","display_name":"Spoken language","level":2,"score":0.7577202916145325},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.751431941986084},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.690832257270813},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5540581345558167},{"id":"https://openalex.org/C133488467","wikidata":"https://www.wikidata.org/wiki/Q6673524","display_name":"Long short term memory","level":4,"score":0.5454895496368408},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5304426550865173},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47310495376586914},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.40967002511024475},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.08187082409858704},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/odyssey.2016-13","is_oa":true,"landing_page_url":"https://doi.org/10.21437/odyssey.2016-13","pdf_url":"https://www.isca-archive.org/odyssey_2016/tian16_odyssey.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Speaker and Language Recognition Workshop (Odyssey 2016)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.21437/odyssey.2016-13","is_oa":true,"landing_page_url":"https://doi.org/10.21437/odyssey.2016-13","pdf_url":"https://www.isca-archive.org/odyssey_2016/tian16_odyssey.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Speaker and Language Recognition Workshop (Odyssey 2016)","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.5199999809265137}],"awards":[{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2201735945","display_name":null,"funder_award_id":"61273268","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2571867183","display_name":null,"funder_award_id":"61370034","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4665116016","display_name":null,"funder_award_id":"61403224","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6058138561","display_name":null,"funder_award_id":", No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7726157001","display_name":null,"funder_award_id":"Grant No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8863666567","display_name":null,"funder_award_id":"and No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2500968368.pdf","grobid_xml":"https://content.openalex.org/works/W2500968368.grobid-xml"},"referenced_works_count":14,"referenced_works":["https://openalex.org/W1970088388","https://openalex.org/W2046056978","https://openalex.org/W2104457544","https://openalex.org/W2123237149","https://openalex.org/W2147768505","https://openalex.org/W2150769028","https://openalex.org/W2153181479","https://openalex.org/W2160815625","https://openalex.org/W2175575774","https://openalex.org/W2189248916","https://openalex.org/W2293634267","https://openalex.org/W2340176088","https://openalex.org/W2406392101","https://openalex.org/W2408021097"],"related_works":["https://openalex.org/W2912153778","https://openalex.org/W4387163678","https://openalex.org/W4288108708","https://openalex.org/W2973430807","https://openalex.org/W4385280324","https://openalex.org/W2890685186","https://openalex.org/W2984436043","https://openalex.org/W4390245176","https://openalex.org/W2912831041","https://openalex.org/W3173606726"],"abstract_inverted_index":{"Recently,":[0],"the":[1,31,37,40,48,59,64,90,93,101,114,119,122],"integration":[2],"of":[3,30,44,121],"deep":[4],"neural":[5],"networks":[6],"(DNNs)":[7],"trained":[8],"to":[9,51,82,99,104],"predict":[10],"senone":[11],"posteriors":[12],"with":[13,39],"conventional":[14,94],"language":[15,24],"modeling":[16],"methods":[17],"has":[18],"been":[19],"proved":[20],"effective":[21],"for":[22,85,108],"spoken":[23],"recognition.":[25],"This":[26],"work":[27],"extends":[28],"some":[29],"senone-based":[32],"DNN":[33,38],"frameworks":[34],"by":[35],"replacing":[36],"LSTM":[41,49,65,102],"RNN.":[42],"Two":[43],"these":[45],"approaches":[46],"use":[47,100],"RNN":[50,66,103],"generate":[52],"features.":[53],"The":[54],"features":[55,71,74],"are":[56,76],"extracted":[57],"from":[58],"recurrent":[60],"projection":[61],"layer":[62],"in":[63,79],"either":[67],"as":[68],"frame-level":[69],"acoustic":[70],"or":[72],"utterance-level":[73],"and":[75],"then":[77],"processed":[78],"different":[80],"ways":[81],"produce":[83,105],"scores":[84],"each":[86],"target":[87],"language.":[88],"In":[89],"third":[91],"approach,":[92],"i-vector":[95],"model":[96],"is":[97],"modified":[98],"frame":[106],"alignments":[107],"sufficient":[109],"statistics":[110],"extraction.":[111],"Experiments":[112],"on":[113],"NIST":[115],"LRE":[116],"2015":[117],"demonstrate":[118],"effectiveness":[120],"proposed":[123],"methods.":[124]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":1}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
