{"id":"https://openalex.org/W2294543795","doi":"https://doi.org/10.21437/interspeech.2013-552","title":"Restructuring of deep neural network acoustic models with singular value decomposition","display_name":"Restructuring of deep neural network acoustic models with singular value decomposition","publication_year":2013,"publication_date":"2013-08-25","ids":{"openalex":"https://openalex.org/W2294543795","doi":"https://doi.org/10.21437/interspeech.2013-552","mag":"2294543795"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2013-552","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2013-552","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2013","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100763213","display_name":"Jian Xue","orcid":"https://orcid.org/0000-0002-9460-802X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jian Xue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100365053","display_name":"Jinyu Li","orcid":"https://orcid.org/0000-0002-1089-9748"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jinyu Li","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101928537","display_name":"Yifan Gong","orcid":"https://orcid.org/0000-0002-3912-097X"},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yifan Gong","raw_affiliation_strings":["(Microsoft)"],"affiliations":[{"raw_affiliation_string":"(Microsoft)","institution_ids":["https://openalex.org/I4210164937"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100763213"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":54.3825,"has_fulltext":false,"cited_by_count":430,"citation_normalized_percentile":{"value":0.99893119,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"2365","last_page":"2369"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7554571628570557},{"id":"https://openalex.org/keywords/singular-value-decomposition","display_name":"Singular value decomposition","score":0.7463869452476501},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6378222703933716},{"id":"https://openalex.org/keywords/restructuring","display_name":"Restructuring","score":0.6207583546638489},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5684874057769775},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.5430490374565125},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5109859704971313},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.483737975358963},{"id":"https://openalex.org/keywords/singular-value","display_name":"Singular value","score":0.44718611240386963},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.44030922651290894},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.43972620368003845}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7554571628570557},{"id":"https://openalex.org/C22789450","wikidata":"https://www.wikidata.org/wiki/Q420904","display_name":"Singular value decomposition","level":2,"score":0.7463869452476501},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6378222703933716},{"id":"https://openalex.org/C45237549","wikidata":"https://www.wikidata.org/wiki/Q1376796","display_name":"Restructuring","level":2,"score":0.6207583546638489},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5684874057769775},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.5430490374565125},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5109859704971313},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.483737975358963},{"id":"https://openalex.org/C109282560","wikidata":"https://www.wikidata.org/wiki/Q4166054","display_name":"Singular value","level":3,"score":0.44718611240386963},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.44030922651290894},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.43972620368003845},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2013-552","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2013-552","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2013","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6299999952316284,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W587794757","https://openalex.org/W1969067576","https://openalex.org/W1987238397","https://openalex.org/W1993882792","https://openalex.org/W2076794394","https://openalex.org/W2105099419","https://openalex.org/W2112984492","https://openalex.org/W2123237149","https://openalex.org/W2125964738","https://openalex.org/W2147768505","https://openalex.org/W2394932179","https://openalex.org/W2403195671","https://openalex.org/W2465562739"],"related_works":["https://openalex.org/W4319586039","https://openalex.org/W4382583540","https://openalex.org/W1607100495","https://openalex.org/W2147072251","https://openalex.org/W1990844505","https://openalex.org/W2148568324","https://openalex.org/W4386721910","https://openalex.org/W4378770618","https://openalex.org/W2164147222","https://openalex.org/W2038393145"],"abstract_inverted_index":{"Recently":[0],"proposed":[1,132,153],"deep":[2,171],"neural":[3,172],"network":[4],"(DNN)":[5],"obtains":[6],"significant":[7],"accuracy":[8,66,106,122],"improvements":[9],"in":[10,42,78],"many":[11],"large":[12],"vocabulary":[13],"continuous":[14],"speech":[15],"recognition":[16],"(LVCSR)":[17],"tasks.":[18],"However,":[19],"DNN":[20,41,56,100,127,143,158],"requires":[21],"much":[22],"more":[23,162],"parameters":[24],"than":[25,163],"traditional":[26],"systems,":[27],"which":[28],"brings":[29],"huge":[30],"cost":[31],"during":[32],"online":[33],"evaluation,":[34],"and":[35,80],"also":[36,109],"limits":[37],"the":[38,60,65,75,83,87,91,99,111,115,121,126,152,157],"application":[39],"of":[40,45,90],"a":[43],"lot":[44],"scenarios.":[46],"In":[47],"this":[48],"paper":[49],"we":[50,96],"present":[51],"our":[52],"new":[53],"effort":[54],"on":[55,74,86,137],"aiming":[57],"at":[58],"reducing":[59,125],"model":[61,84,101,113,128,146,159,177],"size":[62,102,129,160],"while":[63],"keeping":[64],"improvements.":[67],"We":[68,108],"apply":[69],"singular":[70,174],"value":[71,175],"decomposition":[72],"(SVD)":[73],"weight":[76],"matrices":[77],"DNN,":[79],"then":[81],"restructure":[82],"based":[85],"inherent":[88],"sparseness":[89],"original":[92],"matrices.":[93],"After":[94],"restructuring":[95,178],"can":[97],"reduce":[98],"significantly":[103],"with":[104,141],"negligible":[105],"loss.":[107],"fine-tune":[110],"restructured":[112],"using":[114],"regular":[116],"back-propagation":[117],"method":[118,133],"to":[119],"get":[120],"back":[123],"when":[124],"heavily.":[130],"The":[131],"has":[134],"been":[135],"evaluated":[136],"two":[138],"LVCSR":[139],"tasks,":[140],"context-dependent":[142],"hidden":[144],"Markov":[145],"(CD-DNN-HMM).":[147],"Experimental":[148],"results":[149],"show":[150],"that":[151],"approach":[154],"dramatically":[155],"reduces":[156],"by":[161],"80%":[164],"without":[165],"losing":[166],"any":[167],"accuracy.":[168],"Index":[169],"Terms:":[170],"network,":[173],"decomposition,":[176]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":26},{"year":2022,"cited_by_count":22},{"year":2021,"cited_by_count":40},{"year":2020,"cited_by_count":51},{"year":2019,"cited_by_count":50},{"year":2018,"cited_by_count":68},{"year":2017,"cited_by_count":42},{"year":2016,"cited_by_count":50},{"year":2015,"cited_by_count":36},{"year":2014,"cited_by_count":20},{"year":2013,"cited_by_count":4}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
