{"id":"https://openalex.org/W1602122992","doi":"https://doi.org/10.1109/icassp.2016.7472809","title":"Recurrent neural network training with dark knowledge transfer","display_name":"Recurrent neural network training with dark knowledge transfer","publication_year":2016,"publication_date":"2016-03-01","ids":{"openalex":"https://openalex.org/W1602122992","doi":"https://doi.org/10.1109/icassp.2016.7472809","mag":"1602122992"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2016.7472809","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2016.7472809","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1505.04630","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056437232","display_name":"Zhiyuan Tang","orcid":"https://orcid.org/0000-0002-3786-7690"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhiyuan Tang","raw_affiliation_strings":["Center for Speech and Language Technologies (CSLT), RIIT, Tsinghua University","Chengdu Institute of Computer Applications, Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Center for Speech and Language Technologies (CSLT), RIIT, Tsinghua University","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Chengdu Institute of Computer Applications, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100391442","display_name":"Dong Wang","orcid":"https://orcid.org/0000-0002-0545-6205"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dong Wang","raw_affiliation_strings":["Center for Speech and Language Technologies (CSLT), RIIT, Tsinghua University","Tsinghua National Laboratory for Information Science and Technology"],"affiliations":[{"raw_affiliation_string":"Center for Speech and Language Technologies (CSLT), RIIT, Tsinghua University","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Tsinghua National Laboratory for Information Science and Technology","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100352621","display_name":"Zhiyong Zhang","orcid":"https://orcid.org/0000-0003-3061-7768"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Zhang","raw_affiliation_strings":["Center for Speech and Language Technologies (CSLT), RIIT, Tsinghua University","Tsinghua National Laboratory for Information Science and Technology"],"affiliations":[{"raw_affiliation_string":"Center for Speech and Language Technologies (CSLT), RIIT, Tsinghua University","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Tsinghua National Laboratory for Information Science and Technology","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5056437232"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":19.9962,"has_fulltext":false,"cited_by_count":109,"citation_normalized_percentile":{"value":0.99275162,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"5900","last_page":"5904"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.5613999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.5613999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.13850000500679016,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.057999998331069946,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.9002631902694702},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8277414441108704},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.7235296368598938},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6873779296875},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6661427021026611},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6486976146697998},{"id":"https://openalex.org/keywords/knowledge-transfer","display_name":"Knowledge transfer","score":0.5346060991287231},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5057621002197266},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.4841654896736145},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4702058434486389},{"id":"https://openalex.org/keywords/long-short-term-memory","display_name":"Long short term memory","score":0.4610113501548767},{"id":"https://openalex.org/keywords/time-delay-neural-network","display_name":"Time delay neural network","score":0.4335392415523529},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.4256702661514282},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.42141348123550415},{"id":"https://openalex.org/keywords/transfer","display_name":"Transfer (computing)","score":0.42030027508735657}],"concepts":[{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.9002631902694702},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8277414441108704},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.7235296368598938},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6873779296875},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6661427021026611},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6486976146697998},{"id":"https://openalex.org/C2776960227","wikidata":"https://www.wikidata.org/wiki/Q2586354","display_name":"Knowledge transfer","level":2,"score":0.5346060991287231},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5057621002197266},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.4841654896736145},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4702058434486389},{"id":"https://openalex.org/C133488467","wikidata":"https://www.wikidata.org/wiki/Q6673524","display_name":"Long short term memory","level":4,"score":0.4610113501548767},{"id":"https://openalex.org/C175202392","wikidata":"https://www.wikidata.org/wiki/Q2434543","display_name":"Time delay neural network","level":3,"score":0.4335392415523529},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.4256702661514282},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.42141348123550415},{"id":"https://openalex.org/C2776175482","wikidata":"https://www.wikidata.org/wiki/Q1195816","display_name":"Transfer (computing)","level":2,"score":0.42030027508735657},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icassp.2016.7472809","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2016.7472809","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1505.04630","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1505.04630","pdf_url":"https://arxiv.org/pdf/1505.04630","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1505.04630","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1505.04630","pdf_url":"https://arxiv.org/pdf/1505.04630","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7900000214576721}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W104184427","https://openalex.org/W196761320","https://openalex.org/W1408639475","https://openalex.org/W1498436455","https://openalex.org/W1524333225","https://openalex.org/W1690739335","https://openalex.org/W1821462560","https://openalex.org/W2063224314","https://openalex.org/W2064675550","https://openalex.org/W2076063813","https://openalex.org/W2079735306","https://openalex.org/W2100495367","https://openalex.org/W2102113734","https://openalex.org/W2107878631","https://openalex.org/W2110798204","https://openalex.org/W2118706537","https://openalex.org/W2123585936","https://openalex.org/W2125964738","https://openalex.org/W2134797427","https://openalex.org/W2136933783","https://openalex.org/W2138857742","https://openalex.org/W2143612262","https://openalex.org/W2147768505","https://openalex.org/W2150341604","https://openalex.org/W2160815625","https://openalex.org/W2293634267","https://openalex.org/W2294370754","https://openalex.org/W2402040300","https://openalex.org/W2403787182","https://openalex.org/W4205947740","https://openalex.org/W6604254268","https://openalex.org/W6608133726","https://openalex.org/W6628131027","https://openalex.org/W6631362777","https://openalex.org/W6637551013","https://openalex.org/W6638523607","https://openalex.org/W6675365184","https://openalex.org/W6676481782","https://openalex.org/W6679909955","https://openalex.org/W6680300913","https://openalex.org/W6680549991","https://openalex.org/W6696934422","https://openalex.org/W6712847557"],"related_works":["https://openalex.org/W2912153778","https://openalex.org/W4387163678","https://openalex.org/W4288108708","https://openalex.org/W2109916967","https://openalex.org/W2973430807","https://openalex.org/W4385280324","https://openalex.org/W2890685186","https://openalex.org/W2984436043","https://openalex.org/W4390245176","https://openalex.org/W2912831041"],"abstract_inverted_index":{"Recurrent":[0],"neural":[1,74,115],"networks":[2],"(RNNs),":[3],"particularly":[4],"long":[5],"short-term":[6],"memory":[7],"(LSTM),":[8],"have":[9,22],"gained":[10],"much":[11],"attention":[12],"in":[13],"automatic":[14],"speech":[15],"recognition":[16],"(ASR).":[17],"Although":[18],"some":[19],"successful":[20],"stories":[21],"been":[23,69],"reported,":[24],"training":[25,33,178],"RNNs":[26,109,173],"remains":[27],"highly":[28],"challenging,":[29],"especially":[30],"with":[31,76,176],"limited":[32,177],"data.":[34,179],"Recent":[35],"research":[36,130],"found":[37],"that":[38,81,89,156],"a":[39,46,77,87,113],"well-trained":[40],"model":[41,61,118],"can":[42,85,171],"be":[43,142],"used":[44],"as":[45,62,119],"teacher":[47,60,137],"to":[48,71,92,107,141],"train":[49,72,108,172],"other":[50],"child":[51,146],"models,":[52],"by":[53,58,94],"using":[54,112],"the":[55,59,82,102,120,128,136,145,166],"predictions":[56],"generated":[57],"supervision.":[63],"This":[64,122],"knowledge":[65,103,132],"transfer":[66,104,133],"learning":[67,105,167],"has":[68],"employed":[70],"simple":[73],"nets":[75],"complex":[78],"one,":[79],"so":[80],"final":[83],"performance":[84],"reach":[86],"level":[88],"is":[90,123,139],"infeasible":[91],"obtain":[93],"regular":[95],"training.":[96],"In":[97],"this":[98,169],"paper,":[99],"we":[100],"employ":[101],"approach":[106,170],"(precisely":[110],"LSTM)":[111],"deep":[114],"network":[116],"(DNN)":[117,138],"teacher.":[121],"different":[124],"from":[125],"most":[126],"of":[127],"existing":[129],"on":[131,151,165],"learning,":[134],"since":[135],"assumed":[140],"weaker":[143],"than":[144],"(RNN);":[147],"however,":[148],"our":[149],"experiments":[150],"an":[152],"ASR":[153],"task":[154],"showed":[155],"it":[157],"works":[158],"fairly":[159],"well:":[160],"without":[161],"applying":[162],"any":[163],"tricks":[164],"scheme,":[168],"successfully":[174],"even":[175]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":15},{"year":2020,"cited_by_count":24},{"year":2019,"cited_by_count":18},{"year":2018,"cited_by_count":15},{"year":2017,"cited_by_count":10},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":5}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
