{"id":"https://openalex.org/W2606436965","doi":"https://doi.org/10.1109/hscma.2017.7895555","title":"An extended experimental investigation of DNN uncertainty propagation for noise robust ASR","display_name":"An extended experimental investigation of DNN uncertainty propagation for noise robust ASR","publication_year":2017,"publication_date":"2017-01-01","ids":{"openalex":"https://openalex.org/W2606436965","doi":"https://doi.org/10.1109/hscma.2017.7895555","mag":"2606436965"},"language":"en","primary_location":{"id":"doi:10.1109/hscma.2017.7895555","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hscma.2017.7895555","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 Hands-free Speech Communications and Microphone Arrays (HSCMA)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107339473","display_name":"Karan Nathwani","orcid":"https://orcid.org/0000-0003-2531-0411"},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en informatique et en automatique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1294671590"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Karan Nathwani","raw_affiliation_strings":["CNRS, France","Inria, France","Universit\u00e9 de Lorraine, France"],"affiliations":[{"raw_affiliation_string":"CNRS, France","institution_ids":["https://openalex.org/I1294671590"]},{"raw_affiliation_string":"Inria, France","institution_ids":["https://openalex.org/I1326498283"]},{"raw_affiliation_string":"Universit\u00e9 de Lorraine, France","institution_ids":["https://openalex.org/I90183372"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068044087","display_name":"Juan A. Morales-Cordovilla","orcid":"https://orcid.org/0000-0001-5411-5952"},"institutions":[{"id":"https://openalex.org/I173304897","display_name":"Universidad de Granada","ror":"https://ror.org/04njjy449","country_code":"ES","type":"education","lineage":["https://openalex.org/I173304897"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Juan A. Morales-Cordovilla","raw_affiliation_strings":["Dept. of TSTC, Universidad de Granada, Spain"],"affiliations":[{"raw_affiliation_string":"Dept. of TSTC, Universidad de Granada, Spain","institution_ids":["https://openalex.org/I173304897"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113968312","display_name":"Sunit Sivasankaran","orcid":null},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en informatique et en automatique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Sunit Sivasankaran","raw_affiliation_strings":["CNRS, France","Inria, France","Universit\u00e9 de Lorraine, France"],"affiliations":[{"raw_affiliation_string":"CNRS, France","institution_ids":["https://openalex.org/I1294671590"]},{"raw_affiliation_string":"Inria, France","institution_ids":["https://openalex.org/I1326498283"]},{"raw_affiliation_string":"Universit\u00e9 de Lorraine, France","institution_ids":["https://openalex.org/I90183372"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073463405","display_name":"Irina Illina","orcid":"https://orcid.org/0000-0003-2598-4643"},"institutions":[{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]},{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en informatique et en automatique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1294671590"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Irina Illina","raw_affiliation_strings":["CNRS, France","Inria, France","Universit\u00e9 de Lorraine, France"],"affiliations":[{"raw_affiliation_string":"CNRS, France","institution_ids":["https://openalex.org/I1294671590"]},{"raw_affiliation_string":"Inria, France","institution_ids":["https://openalex.org/I1326498283"]},{"raw_affiliation_string":"Universit\u00e9 de Lorraine, France","institution_ids":["https://openalex.org/I90183372"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065635001","display_name":"Emmanuel Vincent","orcid":"https://orcid.org/0000-0002-0183-7289"},"institutions":[{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]},{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en informatique et en automatique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1294671590"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Emmanuel Vincent","raw_affiliation_strings":["CNRS, France","Inria, France","Universit\u00e9 de Lorraine, France"],"affiliations":[{"raw_affiliation_string":"CNRS, France","institution_ids":["https://openalex.org/I1294671590"]},{"raw_affiliation_string":"Inria, France","institution_ids":["https://openalex.org/I1326498283"]},{"raw_affiliation_string":"Universit\u00e9 de Lorraine, France","institution_ids":["https://openalex.org/I90183372"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5107339473"],"corresponding_institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I90183372"],"apc_list":null,"apc_paid":null,"fwci":0.9327,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.74635608,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"26","last_page":"30"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/estimator","display_name":"Estimator","score":0.8185477256774902},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7091894745826721},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.6483737230300903},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.585598349571228},{"id":"https://openalex.org/keywords/propagation-of-uncertainty","display_name":"Propagation of uncertainty","score":0.5779062509536743},{"id":"https://openalex.org/keywords/backpropagation","display_name":"Backpropagation","score":0.5430601835250854},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.5020663738250732},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.4862907826900482},{"id":"https://openalex.org/keywords/noise-measurement","display_name":"Noise measurement","score":0.4611966609954834},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4477901756763458},{"id":"https://openalex.org/keywords/noisy-data","display_name":"Noisy data","score":0.42281508445739746},{"id":"https://openalex.org/keywords/signal-to-noise-ratio","display_name":"Signal-to-noise ratio (imaging)","score":0.42235666513442993},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4215741455554962},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3770620822906494},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3634297847747803},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.30544131994247437},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.16628578305244446},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.16501948237419128},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.1111757755279541},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.06632307171821594}],"concepts":[{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.8185477256774902},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7091894745826721},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.6483737230300903},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.585598349571228},{"id":"https://openalex.org/C123614077","wikidata":"https://www.wikidata.org/wiki/Q1364905","display_name":"Propagation of uncertainty","level":2,"score":0.5779062509536743},{"id":"https://openalex.org/C155032097","wikidata":"https://www.wikidata.org/wiki/Q798503","display_name":"Backpropagation","level":3,"score":0.5430601835250854},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.5020663738250732},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.4862907826900482},{"id":"https://openalex.org/C29265498","wikidata":"https://www.wikidata.org/wiki/Q7047719","display_name":"Noise measurement","level":3,"score":0.4611966609954834},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4477901756763458},{"id":"https://openalex.org/C2781170535","wikidata":"https://www.wikidata.org/wiki/Q30587856","display_name":"Noisy data","level":2,"score":0.42281508445739746},{"id":"https://openalex.org/C13944312","wikidata":"https://www.wikidata.org/wiki/Q7512748","display_name":"Signal-to-noise ratio (imaging)","level":2,"score":0.42235666513442993},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4215741455554962},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3770620822906494},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3634297847747803},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.30544131994247437},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.16628578305244446},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.16501948237419128},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.1111757755279541},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.06632307171821594},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hscma.2017.7895555","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hscma.2017.7895555","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 Hands-free Speech Communications and Microphone Arrays (HSCMA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320313934","display_name":"Institut national de recherche en informatique et en automatique (INRIA)","ror":"https://ror.org/02kvxyf05"},{"id":"https://openalex.org/F4320316512","display_name":"Bpifrance","ror":"https://ror.org/008zkt807"},{"id":"https://openalex.org/F4320322892","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W74241614","https://openalex.org/W109381481","https://openalex.org/W1492775261","https://openalex.org/W1524333225","https://openalex.org/W1981755271","https://openalex.org/W1981817333","https://openalex.org/W1989389005","https://openalex.org/W2013969331","https://openalex.org/W2020934227","https://openalex.org/W2045607566","https://openalex.org/W2060778387","https://openalex.org/W2063273764","https://openalex.org/W2066086651","https://openalex.org/W2077297191","https://openalex.org/W2083180245","https://openalex.org/W2100046100","https://openalex.org/W2106889843","https://openalex.org/W2111093880","https://openalex.org/W2126622418","https://openalex.org/W2145475542","https://openalex.org/W2148575186","https://openalex.org/W2158273884","https://openalex.org/W2235761953","https://openalex.org/W2256662675","https://openalex.org/W2402467380","https://openalex.org/W2403445744","https://openalex.org/W2559260703","https://openalex.org/W2559809918","https://openalex.org/W2584063687","https://openalex.org/W2683320792","https://openalex.org/W6602998950","https://openalex.org/W6629448772","https://openalex.org/W6631362777","https://openalex.org/W6692374192","https://openalex.org/W6713273328","https://openalex.org/W6732766861","https://openalex.org/W6740347751"],"related_works":["https://openalex.org/W2803237185","https://openalex.org/W2963735582","https://openalex.org/W3113301541","https://openalex.org/W1682666007","https://openalex.org/W1575623062","https://openalex.org/W1522341235","https://openalex.org/W4288260397","https://openalex.org/W1989345694","https://openalex.org/W1927374526","https://openalex.org/W2296110145"],"abstract_inverted_index":{"Automatic":[0],"speech":[1,23],"recognition":[2],"(ASR)":[3],"in":[4,45,67,149],"noisy":[5,52],"environments":[6],"remains":[7],"a":[8,55,97],"challenging":[9],"goal.":[10],"Recently,":[11],"the":[12,16,19,43,46,71,116,139,147,155,163,168],"idea":[13],"of":[14,58,74],"estimating":[15],"uncertainty":[17,59,81,90,101,108,126,141],"about":[18],"features":[20],"obtained":[21],"after":[22],"enhancement":[24],"and":[25,88,103,118,134,137,167],"propagating":[26],"it":[27,105,160],"to":[28,78],"dynamically":[29],"adapt":[30],"deep":[31],"neural":[32,98],"network":[33,99],"(DNN)":[34],"based":[35,100],"acoustic":[36],"models":[37],"has":[38],"raised":[39],"some":[40],"interest.":[41],"However,":[42],"results":[44,114],"literature":[47],"were":[48],"reported":[49],"on":[50,115,124,132,162],"simulated":[51,135],"datasets":[53],"for":[54,84],"limited":[56],"variety":[57],"estimators.":[60,109],"We":[61,110,121,151],"found":[62],"that":[63,138,154],"they":[64],"vary":[65],"significantly":[66,144],"different":[68,85,89],"conditions.":[69],"Hence,":[70],"main":[72],"contribution":[73],"this":[75],"work":[76],"is":[77,157],"assess":[79],"DNN":[80],"decoding":[82],"performance":[83],"data":[86,136],"conditions":[87],"estimation/propagation":[91],"techniques.":[92],"In":[93],"addition,":[94],"we":[95],"propose":[96],"estimator":[102,142],"compare":[104],"with":[106],"other":[107],"report":[111],"detailed":[112],"ASR":[113],"CHiME-2":[117],"CHiME-3":[119],"datasets.":[120],"find":[122,153],"that,":[123],"average,":[125],"propagation":[127],"provides":[128],"similar":[129],"relative":[130],"improvement":[131,156],"real":[133],"proposed":[140],"performs":[143],"better":[145],"than":[146],"one":[148],"[1].":[150],"also":[152],"consistent,":[158],"but":[159],"depends":[161],"signal-to-noise":[164],"ratio":[165],"(SNR)":[166],"noise":[169],"environment.":[170]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2}],"updated_date":"2026-04-17T18:11:37.981687","created_date":"2025-10-10T00:00:00"}
