{"id":"https://openalex.org/W2086677518","doi":"https://doi.org/10.1109/apsipa.2014.7041556","title":"Noisy speech recognition using blind spatial subtraction array technique and deep bottleneck features","display_name":"Noisy speech recognition using blind spatial subtraction array technique and deep bottleneck features","publication_year":2014,"publication_date":"2014-12-01","ids":{"openalex":"https://openalex.org/W2086677518","doi":"https://doi.org/10.1109/apsipa.2014.7041556","mag":"2086677518"},"language":"en","primary_location":{"id":"doi:10.1109/apsipa.2014.7041556","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipa.2014.7041556","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Signal and Information Processing Association Annual Summit and Conference (APSIPA), 2014 Asia-Pacific","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077234015","display_name":"Norihide Kitaoka","orcid":"https://orcid.org/0000-0003-2028-8585"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Norihide Kitaoka","raw_affiliation_strings":["Nagoya Unviersity"],"affiliations":[{"raw_affiliation_string":"Nagoya Unviersity","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078778981","display_name":"Tomoki Hayashi","orcid":"https://orcid.org/0000-0001-8782-4093"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tomoki Hayashi","raw_affiliation_strings":["Nagoya Unviersity"],"affiliations":[{"raw_affiliation_string":"Nagoya Unviersity","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042118446","display_name":"Kazuya Takeda","orcid":"https://orcid.org/0000-0002-0330-1787"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kazuya Takeda","raw_affiliation_strings":["Nagoya Unviersity"],"affiliations":[{"raw_affiliation_string":"Nagoya Unviersity","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5077234015"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.27213328,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.5881122,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.8156616687774658},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.7824243903160095},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7634782791137695},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7225168943405151},{"id":"https://openalex.org/keywords/background-subtraction","display_name":"Background subtraction","score":0.6238261461257935},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5678315162658691},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5505101084709167},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5348407626152039},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.49708059430122375},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.48625385761260986},{"id":"https://openalex.org/keywords/subtraction","display_name":"Subtraction","score":0.46755966544151306},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.46170857548713684},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4176490604877472},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.41433730721473694},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.41137710213661194},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.24008789658546448},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10457807779312134},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.08982962369918823}],"concepts":[{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.8156616687774658},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.7824243903160095},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7634782791137695},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7225168943405151},{"id":"https://openalex.org/C32653426","wikidata":"https://www.wikidata.org/wiki/Q3813641","display_name":"Background subtraction","level":3,"score":0.6238261461257935},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5678315162658691},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5505101084709167},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5348407626152039},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.49708059430122375},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.48625385761260986},{"id":"https://openalex.org/C68060419","wikidata":"https://www.wikidata.org/wiki/Q40754","display_name":"Subtraction","level":2,"score":0.46755966544151306},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.46170857548713684},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4176490604877472},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.41433730721473694},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.41137710213661194},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.24008789658546448},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10457807779312134},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.08982962369918823},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.0},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipa.2014.7041556","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipa.2014.7041556","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Signal and Information Processing Association Annual Summit and Conference (APSIPA), 2014 Asia-Pacific","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320334789","display_name":"Japan Science and Technology Agency","ror":"https://ror.org/00097mb19"},{"id":"https://openalex.org/F4320338075","display_name":"Core Research for Evolutional Science and Technology","ror":"https://ror.org/00097mb19"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W46366292","https://openalex.org/W72347498","https://openalex.org/W1510095622","https://openalex.org/W2005522781","https://openalex.org/W2099741732","https://openalex.org/W2128653836","https://openalex.org/W2130432819","https://openalex.org/W2136922672","https://openalex.org/W2137429825","https://openalex.org/W2159485234","https://openalex.org/W2161742217","https://openalex.org/W4238331734","https://openalex.org/W4247773827","https://openalex.org/W4310638450","https://openalex.org/W6602935006"],"related_works":["https://openalex.org/W2018086531","https://openalex.org/W1980297060","https://openalex.org/W2387604097","https://openalex.org/W2373675101","https://openalex.org/W4385672897","https://openalex.org/W106160982","https://openalex.org/W2359140082","https://openalex.org/W2074132948","https://openalex.org/W2160511961","https://openalex.org/W2066371342"],"abstract_inverted_index":{"In":[0],"this":[1],"study,":[2],"we":[3],"investigate":[4],"the":[5,19,56,66,71,90],"effect":[6],"of":[7,21,55,73,82,92],"blind":[8],"spatial":[9],"subtraction":[10],"arrays":[11],"(BSSA)":[12],"on":[13,38],"speech":[14,95],"recognition":[15],"systems":[16],"by":[17,63],"comparing":[18],"performance":[20,54,72],"a":[22,30],"method":[23,31],"using":[24,32],"Mel-Frequency":[25],"Cepstral":[26],"Coefficients":[27],"(MFCCs)":[28],"with":[29],"Deep":[33,39],"Bottleneck":[34],"Features":[35],"(DBNF)":[36],"based":[37],"Neural":[40],"Networks":[41],"(DNN).":[42],"Performance":[43],"is":[44],"evaluated":[45],"under":[46],"various":[47],"conditions,":[48],"including":[49],"noisy,":[50],"in-vehicle":[51],"conditions.":[52],"Although":[53],"DBNF-based":[57],"system":[58],"was":[59,85],"much":[60],"more":[61],"degraded":[62],"noise":[64],"than":[65],"MFCC-based":[67],"system,":[68],"BSSA":[69,93],"improved":[70],"both":[74],"methods":[75],"greatly,":[76],"especially":[77],"when":[78],"matched":[79],"condition":[80],"training":[81],"acoustic":[83],"models":[84],"employed.":[86],"These":[87],"results":[88],"show":[89],"effectiveness":[91],"for":[94],"recognition.":[96]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
