{"id":"https://openalex.org/W2999908512","doi":"https://doi.org/10.1109/ic3ina48034.2019.8949593","title":"Generalized Filter-bank Features for Robust Speech Recognition Against Reverberation","display_name":"Generalized Filter-bank Features for Robust Speech Recognition Against Reverberation","publication_year":2019,"publication_date":"2019-10-01","ids":{"openalex":"https://openalex.org/W2999908512","doi":"https://doi.org/10.1109/ic3ina48034.2019.8949593","mag":"2999908512"},"language":"en","primary_location":{"id":"doi:10.1109/ic3ina48034.2019.8949593","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ic3ina48034.2019.8949593","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 International Conference on Computer, Control, Informatics and its Applications (IC3INA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018559332","display_name":"Hilman F. Pardede","orcid":"https://orcid.org/0000-0001-8078-7592"},"institutions":[{"id":"https://openalex.org/I19128659","display_name":"Indonesian Institute of Sciences","ror":"https://ror.org/03d7c1451","country_code":"ID","type":"facility","lineage":["https://openalex.org/I19128659"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Hilman F. Pardede","raw_affiliation_strings":["Research Center for Informatics, Indonesian Institute of Sciences, Bandung, Indonesia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Research Center for Informatics, Indonesian Institute of Sciences, Bandung, Indonesia","institution_ids":["https://openalex.org/I19128659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010533917","display_name":"Vicky Zilvan","orcid":"https://orcid.org/0000-0001-7896-5804"},"institutions":[{"id":"https://openalex.org/I19128659","display_name":"Indonesian Institute of Sciences","ror":"https://ror.org/03d7c1451","country_code":"ID","type":"facility","lineage":["https://openalex.org/I19128659"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Vicky Zilvan","raw_affiliation_strings":["Research Center for Informatics, Indonesian Institute of Sciences, Bandung, Indonesia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Research Center for Informatics, Indonesian Institute of Sciences, Bandung, Indonesia","institution_ids":["https://openalex.org/I19128659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009423697","display_name":"Dikdik Krisnandi","orcid":"https://orcid.org/0000-0003-1611-9631"},"institutions":[{"id":"https://openalex.org/I19128659","display_name":"Indonesian Institute of Sciences","ror":"https://ror.org/03d7c1451","country_code":"ID","type":"facility","lineage":["https://openalex.org/I19128659"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Dikdik Krisnandi","raw_affiliation_strings":["Research Center for Informatics, Indonesian Institute of Sciences, Bandung, Indonesia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Research Center for Informatics, Indonesian Institute of Sciences, Bandung, Indonesia","institution_ids":["https://openalex.org/I19128659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082845858","display_name":"Ana Heryana","orcid":"https://orcid.org/0000-0002-3907-3835"},"institutions":[{"id":"https://openalex.org/I19128659","display_name":"Indonesian Institute of Sciences","ror":"https://ror.org/03d7c1451","country_code":"ID","type":"facility","lineage":["https://openalex.org/I19128659"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Ana Heryana","raw_affiliation_strings":["Research Center for Informatics, Indonesian Institute of Sciences, Bandung, Indonesia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Research Center for Informatics, Indonesian Institute of Sciences, Bandung, Indonesia","institution_ids":["https://openalex.org/I19128659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019634360","display_name":"R. Budiarianto Suryo Kusumo","orcid":null},"institutions":[{"id":"https://openalex.org/I19128659","display_name":"Indonesian Institute of Sciences","ror":"https://ror.org/03d7c1451","country_code":"ID","type":"facility","lineage":["https://openalex.org/I19128659"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"R. Budiarianto S. Kusumo","raw_affiliation_strings":["Research Center for Informatics, Indonesian Institute of Sciences, Bandung, Indonesia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Research Center for Informatics, Indonesian Institute of Sciences, Bandung, Indonesia","institution_ids":["https://openalex.org/I19128659"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.5007,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.65542638,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"19","last_page":"24"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.7684862613677979},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7651275396347046},{"id":"https://openalex.org/keywords/filter-bank","display_name":"Filter bank","score":0.7174942493438721},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6892958283424377},{"id":"https://openalex.org/keywords/discrete-cosine-transform","display_name":"Discrete cosine transform","score":0.6687794923782349},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.6661074757575989},{"id":"https://openalex.org/keywords/reverberation","display_name":"Reverberation","score":0.5678431987762451},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5224258303642273},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.502227783203125},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4746951460838318},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.4398967921733856},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.43493330478668213},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4220837652683258},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.38662976026535034},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.10782736539840698}],"concepts":[{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.7684862613677979},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7651275396347046},{"id":"https://openalex.org/C100515483","wikidata":"https://www.wikidata.org/wiki/Q3268235","display_name":"Filter bank","level":3,"score":0.7174942493438721},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6892958283424377},{"id":"https://openalex.org/C2221639","wikidata":"https://www.wikidata.org/wiki/Q2877","display_name":"Discrete cosine transform","level":3,"score":0.6687794923782349},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.6661074757575989},{"id":"https://openalex.org/C95851461","wikidata":"https://www.wikidata.org/wiki/Q468809","display_name":"Reverberation","level":2,"score":0.5678431987762451},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5224258303642273},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.502227783203125},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4746951460838318},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.4398967921733856},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.43493330478668213},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4220837652683258},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.38662976026535034},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.10782736539840698},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ic3ina48034.2019.8949593","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ic3ina48034.2019.8949593","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 International Conference on Computer, Control, Informatics and its Applications (IC3INA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.7400000095367432}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W1524333225","https://openalex.org/W1604406927","https://openalex.org/W1951896508","https://openalex.org/W1970088388","https://openalex.org/W1971065938","https://openalex.org/W1973669708","https://openalex.org/W1973787919","https://openalex.org/W1983874169","https://openalex.org/W1984570643","https://openalex.org/W1989314204","https://openalex.org/W1992817080","https://openalex.org/W1993882792","https://openalex.org/W2005679925","https://openalex.org/W2032793676","https://openalex.org/W2045043668","https://openalex.org/W2047546246","https://openalex.org/W2048981179","https://openalex.org/W2052003115","https://openalex.org/W2072128103","https://openalex.org/W2073979726","https://openalex.org/W2100969003","https://openalex.org/W2109770219","https://openalex.org/W2112739286","https://openalex.org/W2113932204","https://openalex.org/W2126597753","https://openalex.org/W2129800309","https://openalex.org/W2131342762","https://openalex.org/W2136682440","https://openalex.org/W2136922672","https://openalex.org/W2139737683","https://openalex.org/W2146871184","https://openalex.org/W2148154194","https://openalex.org/W2152131029","https://openalex.org/W2157515590","https://openalex.org/W2160815625","https://openalex.org/W2168961642","https://openalex.org/W2213952365","https://openalex.org/W2222568552","https://openalex.org/W2291864985","https://openalex.org/W2294256493","https://openalex.org/W2401289784","https://openalex.org/W3104170010","https://openalex.org/W4231109964","https://openalex.org/W6631362777","https://openalex.org/W6688428952"],"related_works":["https://openalex.org/W2766680336","https://openalex.org/W1559551917","https://openalex.org/W2548564146","https://openalex.org/W2133320490","https://openalex.org/W4289830142","https://openalex.org/W1497065097","https://openalex.org/W3150393935","https://openalex.org/W2048014685","https://openalex.org/W2125446021","https://openalex.org/W2980055100"],"abstract_inverted_index":{"Traditionally,":[0],"automatic":[1],"speech":[2,65,144,166],"recognition":[3],"(ASR)":[4],"uses":[5],"a":[6,143,151,157],"Hidden":[7],"Markov":[8],"Model":[9,13],"with":[10],"Gaussian":[11],"Mixture":[12],"(HMM-GMM)":[14],"as":[15,22,27,75,105],"acoustic":[16,28],"model":[17],"and":[18,177,190],"hand-designed":[19],"features":[20,36,171],"such":[21,74,104],"Mel-frequency":[23],"Cepstral":[24],"Coefficient":[25],"(MFCC)":[26],"features.":[29,126],"It":[30],"is":[31,85,115,156],"usually":[32],"assumed":[33],"that":[34,62,168],"the":[35,47,55,64,78,122,125,128,137,169],"are":[37,108],"uncorrelated,":[38],"making":[39],"it":[40],"possible":[41],"to":[42,54,93,188],"use":[43,56,129],"diagonal":[44],"covariances":[45],"for":[46],"GMM.":[48],"The":[49,161],"assumption":[50],"generally":[51],"holds":[52],"due":[53],"of":[57,124,130,139,159],"Discrete":[58],"Cosine":[59],"Transformation":[60],"(DCT)":[61],"de-correlates":[63],"spectra.":[66],"However,":[67],"DCT":[68],"could":[69],"cause":[70,136],"some":[71],"information":[72],"loss,":[73],"correlations":[76,141],"between":[77,121],"feature":[79],"components.":[80],"Current":[81],"ASR":[82],"systems,":[83],"which":[84,155],"based":[86],"on":[87,163,179],"Deep":[88],"Neural":[89],"Network":[90],"(DNN)":[91],"show":[92,167],"be":[94,112],"better":[95,116,173],"especially":[96],"in":[97,117,133,142],"reverberant":[98,165],"conditions":[99],"when":[100],"more":[101],"primitive":[102],"features,":[103],"filter-bank":[106],"(FBANK),":[107],"used.":[109],"This":[110],"might":[111],"because":[113],"DNN":[114],"modeling":[118],"non-linear":[119],"relations":[120],"components":[123],"But":[127],"short-time":[131],"processing":[132],"FBANK":[134,178],"may":[135],"lost":[138],"long-term":[140],"pattern.":[145],"To":[146],"tackle":[147],"this,":[148],"we":[149],"propose":[150],"new":[152],"feature,":[153],"q-FBANK,":[154],"generalization":[158],"FBANK.":[160],"results":[162],"artificially":[164],"proposed":[170],"achieve":[172],"performance":[174],"than":[175],"MFCC":[176],"DNN-HMM":[180],"systems":[181],"where":[182],"an":[183],"average":[184],"error":[185],"reduction":[186],"up":[187],"39.73%":[189],"13.5%":[191],"were":[192],"achieved":[193],"respectively.":[194]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
