{"id":"https://openalex.org/W3038454187","doi":"https://doi.org/10.1109/lsp.2020.3006447","title":"A Novel Modified Mel-DCT Filter Bank Structure With Application to Voice Activity Detection","display_name":"A Novel Modified Mel-DCT Filter Bank Structure With Application to Voice Activity Detection","publication_year":2020,"publication_date":"2020-01-01","ids":{"openalex":"https://openalex.org/W3038454187","doi":"https://doi.org/10.1109/lsp.2020.3006447","mag":"3038454187"},"language":"en","primary_location":{"id":"doi:10.1109/lsp.2020.3006447","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2020.3006447","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023433960","display_name":"R. Muralishankar","orcid":null},"institutions":[{"id":"https://openalex.org/I4210104573","display_name":"CMR University","ror":"https://ror.org/015waqy33","country_code":"IN","type":"education","lineage":["https://openalex.org/I4210104573"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"R. Muralishankar","raw_affiliation_strings":["School of Engineering and Technology, CMR University, Bengaluru, India"],"affiliations":[{"raw_affiliation_string":"School of Engineering and Technology, CMR University, Bengaluru, India","institution_ids":["https://openalex.org/I4210104573"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080164252","display_name":"Debayan Ghosh","orcid":"https://orcid.org/0000-0002-4415-8657"},"institutions":[{"id":"https://openalex.org/I196608512","display_name":"PES University","ror":"https://ror.org/05m169e78","country_code":"IN","type":"education","lineage":["https://openalex.org/I196608512"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Debayan Ghosh","raw_affiliation_strings":["Department of Electronics and Communication Engineering, PES University, Bengaluru, India"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Communication Engineering, PES University, Bengaluru, India","institution_ids":["https://openalex.org/I196608512"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031193084","display_name":"Sanjeev Gurugopinath","orcid":"https://orcid.org/0000-0003-0401-6651"},"institutions":[{"id":"https://openalex.org/I196608512","display_name":"PES University","ror":"https://ror.org/05m169e78","country_code":"IN","type":"education","lineage":["https://openalex.org/I196608512"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sanjeev Gurugopinath","raw_affiliation_strings":["Department of Electronics and Communication Engineering, PES University, Bengaluru, India"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Communication Engineering, PES University, Bengaluru, India","institution_ids":["https://openalex.org/I196608512"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5023433960"],"corresponding_institution_ids":["https://openalex.org/I4210104573"],"apc_list":null,"apc_paid":null,"fwci":0.9092,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.73791968,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"27","issue":null,"first_page":"1240","last_page":"1244"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.8409193754196167},{"id":"https://openalex.org/keywords/filter-bank","display_name":"Filter bank","score":0.8125410079956055},{"id":"https://openalex.org/keywords/discrete-cosine-transform","display_name":"Discrete cosine transform","score":0.7967885732650757},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7124350070953369},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6332467794418335},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.5606210231781006},{"id":"https://openalex.org/keywords/modified-discrete-cosine-transform","display_name":"Modified discrete cosine transform","score":0.48899829387664795},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.46494144201278687},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37353479862213135},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.36913007497787476},{"id":"https://openalex.org/keywords/transform-coding","display_name":"Transform coding","score":0.15756472945213318},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.1572589874267578}],"concepts":[{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.8409193754196167},{"id":"https://openalex.org/C100515483","wikidata":"https://www.wikidata.org/wiki/Q3268235","display_name":"Filter bank","level":3,"score":0.8125410079956055},{"id":"https://openalex.org/C2221639","wikidata":"https://www.wikidata.org/wiki/Q2877","display_name":"Discrete cosine transform","level":3,"score":0.7967885732650757},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7124350070953369},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6332467794418335},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.5606210231781006},{"id":"https://openalex.org/C28726691","wikidata":"https://www.wikidata.org/wiki/Q1268231","display_name":"Modified discrete cosine transform","level":5,"score":0.48899829387664795},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.46494144201278687},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37353479862213135},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.36913007497787476},{"id":"https://openalex.org/C169805256","wikidata":"https://www.wikidata.org/wiki/Q1361381","display_name":"Transform coding","level":4,"score":0.15756472945213318},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.1572589874267578},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lsp.2020.3006447","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2020.3006447","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.7900000214576721}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W1974387177","https://openalex.org/W2090711167","https://openalex.org/W2090861223","https://openalex.org/W2097036989","https://openalex.org/W2107926288","https://openalex.org/W2126693545","https://openalex.org/W2129120544","https://openalex.org/W2148154194","https://openalex.org/W2149053750","https://openalex.org/W2159531755","https://openalex.org/W2160254053","https://openalex.org/W2166637769","https://openalex.org/W2240641835","https://openalex.org/W2805399811","https://openalex.org/W2889192039","https://openalex.org/W6683747465"],"related_works":["https://openalex.org/W2565123265","https://openalex.org/W2090071970","https://openalex.org/W2112852877","https://openalex.org/W2766680336","https://openalex.org/W2133320490","https://openalex.org/W2108727544","https://openalex.org/W1507290937","https://openalex.org/W4289830142","https://openalex.org/W1559551917","https://openalex.org/W2548564146"],"abstract_inverted_index":{"We":[0],"propose":[1],"a":[2,46,58,93,118],"novel":[3],"modified":[4],"Mel-discrete":[5],"cosine":[6,52],"transform":[7],"(MMD)":[8],"filter":[9,18,43,181],"bank":[10,182],"structure,":[11],"which":[12],"restricts":[13],"the":[14,27,33,36,41,65,70,84,88,122,142,146,164,174,178],"overlap":[15],"of":[16,35,67,130,150,177],"each":[17],"response":[19,48],"to":[20,26,116],"its":[21],"immediate":[22],"neighbor.":[23],"In":[24,134],"contrast":[25],"well-known":[28,166],"triangular":[29],"filters":[30],"employed":[31],"in":[32,57,83,121,158],"extraction":[34],"Mel-frequency":[37],"cepstral":[38],"coefficients":[39],"(MFCC),":[40],"proposed":[42,179],"structure":[44],"has":[45],"smoother":[47],"and":[49,54],"offers":[50],"discrete":[51],"transformation":[53],"Mel-scale":[55],"filtering":[56],"single":[59],"operation.":[60],"It":[61],"is":[62],"known":[63,115],"that":[64,139],"choice":[66],"MFCC":[68,100,112],"as":[69],"only":[71],"feature":[72],"for":[73,153,183],"voice":[74,151],"activity":[75],"detection":[76,159],"(VAD)":[77],"does":[78],"not":[79,94],"yield":[80],"substantial":[81,119],"improvements":[82,157],"performance.":[85],"Even":[86],"with":[87,127,163],"long-term":[89,106,147,167],"approach,":[90],"we":[91,137],"observe":[92],"so":[95],"encouraging":[96],"VAD":[97,108,154],"performance":[98,123],"when":[99,161],"features":[101],"are":[102,114],"employed.":[103],"However,":[104],"other":[105,165,184],"based":[107],"algorithms":[109],"-":[110,113],"without":[111],"provide":[117],"improvement":[120],"under":[124],"low":[125],"SNR":[126],"time-varying":[128],"statistics":[129],"speech":[131,185],"and/or":[132],"noise.":[133],"this":[135,170],"work,":[136],"show":[138],"by":[140,145],"employing":[141],"MMD":[143,180],"followed":[144],"differential":[148],"entropy":[149],"signal":[152],"provides":[155],"significant":[156],"accuracy":[160],"compared":[162],"algorithms.":[168],"Thus,":[169],"study":[171],"opens":[172],"up":[173],"possible":[175],"benefits":[176],"processing":[186],"applications.":[187]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":4},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
