{"id":"https://openalex.org/W15731617","doi":"https://doi.org/10.21437/interspeech.2005-179","title":"Statistical properties of the warped discrete cosine transform cepstrum compared with MFCC","display_name":"Statistical properties of the warped discrete cosine transform cepstrum compared with MFCC","publication_year":2005,"publication_date":"2005-09-04","ids":{"openalex":"https://openalex.org/W15731617","doi":"https://doi.org/10.21437/interspeech.2005-179","mag":"15731617"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2005-179","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2005-179","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2005","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023433960","display_name":"R. Muralishankar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"R. Muralishankar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111469714","display_name":"Abhijeet Sangwan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abhijeet Sangwan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5011489869","display_name":"Douglas O\u2019Shaughnessy","orcid":"https://orcid.org/0000-0002-0110-2346"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Douglas O'Shaughnessy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.9721,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.73429805,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"341","last_page":"344"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.928803563117981},{"id":"https://openalex.org/keywords/codebook","display_name":"Codebook","score":0.8207980394363403},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.7419308423995972},{"id":"https://openalex.org/keywords/discrete-cosine-transform","display_name":"Discrete cosine transform","score":0.7018063068389893},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6792769432067871},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6423707008361816},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5762550830841064},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5310196280479431},{"id":"https://openalex.org/keywords/vector-quantization","display_name":"Vector quantization","score":0.5282420516014099},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4814966917037964},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.4148520827293396},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.36449718475341797}],"concepts":[{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.928803563117981},{"id":"https://openalex.org/C127759330","wikidata":"https://www.wikidata.org/wiki/Q637416","display_name":"Codebook","level":2,"score":0.8207980394363403},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.7419308423995972},{"id":"https://openalex.org/C2221639","wikidata":"https://www.wikidata.org/wiki/Q2877","display_name":"Discrete cosine transform","level":3,"score":0.7018063068389893},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6792769432067871},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6423707008361816},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5762550830841064},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5310196280479431},{"id":"https://openalex.org/C199833920","wikidata":"https://www.wikidata.org/wiki/Q612536","display_name":"Vector quantization","level":2,"score":0.5282420516014099},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4814966917037964},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.4148520827293396},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.36449718475341797},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2005-179","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2005-179","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2005","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6800000071525574,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":7,"referenced_works":["https://openalex.org/W1559551917","https://openalex.org/W1590403649","https://openalex.org/W2070238296","https://openalex.org/W2096935579","https://openalex.org/W2135934764","https://openalex.org/W2138692623","https://openalex.org/W2160254053"],"related_works":["https://openalex.org/W2148772884","https://openalex.org/W2017514583","https://openalex.org/W2100120615","https://openalex.org/W2147406819","https://openalex.org/W2352648934","https://openalex.org/W1929869830","https://openalex.org/W2387054321","https://openalex.org/W2017401491","https://openalex.org/W2062765737","https://openalex.org/W2012827167"],"abstract_inverted_index":{"Abstract":[0],"In":[1],"this":[2],"paper,":[3],"we":[4,25,71],"continue":[5],"our":[6],"investigation":[7],"of":[8,30,45,168,207,234,275],"the":[9,27,31,36,46,51,92,99,118,147,156,161,197,205,217,221,231,236,272],"warpeddiscrete":[10],"cosine":[11,102],"transform":[12],"cepstrum":[13,104],"(WDCTC),":[14],"which":[15],"wasearlier":[16],"introduced":[17,98],"as":[18,106,136],"a":[19,78,107,124,137,165,192,243],"new":[20,108],"speech":[21,109,138,183],"processing":[22,110,139],"feature":[23,140,170],"[1].Here,":[24],"study":[26],"statistical":[28,54,151],"properties":[29,44],"WDCTC":[32,73,132,148,187,218,237,267],"andcompare":[33],"them":[34],"with":[35,59],"mel-frequency":[37,119],"cepstral":[38,120],"coef\ufb01cients(MFCC).":[39],"We":[40,96,257],"report":[41],"some":[42],"interesting":[43],"WD-CTC":[47],"when":[48],"compared":[49],"to":[50,144,182,229],"MFCC:":[52],"its":[53,114,150],"distrib-ution":[55],"is":[56,159,255],"more":[57],"Gaussian-like":[58],"lower":[60],"variance,":[61],"it":[62],"obtainsbettervowel":[63],"clusterseparability,it":[64],"formstightervowelclus-ters":[65],"and":[66,74,85,112,127,141,163,180,188,195,201,238,250,261,270],"generates":[67],"better":[68,115,225],"codebooks.":[69],"Further,":[70],"employthe":[72],"MFCC":[75,189,239],"features":[76,269],"in":[77,123,242],"5-vowel":[79,244],"recognitiontask":[80],"using":[81,191,204],"Vector":[82,247],"Quantization":[83],"(VQ)":[84,249],"1-Nearest":[86],"Neigh-bour(1-NN)as":[87],"classi\ufb01ers.":[88],"Inourexperiments,the":[89],"WDCTCconsistently":[90],"outperforms":[91],"MFCC.":[93],"1.":[94],"Introduction":[95],"recently":[97],"warped":[100],"discrete":[101],"trans-form":[103],"(WDCTC)":[105],"fea-ture":[111],"demonstrated":[113],"performance":[116,254],"than":[117,226],"coef\ufb01cients":[121],"(MFCC)":[122],"vowel":[125,223,263],"recog-nition":[126],"speaker-identi\ufb01cation":[128],"task":[129],"[1].":[130],"The":[131],"hasshown":[133],"good":[134],"promise":[135],"weare":[142],"encouraged":[143],"further":[145],"investigate":[146],"featureand":[149],"properties.Alargevolumeoftrainingdataisrequiredto":[152],"buildspea-ker-independentspeechrecognitionsystems.":[153],"Onetechniqueof":[154],"reducing":[155],"data":[157,162,224],"size":[158],"clustering":[160],"choos-ing":[164],"reasonable":[166],"number":[167],"representative":[169],"vectorsto":[171],"form":[172,186],"codebooks":[173,190,219],"[2].":[174],"Hence,":[175],"codebook":[176,198],"techniques":[177],"arevery":[178],"relevant":[179],"practical":[181],"recognition":[184,245],"systems.We":[185],"k-meansclustering":[193],"algorithm":[194],"compare":[196,230],"statisticsfor":[199],"clean":[200,260],"noisy":[202,262],"vowels":[203],"coef\ufb01cient":[206],"varianceand":[208],"overlap":[209],"ratio":[210],"(de\ufb01ned":[211],"later).":[212],"Our":[213],"experiment":[214],"demon-strates":[215],"that":[216],"represent":[220],"underly-ing":[222],"MFCC.In":[227],"order":[228],"classi\ufb01cation":[232],"capability":[233],"thefeatures,":[235],"are":[240],"employed":[241],"task.":[246],"quantization":[248],"1-nearestneighbor(1-NN,[2])are":[251],"usedas":[252],"classi\ufb01ersandtheirrecognition":[253],"reported.":[256],"also":[258],"investigatethe":[259],"clusters":[264],"formed":[265],"by":[266],"andMFCC":[268],"present":[271],"average":[273],"separability":[274],"thevowel":[276],"classes.":[277]},"counts_by_year":[{"year":2015,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
