{"id":"https://openalex.org/W2144298644","doi":"https://doi.org/10.1186/s13636-014-0040-7","title":"A sub-band-based feature reconstruction approach for robust speaker recognition","display_name":"A sub-band-based feature reconstruction approach for robust speaker recognition","publication_year":2014,"publication_date":"2014-10-20","ids":{"openalex":"https://openalex.org/W2144298644","doi":"https://doi.org/10.1186/s13636-014-0040-7","mag":"2144298644"},"language":"en","primary_location":{"id":"doi:10.1186/s13636-014-0040-7","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-014-0040-7","pdf_url":"https://asmp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13636-014-0040-7","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://asmp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13636-014-0040-7","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044641652","display_name":"Furong Yan","orcid":"https://orcid.org/0000-0002-7969-7204"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Furong Yan","raw_affiliation_strings":["Beijing University of Posts and Telecommunications, No.10 Xitucheng Road, Beijing, 100876, China","Beijing University of Posts and Telecommunications,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications, No.10 Xitucheng Road, Beijing, 100876, China","institution_ids":["https://openalex.org/I139759216"]},{"raw_affiliation_string":"Beijing University of Posts and Telecommunications,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100680383","display_name":"Yanbin Zhang","orcid":"https://orcid.org/0000-0002-6292-8352"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanbin Zhang","raw_affiliation_strings":["Beijing University of Posts and Telecommunications, No.10 Xitucheng Road, Beijing, 100876, China","Beijing University of Posts and Telecommunications,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications, No.10 Xitucheng Road, Beijing, 100876, China","institution_ids":["https://openalex.org/I139759216"]},{"raw_affiliation_string":"Beijing University of Posts and Telecommunications,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010995528","display_name":"Jiachang Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiachang Yan","raw_affiliation_strings":["Beijing University of Posts and Telecommunications, No.10 Xitucheng Road, Beijing, 100876, China","Beijing University of Posts and Telecommunications,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Beijing University of Posts and Telecommunications, No.10 Xitucheng Road, Beijing, 100876, China","institution_ids":["https://openalex.org/I139759216"]},{"raw_affiliation_string":"Beijing University of Posts and Telecommunications,Beijing,China","institution_ids":["https://openalex.org/I139759216"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5044641652"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":{"value":1115,"currency":"GBP","value_usd":1367},"apc_paid":{"value":1115,"currency":"GBP","value_usd":1367},"fwci":0.8734,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.76018519,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"2014","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.8230217099189758},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6626802682876587},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6422120332717896},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6377583742141724},{"id":"https://openalex.org/keywords/principal-component-analysis","display_name":"Principal component analysis","score":0.6374441385269165},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6050169467926025},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5810962319374084},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5246220827102661},{"id":"https://openalex.org/keywords/frequency-band","display_name":"Frequency band","score":0.5171663165092468},{"id":"https://openalex.org/keywords/radio-spectrum","display_name":"Radio spectrum","score":0.5162196159362793},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4521104395389557},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.4212753474712372},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.13959461450576782},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.0787748396396637}],"concepts":[{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.8230217099189758},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6626802682876587},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6422120332717896},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6377583742141724},{"id":"https://openalex.org/C27438332","wikidata":"https://www.wikidata.org/wiki/Q2873","display_name":"Principal component analysis","level":2,"score":0.6374441385269165},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6050169467926025},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5810962319374084},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5246220827102661},{"id":"https://openalex.org/C2778116611","wikidata":"https://www.wikidata.org/wiki/Q25110567","display_name":"Frequency band","level":3,"score":0.5171663165092468},{"id":"https://openalex.org/C92545706","wikidata":"https://www.wikidata.org/wiki/Q902174","display_name":"Radio spectrum","level":2,"score":0.5162196159362793},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4521104395389557},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.4212753474712372},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.13959461450576782},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0787748396396637},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1186/s13636-014-0040-7","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-014-0040-7","pdf_url":"https://asmp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13636-014-0040-7","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1186/s13636-014-0040-7","is_oa":true,"landing_page_url":"https://doi.org/10.1186/s13636-014-0040-7","pdf_url":"https://asmp-eurasipjournals.springeropen.com/counter/pdf/10.1186/s13636-014-0040-7","source":{"id":"https://openalex.org/S19605986","display_name":"EURASIP Journal on Audio Speech and Music Processing","issn_l":"1687-4714","issn":["1687-4714","1687-4722"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EURASIP Journal on Audio, Speech, and Music Processing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2144298644.pdf","grobid_xml":"https://content.openalex.org/works/W2144298644.grobid-xml"},"referenced_works_count":39,"referenced_works":["https://openalex.org/W133022121","https://openalex.org/W1532958172","https://openalex.org/W1543669765","https://openalex.org/W1555148682","https://openalex.org/W1567962139","https://openalex.org/W1586405805","https://openalex.org/W1594612032","https://openalex.org/W1667165204","https://openalex.org/W1887190047","https://openalex.org/W1922557984","https://openalex.org/W2036488048","https://openalex.org/W2041823554","https://openalex.org/W2055611715","https://openalex.org/W2056999733","https://openalex.org/W2061140267","https://openalex.org/W2074354966","https://openalex.org/W2078953162","https://openalex.org/W2080794664","https://openalex.org/W2082470439","https://openalex.org/W2105393821","https://openalex.org/W2111406180","https://openalex.org/W2120689488","https://openalex.org/W2131037542","https://openalex.org/W2143855671","https://openalex.org/W2146083413","https://openalex.org/W2147147599","https://openalex.org/W2150866759","https://openalex.org/W2153311664","https://openalex.org/W2155636609","https://openalex.org/W2158336491","https://openalex.org/W2165880886","https://openalex.org/W2166817508","https://openalex.org/W2397634864","https://openalex.org/W2405891901","https://openalex.org/W3031363333","https://openalex.org/W3148076546","https://openalex.org/W4301253858","https://openalex.org/W6600379119","https://openalex.org/W6812480115"],"related_works":["https://openalex.org/W3119288895","https://openalex.org/W2185075503","https://openalex.org/W2749720872","https://openalex.org/W2131673591","https://openalex.org/W2186375278","https://openalex.org/W2793748347","https://openalex.org/W2104528589","https://openalex.org/W2155047054","https://openalex.org/W2002404399","https://openalex.org/W2379120504"],"abstract_inverted_index":{"Although":[0],"the":[1,14,17,40,57,62,86,89,94,101,105,113,139,152,175,194,202,215],"field":[2],"of":[3,19,64,88,183,197,214],"automatic":[4],"speaker":[5,168],"or":[6],"speech":[7],"recognition":[8,159,169,184,203,233],"has":[9,21],"been":[10],"extensively":[11],"studied":[12],"over":[13],"past":[15],"decades,":[16],"lack":[18],"robustness":[20],"remained":[22],"a":[23,32,48,117],"major":[24],"challenge.":[25],"The":[26,161,171],"missing":[27],"data":[28],"technique":[29],"(MDT)":[30],"is":[31,69,83,97,165,207],"promising":[33],"approach.":[34],"However,":[35],"its":[36],"performance":[37,185],"depends":[38],"on":[39,56,136],"correlation":[41,87],"across":[42,66,217],"frequency":[43,67,198,218],"bands.":[44],"This":[45],"paper":[46,120],"presents":[47],"new":[49],"reconstruction":[50,163,180],"method":[51],"for":[52,158,201],"feature":[53,90],"enhancement":[54],"based":[55,135],"trait.":[58],"In":[59],"this":[60,119],"paper,":[61],"degree":[63],"concentration":[65],"bands":[68],"measured":[70],"with":[71,112],"principal":[72],"component":[73],"analysis":[74,78],"(PCA).":[75],"Through":[76],"theoretical":[77],"and":[79,125],"experimental":[80],"results,":[81],"it":[82],"found":[84],"that":[85,174],"vector":[91],"extracted":[92,103,131],"from":[93,104,132,144],"sub-band":[95],"(SB)":[96],"much":[98,210],"stronger":[99],"than":[100,110],"ones":[102],"full-band":[106,122,179],"(FB).":[107],"Thus,":[108],"rather":[109],"dealing":[111],"spectral":[114,129],"features":[115,130,143],"as":[116],"whole,":[118],"splits":[121],"into":[123,209],"sub-bands":[124,146],"then":[126],"individually":[127],"reconstructs":[128],"each":[133],"SB":[134],"MDT.":[137],"At":[138],"end,":[140],"those":[141],"constructed":[142],"all":[145,187],"will":[147],"be":[148,228],"recombined":[149],"to":[150,227,230],"yield":[151],"conventional":[153],"mel-frequency":[154],"cepstral":[155],"coefficient":[156],"(MFCC)":[157],"experiments.":[160],"2-sub-band":[162],"approach":[164,177],"evaluated":[166],"in":[167,181,186],"system.":[170],"results":[172],"show":[173],"proposed":[176],"outperforms":[178],"terms":[182],"noise":[188],"conditions.":[189],"Finally,":[190],"we":[191],"particularly":[192],"discuss":[193],"optimal":[195],"selection":[196],"division":[199,224],"ways":[200,225],"task.":[204],"When":[205],"FB":[206],"divided":[208],"more":[211],"sub-bands,":[212],"some":[213],"correlations":[216],"channels":[219],"are":[220],"lost.":[221],"Consequently,":[222],"efficient":[223],"need":[226],"investigated":[229],"perform":[231],"further":[232],"performance.":[234]},"counts_by_year":[{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
