{"id":"https://openalex.org/W2944612567","doi":"https://doi.org/10.1109/iscslp.2018.8706699","title":"Robust Front-End Processing For Emotion Recognition In Noisy Speech","display_name":"Robust Front-End Processing For Emotion Recognition In Noisy Speech","publication_year":2018,"publication_date":"2018-11-01","ids":{"openalex":"https://openalex.org/W2944612567","doi":"https://doi.org/10.1109/iscslp.2018.8706699","mag":"2944612567"},"language":"en","primary_location":{"id":"doi:10.1109/iscslp.2018.8706699","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2018.8706699","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 11th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5077399768","display_name":"Meghna Pandharipande","orcid":null},"institutions":[{"id":"https://openalex.org/I55215948","display_name":"Tata Consultancy Services (India)","ror":"https://ror.org/01b9n8m42","country_code":"IN","type":"company","lineage":["https://openalex.org/I4210086519","https://openalex.org/I55215948"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Meghna Pandharipande","raw_affiliation_strings":["TCS Research and Innovation, Mumbai, INDIA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"TCS Research and Innovation, Mumbai, INDIA","institution_ids":["https://openalex.org/I55215948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077689139","display_name":"Rupayan Chakraborty","orcid":"https://orcid.org/0000-0002-3566-0784"},"institutions":[{"id":"https://openalex.org/I55215948","display_name":"Tata Consultancy Services (India)","ror":"https://ror.org/01b9n8m42","country_code":"IN","type":"company","lineage":["https://openalex.org/I4210086519","https://openalex.org/I55215948"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Rupayan Chakraborty","raw_affiliation_strings":["TCS Research and Innovation, Mumbai, INDIA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"TCS Research and Innovation, Mumbai, INDIA","institution_ids":["https://openalex.org/I55215948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103959037","display_name":"Ashish Panda","orcid":null},"institutions":[{"id":"https://openalex.org/I55215948","display_name":"Tata Consultancy Services (India)","ror":"https://ror.org/01b9n8m42","country_code":"IN","type":"company","lineage":["https://openalex.org/I4210086519","https://openalex.org/I55215948"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Ashish Panda","raw_affiliation_strings":["TCS Research and Innovation, Mumbai, INDIA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"TCS Research and Innovation, Mumbai, INDIA","institution_ids":["https://openalex.org/I55215948"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047383705","display_name":"Sunil Kumar Kopparapu","orcid":"https://orcid.org/0000-0002-0502-527X"},"institutions":[{"id":"https://openalex.org/I55215948","display_name":"Tata Consultancy Services (India)","ror":"https://ror.org/01b9n8m42","country_code":"IN","type":"company","lineage":["https://openalex.org/I4210086519","https://openalex.org/I55215948"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sunil Kumar Kopparapu","raw_affiliation_strings":["TCS Research and Innovation, Mumbai, INDIA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"TCS Research and Innovation, Mumbai, INDIA","institution_ids":["https://openalex.org/I55215948"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.1639,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.80929414,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"324","last_page":"328"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7908391952514648},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.759893536567688},{"id":"https://openalex.org/keywords/non-negative-matrix-factorization","display_name":"Non-negative matrix factorization","score":0.7088369131088257},{"id":"https://openalex.org/keywords/front-and-back-ends","display_name":"Front and back ends","score":0.6579158306121826},{"id":"https://openalex.org/keywords/voice-activity-detection","display_name":"Voice activity detection","score":0.5912095904350281},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5085538625717163},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4685709476470947},{"id":"https://openalex.org/keywords/energy","display_name":"Energy (signal processing)","score":0.4465470314025879},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.44185692071914673},{"id":"https://openalex.org/keywords/detector","display_name":"Detector","score":0.43731069564819336},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.432849645614624},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3834025263786316},{"id":"https://openalex.org/keywords/matrix-decomposition","display_name":"Matrix decomposition","score":0.24383580684661865},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.2392905056476593},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.06904566287994385}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7908391952514648},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.759893536567688},{"id":"https://openalex.org/C152671427","wikidata":"https://www.wikidata.org/wiki/Q10843505","display_name":"Non-negative matrix factorization","level":4,"score":0.7088369131088257},{"id":"https://openalex.org/C53016008","wikidata":"https://www.wikidata.org/wiki/Q620167","display_name":"Front and back ends","level":2,"score":0.6579158306121826},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.5912095904350281},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5085538625717163},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4685709476470947},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.4465470314025879},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.44185692071914673},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.43731069564819336},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.432849645614624},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3834025263786316},{"id":"https://openalex.org/C42355184","wikidata":"https://www.wikidata.org/wiki/Q1361088","display_name":"Matrix decomposition","level":3,"score":0.24383580684661865},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.2392905056476593},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.06904566287994385},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iscslp.2018.8706699","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp.2018.8706699","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 11th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.4000000059604645}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W174669002","https://openalex.org/W175750906","https://openalex.org/W177923765","https://openalex.org/W231801308","https://openalex.org/W1966359074","https://openalex.org/W1999454387","https://openalex.org/W2010520781","https://openalex.org/W2013608223","https://openalex.org/W2030739378","https://openalex.org/W2074179263","https://openalex.org/W2074788634","https://openalex.org/W2082492120","https://openalex.org/W2083094940","https://openalex.org/W2130917731","https://openalex.org/W2135195345","https://openalex.org/W2146334809","https://openalex.org/W2154024118","https://openalex.org/W2287742606","https://openalex.org/W2339850901","https://openalex.org/W2487667478","https://openalex.org/W2525246137","https://openalex.org/W2754698175","https://openalex.org/W4297817736","https://openalex.org/W6607181510","https://openalex.org/W6607193717","https://openalex.org/W6609093682","https://openalex.org/W6653777654","https://openalex.org/W6679418476","https://openalex.org/W6703703274","https://openalex.org/W6744298679"],"related_works":["https://openalex.org/W2919389044","https://openalex.org/W1997528538","https://openalex.org/W2777466939","https://openalex.org/W2890579888","https://openalex.org/W1966856063","https://openalex.org/W2593427229","https://openalex.org/W2120771489","https://openalex.org/W2051376034","https://openalex.org/W2294333436","https://openalex.org/W284174822"],"abstract_inverted_index":{"Since":[0],"the":[1,18,43,53,72,79,85,125,142,145],"emotion":[2,88],"recognition":[3,89],"performances":[4],"degrade":[5],"drastically":[6],"for":[7],"noisy":[8,38,113],"speech,":[9],"we":[10,105],"propose":[11],"a":[12,26,94],"robust":[13],"front-end":[14,23,147],"processing":[15],"to":[16,82,140],"reduce":[17],"effect":[19],"of":[20,25,97,116,144],"noise.":[21],"The":[22,87],"consists":[24],"novel":[27],"energy":[28],"based":[29,60],"voice":[30],"activity":[31],"detector":[32],"(VAD),":[33],"which":[34],"discards":[35],"silence":[36],"or":[37],"frames.":[39],"We":[40],"show":[41],"that":[42],"proposed":[44,73,146],"VAD":[45,61,74],"results":[46],"in":[47],"significant":[48],"performance":[49,143],"gain":[50],"and":[51,104,122],"outperforms":[52],"more":[54],"complex":[55],"Recurrent":[56],"Neural":[57],"Network":[58],"(RNN)":[59],"as":[62,64],"well":[63],"popular":[65],"Non-negative":[66],"Matrix":[67],"Factorization":[68],"(NMF)":[69],"technique.":[70],"Moreover,":[71],"can":[75],"be":[76],"used":[77,107],"alongside":[78],"NMF":[80],"technique":[81],"further":[83],"improve":[84],"performance.":[86],"is":[90],"done":[91],"by":[92],"extracting":[93],"large":[95],"number":[96],"statistical":[98],"features":[99],"from":[100,124],"low-level":[101],"audio":[102],"descriptors,":[103],"have":[106,136],"state-of-the-art":[108],"classifiers.":[109],"Extensive":[110],"experimentation":[111],"on":[112],"(5":[114],"types":[115],"noise:":[117],"Babble,":[118],"F-16,":[119],"Factory,":[120],"Volvo,":[121],"HF-channel":[123],"Noisex-92":[126],"database)":[127],"speech":[128],"contaminated":[129],"at":[130],"5":[131],"different":[132],"SNR":[133],"levels":[134],"(0,5,10,15,20dB)":[135],"been":[137],"carried":[138],"out":[139],"measure":[141],"techniques.":[148]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
