{"id":"https://openalex.org/W3160505857","doi":"https://doi.org/10.23919/eusipco54536.2021.9615958","title":"Deep scattering network for speech emotion recognition","display_name":"Deep scattering network for speech emotion recognition","publication_year":2021,"publication_date":"2021-08-23","ids":{"openalex":"https://openalex.org/W3160505857","doi":"https://doi.org/10.23919/eusipco54536.2021.9615958","mag":"3160505857"},"language":"en","primary_location":{"id":"doi:10.23919/eusipco54536.2021.9615958","is_oa":false,"landing_page_url":"https://doi.org/10.23919/eusipco54536.2021.9615958","pdf_url":null,"source":{"id":"https://openalex.org/S4363607854","display_name":"2021 29th European Signal Processing Conference (EUSIPCO)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 29th European Signal Processing Conference (EUSIPCO)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2105.04806","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101252426","display_name":"Premjeet Singh","orcid":"https://orcid.org/0009-0001-9650-1138"},"institutions":[{"id":"https://openalex.org/I145894827","display_name":"Indian Institute of Technology Kharagpur","ror":"https://ror.org/03w5sq511","country_code":"IN","type":"education","lineage":["https://openalex.org/I145894827"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Premjeet Singh","raw_affiliation_strings":["Dept of Electronics and ECE, Indian Institute of Technology Kharagpur, Kharagpur, India","Indian Institute of Technology\u2013Kharagpur"],"affiliations":[{"raw_affiliation_string":"Dept of Electronics and ECE, Indian Institute of Technology Kharagpur, Kharagpur, India","institution_ids":["https://openalex.org/I145894827"]},{"raw_affiliation_string":"Indian Institute of Technology\u2013Kharagpur","institution_ids":["https://openalex.org/I145894827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069790572","display_name":"Goutam Saha","orcid":"https://orcid.org/0000-0001-6187-1684"},"institutions":[{"id":"https://openalex.org/I145894827","display_name":"Indian Institute of Technology Kharagpur","ror":"https://ror.org/03w5sq511","country_code":"IN","type":"education","lineage":["https://openalex.org/I145894827"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Goutam Saha","raw_affiliation_strings":["Dept of Electronics and ECE, Indian Institute of Technology Kharagpur, Kharagpur, India","Indian Institute of Technology\u2013Kharagpur"],"affiliations":[{"raw_affiliation_string":"Dept of Electronics and ECE, Indian Institute of Technology Kharagpur, Kharagpur, India","institution_ids":["https://openalex.org/I145894827"]},{"raw_affiliation_string":"Indian Institute of Technology\u2013Kharagpur","institution_ids":["https://openalex.org/I145894827"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079693142","display_name":"Md Sahidullah","orcid":"https://orcid.org/0000-0002-0624-2903"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I4210121838","display_name":"Laboratoire Lorrain de Recherche en Informatique et ses Applications","ror":"https://ror.org/02vnf0c38","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I277688954","https://openalex.org/I4210107720","https://openalex.org/I4210121838","https://openalex.org/I4210159245","https://openalex.org/I90183372"]},{"id":"https://openalex.org/I90183372","display_name":"Universit\u00e9 de Lorraine","ror":"https://ror.org/04vfs2w97","country_code":"FR","type":"education","lineage":["https://openalex.org/I90183372"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Md Sahidullah","raw_affiliation_strings":["Universit\u00e9 de Lorraine, CNRS, Inria, LORIA, Nancy, France","French Institute for Research in Computer Science and Automation"],"affiliations":[{"raw_affiliation_string":"Universit\u00e9 de Lorraine, CNRS, Inria, LORIA, Nancy, France","institution_ids":["https://openalex.org/I90183372","https://openalex.org/I4210121838","https://openalex.org/I1294671590"]},{"raw_affiliation_string":"French Institute for Research in Computer Science and Automation","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101252426"],"corresponding_institution_ids":["https://openalex.org/I145894827"],"apc_list":null,"apc_paid":null,"fwci":0.2249,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.41010101,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"131","last_page":"135"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.7856554985046387},{"id":"https://openalex.org/keywords/scattering","display_name":"Scattering","score":0.7152081727981567},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6111218333244324},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.565962553024292},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5181478261947632},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.501183271408081},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44096243381500244},{"id":"https://openalex.org/keywords/time\u2013frequency-analysis","display_name":"Time\u2013frequency analysis","score":0.43970999121665955},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3594890832901001},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.31941571831703186},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.2543390989303589},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.13423514366149902},{"id":"https://openalex.org/keywords/optics","display_name":"Optics","score":0.11755558848381042}],"concepts":[{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.7856554985046387},{"id":"https://openalex.org/C191486275","wikidata":"https://www.wikidata.org/wiki/Q210028","display_name":"Scattering","level":2,"score":0.7152081727981567},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6111218333244324},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.565962553024292},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5181478261947632},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.501183271408081},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44096243381500244},{"id":"https://openalex.org/C142433447","wikidata":"https://www.wikidata.org/wiki/Q7806653","display_name":"Time\u2013frequency analysis","level":3,"score":0.43970999121665955},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3594890832901001},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.31941571831703186},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.2543390989303589},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.13423514366149902},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.11755558848381042},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0}],"mesh":[],"locations_count":6,"locations":[{"id":"doi:10.23919/eusipco54536.2021.9615958","is_oa":false,"landing_page_url":"https://doi.org/10.23919/eusipco54536.2021.9615958","pdf_url":null,"source":{"id":"https://openalex.org/S4363607854","display_name":"2021 29th European Signal Processing Conference (EUSIPCO)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 29th European Signal Processing Conference (EUSIPCO)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2105.04806","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2105.04806","pdf_url":"https://arxiv.org/pdf/2105.04806","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:3160505857","is_oa":true,"landing_page_url":"http://arxiv.org/pdf/2105.04806.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"pmh:oai:HAL:hal-03218278v1","is_oa":true,"landing_page_url":"https://hal.science/hal-03218278","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"EUSIPCO 2021 - 29th European Signal Processing Conference, Aug 2021, Dublin / Virtual, Ireland. &#x27E8;10.23919/EUSIPCO54536.2021.9615958&#x27E9;","raw_type":"Conference papers"},{"id":"pmh:oai:oskar-bordeaux.fr:20.500.12278/31381","is_oa":false,"landing_page_url":"https://oskar-bordeaux.fr/handle/20.500.12278/31381","pdf_url":null,"source":{"id":"https://openalex.org/S4306402569","display_name":"Oskar-Bordeaux (Universite de Bordeaux)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Communication dans un congr\u00e8s avec actes"},{"id":"doi:10.48550/arxiv.2105.04806","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2105.04806","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2105.04806","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2105.04806","pdf_url":"https://arxiv.org/pdf/2105.04806","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Gender equality","id":"https://metadata.un.org/sdg/5","score":0.5199999809265137}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W175750906","https://openalex.org/W1510825849","https://openalex.org/W1641465689","https://openalex.org/W1994906459","https://openalex.org/W1995562189","https://openalex.org/W2072072671","https://openalex.org/W2074788634","https://openalex.org/W2087618018","https://openalex.org/W2093231248","https://openalex.org/W2146334809","https://openalex.org/W2159333554","https://openalex.org/W2196961052","https://openalex.org/W2399733683","https://openalex.org/W2405274704","https://openalex.org/W2618574054","https://openalex.org/W2766272105","https://openalex.org/W2803193013","https://openalex.org/W2888786729","https://openalex.org/W2945837706","https://openalex.org/W2962790223","https://openalex.org/W2972691009","https://openalex.org/W2972717745","https://openalex.org/W2997399314","https://openalex.org/W3111213250","https://openalex.org/W3113497772","https://openalex.org/W3120557855","https://openalex.org/W3127806559","https://openalex.org/W3138819813","https://openalex.org/W6636832325","https://openalex.org/W6737985840","https://openalex.org/W6767895713"],"related_works":["https://openalex.org/W2959460518","https://openalex.org/W199595529","https://openalex.org/W2746415023","https://openalex.org/W2988796883","https://openalex.org/W2016207770","https://openalex.org/W1986532109","https://openalex.org/W2914956632","https://openalex.org/W2991314292","https://openalex.org/W2103257373","https://openalex.org/W2159333554","https://openalex.org/W2169234936","https://openalex.org/W2738674843","https://openalex.org/W2241564424","https://openalex.org/W2067687945","https://openalex.org/W1889034575","https://openalex.org/W1607510692","https://openalex.org/W267714254","https://openalex.org/W1585607783","https://openalex.org/W2168758670","https://openalex.org/W202998574"],"abstract_inverted_index":{"This":[0],"paper":[1],"introduces":[2],"scattering":[3,51,92,108,113,120],"transform":[4,11],"for":[5,137],"speech":[6],"emotion":[7,34,58,73,81],"recognition":[8],"(SER).":[9],"Scattering":[10],"generates":[12],"feature":[13],"representations":[14],"which":[15],"remain":[16],"stable":[17,131],"to":[18,90,122],"deformations":[19],"and":[20,24,40,46,114,129,133],"shifting":[21],"in":[22,42],"time":[23,39,45,127],"frequency":[25,47,107],"without":[26],"much":[27],"loss":[28],"of":[29,50,126],"information.":[30],"In":[31],"speech,":[32],"the":[33,69,80,124],"cues":[35],"are":[36],"spread":[37],"across":[38],"localised":[41],"frequency.":[43],"The":[44],"invariance":[48],"characteristic":[49],"coefficients":[52,93,98,121,136,143],"provides":[53],"a":[54,77],"representation":[55,78],"robust":[56],"against":[57],"irrelevant":[59],"variations":[60,70],"e.g.,":[61],"different":[62,101],"speakers,":[63],"language,":[64],"gender":[65],"etc.":[66],"while":[67],"preserving":[68],"caused":[71],"by":[72],"cues.":[74],"Hence,":[75],"such":[76],"captures":[79],"information":[82],"more":[83],"efficiently":[84],"from":[85],"speech.":[86],"We":[87,116,139],"perform":[88,147],"experiments":[89],"compare":[91],"with":[94],"standard":[95],"mel-frequency":[96],"cepstral":[97],"(MFCCs)":[99],"over":[100],"databases.":[102],"It":[103],"is":[104],"observed":[105],"that":[106,141],"performs":[109],"better":[110,148],"than":[111,149],"time-domain":[112],"MFCCs.":[115,150],"also":[117,146],"investigate":[118],"layer-wise":[119,142],"analyse":[123],"importance":[125],"shift":[128],"deformation":[130],"scalogram":[132],"modulation":[134],"spectrum":[135],"SER.":[138],"observe":[140],"taken":[144],"independently":[145]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
