{"id":"https://openalex.org/W4386176982","doi":"https://doi.org/10.1109/tnnls.2023.3304516","title":"DSTCNet: Deep Spectro-Temporal-Channel Attention Network for Speech Emotion Recognition","display_name":"DSTCNet: Deep Spectro-Temporal-Channel Attention Network for Speech Emotion Recognition","publication_year":2023,"publication_date":"2023-08-25","ids":{"openalex":"https://openalex.org/W4386176982","doi":"https://doi.org/10.1109/tnnls.2023.3304516","pmid":"https://pubmed.ncbi.nlm.nih.gov/37624721"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2023.3304516","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3304516","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055229622","display_name":"Lili Guo","orcid":null},"institutions":[{"id":"https://openalex.org/I25757504","display_name":"China University of Mining and Technology","ror":"https://ror.org/01xt2dr21","country_code":"CN","type":"education","lineage":["https://openalex.org/I25757504"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lili Guo","raw_affiliation_strings":["School of Computer Science and Technology, China University of Mining and Technology, Xuzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-5526-0980","affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, China University of Mining and Technology, Xuzhou, China","institution_ids":["https://openalex.org/I25757504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082274996","display_name":"Shifei Ding","orcid":"https://orcid.org/0000-0002-1391-2717"},"institutions":[{"id":"https://openalex.org/I25757504","display_name":"China University of Mining and Technology","ror":"https://ror.org/01xt2dr21","country_code":"CN","type":"education","lineage":["https://openalex.org/I25757504"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shifei Ding","raw_affiliation_strings":["School of Computer Science and Technology, China University of Mining and Technology, Xuzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-1391-2717","affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, China University of Mining and Technology, Xuzhou, China","institution_ids":["https://openalex.org/I25757504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101745213","display_name":"Longbiao Wang","orcid":"https://orcid.org/0000-0002-8094-6861"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Longbiao Wang","raw_affiliation_strings":["Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China","College of Intelligence and Computing, Tianjin Key Laboratory of Cognitive Computing and Application, Tianjin University, Tianjin, China"],"raw_orcid":"https://orcid.org/0000-0002-8094-6861","affiliations":[{"raw_affiliation_string":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]},{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin Key Laboratory of Cognitive Computing and Application, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017251198","display_name":"Jianwu Dang","orcid":"https://orcid.org/0000-0002-9237-4821"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianwu Dang","raw_affiliation_strings":["Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China","College of Intelligence and Computing, Tianjin Key Laboratory of Cognitive Computing and Application, Tianjin University, Tianjin, China"],"raw_orcid":"https://orcid.org/0000-0002-9237-4821","affiliations":[{"raw_affiliation_string":"Tianjin Key Laboratory of Cognitive Computing and Application, College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]},{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin Key Laboratory of Cognitive Computing and Application, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5055229622"],"corresponding_institution_ids":["https://openalex.org/I25757504"],"apc_list":null,"apc_paid":null,"fwci":4.4665,"has_fulltext":false,"cited_by_count":24,"citation_normalized_percentile":{"value":0.95738355,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"36","issue":"1","first_page":"188","last_page":"197"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9884999990463257,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9884999990463257,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.964900016784668,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9541000127792358,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5704208612442017},{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.5323629379272461},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.43198806047439575},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.42203816771507263},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.3968486189842224}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5704208612442017},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.5323629379272461},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.43198806047439575},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.42203816771507263},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.3968486189842224}],"mesh":[{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000077321","descriptor_name":"Deep Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001288","descriptor_name":"Attention","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D001288","descriptor_name":"Attention","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":false},{"descriptor_ui":"D001288","descriptor_name":"Attention","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":false},{"descriptor_ui":"D001288","descriptor_name":"Attention","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D001288","descriptor_name":"Attention","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D004644","descriptor_name":"Emotions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D004644","descriptor_name":"Emotions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D004644","descriptor_name":"Emotions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D004644","descriptor_name":"Emotions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D004644","descriptor_name":"Emotions","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D013060","descriptor_name":"Speech","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D013060","descriptor_name":"Speech","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":false},{"descriptor_ui":"D013060","descriptor_name":"Speech","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":false},{"descriptor_ui":"D013060","descriptor_name":"Speech","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D013060","descriptor_name":"Speech","qualifier_ui":"Q000502","qualifier_name":"physiology","is_major_topic":true},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016208","descriptor_name":"Databases, Factual","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D016571","descriptor_name":"Neural Networks, Computer","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2023.3304516","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3304516","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:37624721","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37624721","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.41999998688697815}],"awards":[{"id":"https://openalex.org/G1799562806","display_name":null,"funder_award_id":"62276185","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2162735739","display_name":null,"funder_award_id":"61976216","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4570677827","display_name":null,"funder_award_id":"62276265","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7018490659","display_name":null,"funder_award_id":"2022QN1096","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G7732325329","display_name":null,"funder_award_id":"62176182","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W175750906","https://openalex.org/W211912913","https://openalex.org/W1731081199","https://openalex.org/W1972340877","https://openalex.org/W2042700175","https://openalex.org/W2055911634","https://openalex.org/W2080289724","https://openalex.org/W2096987757","https://openalex.org/W2111072639","https://openalex.org/W2128021225","https://openalex.org/W2146334809","https://openalex.org/W2158061940","https://openalex.org/W2599621350","https://openalex.org/W2747664154","https://openalex.org/W2766272105","https://openalex.org/W2800253600","https://openalex.org/W2885005742","https://openalex.org/W2889374687","https://openalex.org/W2889717020","https://openalex.org/W2898004252","https://openalex.org/W2962736520","https://openalex.org/W2970737019","https://openalex.org/W2980520956","https://openalex.org/W2992341299","https://openalex.org/W2996249958","https://openalex.org/W2996799978","https://openalex.org/W2999653953","https://openalex.org/W3011859875","https://openalex.org/W3022013598","https://openalex.org/W3092190487","https://openalex.org/W3129702347","https://openalex.org/W3162387328","https://openalex.org/W3162475537","https://openalex.org/W3163091219","https://openalex.org/W3184215204","https://openalex.org/W3204087964","https://openalex.org/W4200502037","https://openalex.org/W4213424653","https://openalex.org/W4214872590","https://openalex.org/W4282542617","https://openalex.org/W4286544676","https://openalex.org/W4287890650","https://openalex.org/W4289752563","https://openalex.org/W4312771325","https://openalex.org/W6683633756","https://openalex.org/W6733353833"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2350741829","https://openalex.org/W2530322880","https://openalex.org/W1596801655","https://openalex.org/W3126677997"],"abstract_inverted_index":{"Speech":[0],"emotion":[1],"recognition":[2],"(SER)":[3],"plays":[4],"an":[5],"important":[6],"role":[7],"in":[8,59],"human-computer":[9],"interaction,":[10],"which":[11,70],"can":[12,130,169],"provide":[13],"better":[14],"interactivity":[15],"to":[16,23,29,45,86],"enhance":[17],"user":[18],"experiences.":[19],"Existing":[20],"approaches":[21],"tend":[22],"directly":[24],"apply":[25],"deep":[26,82],"learning":[27],"networks":[28],"distinguish":[30],"emotions.":[31],"Among":[32],"them,":[33],"the":[34,40,60,73,88,110,120,134,150,171],"convolutional":[35],"neural":[36],"network":[37,84],"(CNN)":[38],"is":[39],"most":[41],"commonly":[42],"used":[43],"method":[44],"learn":[46],"emotional":[47,152,157],"representations":[48],"from":[49],"spectrograms.":[50],"However,":[51],"CNN":[52],"does":[53],"not":[54],"explicitly":[55],"model":[56],"features'":[57],"associations":[58],"spectral-,":[61],"temporal-,":[62],"and":[63,125,142,155,174],"channel-wise":[64],"axes":[65],"or":[66],"their":[67],"relative":[68],"relevance,":[69],"will":[71],"limit":[72],"representation":[74],"learning.":[75],"In":[76],"this":[77],"article,":[78],"we":[79,108],"propose":[80,109],"a":[81,104,115],"spectro-temporal-channel":[83,99],"(DSTCNet)":[85],"improve":[87],"representational":[89],"ability":[90],"for":[91],"speech":[92],"emotion.":[93],"The":[94,127,163],"proposed":[95],"DSTCNet":[96,168],"integrates":[97],"several":[98,175],"(STC)":[100],"attention":[101,117,129],"modules":[102],"into":[103],"general":[105],"CNN.":[106],"Specifically,":[107],"STC":[111,128],"module":[112],"that":[113,166],"infers":[114],"3-D":[116],"map":[118],"along":[119],"dimensions":[121],"of":[122,136],"time,":[123],"frequency,":[124],"channel.":[126],"focus":[131],"more":[132],"on":[133,149],"regions":[135],"crucial":[137],"time":[138],"frames,":[139],"frequency":[140],"ranges,":[141],"feature":[143],"channels.":[144],"Finally,":[145],"experiments":[146],"were":[147],"conducted":[148],"Berlin":[151],"database":[153],"(EmoDB)":[154],"interactive":[156],"dyadic":[158],"motion":[159],"capture":[160],"(IEMOCAP)":[161],"databases.":[162],"results":[164],"reveal":[165],"our":[167],"outperform":[170],"traditional":[172],"CNN-based":[173],"state-of-the-art":[176],"methods.":[177]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":14},{"year":2024,"cited_by_count":7}],"updated_date":"2026-06-02T09:04:35.204637","created_date":"2025-10-10T00:00:00"}
