{"id":"https://openalex.org/W4321609205","doi":"https://doi.org/10.1109/taslp.2023.3245401","title":"A Discriminative Feature Representation Method Based on Cascaded Attention Network With Adversarial Strategy for Speech Emotion Recognition","display_name":"A Discriminative Feature Representation Method Based on Cascaded Attention Network With Adversarial Strategy for Speech Emotion Recognition","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4321609205","doi":"https://doi.org/10.1109/taslp.2023.3245401"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2023.3245401","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2023.3245401","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066331204","display_name":"Yang Liu","orcid":"https://orcid.org/0000-0002-9976-8671"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yang Liu","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0002-9976-8671","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035524175","display_name":"Haoqin Sun","orcid":"https://orcid.org/0000-0002-8554-8969"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoqin Sun","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0002-8554-8969","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004108905","display_name":"Wenbo Guan","orcid":"https://orcid.org/0000-0002-6448-0387"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenbo Guan","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0002-6448-0387","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058642737","display_name":"Yuqi Xia","orcid":"https://orcid.org/0000-0001-9485-6739"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuqi Xia","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0001-9485-6739","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100717753","display_name":"Yongwei Li","orcid":"https://orcid.org/0000-0001-7799-366X"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongwei Li","raw_affiliation_strings":["National Laboratory of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-7799-366X","affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014199725","display_name":"Masashi Unoki","orcid":"https://orcid.org/0000-0002-6605-2052"},"institutions":[{"id":"https://openalex.org/I177738480","display_name":"Japan Advanced Institute of Science and Technology","ror":"https://ror.org/03frj4r98","country_code":"JP","type":"education","lineage":["https://openalex.org/I177738480"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Masashi Unoki","raw_affiliation_strings":["School of Information Science, Japan Advanced Institute of Science and Technology, Nomi, Ishikawa, Japan"],"raw_orcid":"https://orcid.org/0000-0002-6605-2052","affiliations":[{"raw_affiliation_string":"School of Information Science, Japan Advanced Institute of Science and Technology, Nomi, Ishikawa, Japan","institution_ids":["https://openalex.org/I177738480"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5080527694","display_name":"Zhen Zhao","orcid":"https://orcid.org/0000-0002-7898-8974"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhen Zhao","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China"],"raw_orcid":"https://orcid.org/0000-0002-7898-8974","affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology, Qingdao, China","institution_ids":["https://openalex.org/I143413998"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5066331204"],"corresponding_institution_ids":["https://openalex.org/I143413998"],"apc_list":null,"apc_paid":null,"fwci":8.0954,"has_fulltext":false,"cited_by_count":33,"citation_normalized_percentile":{"value":0.98034004,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"31","issue":null,"first_page":"1063","last_page":"1074"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.816308856010437},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7700413465499878},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.7308229804039001},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6110225319862366},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5863907933235168},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5292108654975891},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5276557207107544},{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.4527204632759094},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.44656825065612793},{"id":"https://openalex.org/keywords/interference","display_name":"Interference (communication)","score":0.42999914288520813},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3874180316925049},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32036370038986206},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.19349241256713867},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.0801909863948822}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.816308856010437},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7700413465499878},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.7308229804039001},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6110225319862366},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5863907933235168},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5292108654975891},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5276557207107544},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.4527204632759094},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.44656825065612793},{"id":"https://openalex.org/C32022120","wikidata":"https://www.wikidata.org/wiki/Q797225","display_name":"Interference (communication)","level":3,"score":0.42999914288520813},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3874180316925049},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32036370038986206},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.19349241256713867},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0801909863948822},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2023.3245401","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2023.3245401","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.6899999976158142}],"awards":[{"id":"https://openalex.org/G268415559","display_name":null,"funder_award_id":"ZR2020QF007","funder_id":"https://openalex.org/F4320324174","funder_display_name":"Natural Science Foundation of Shandong Province"},{"id":"https://openalex.org/G7194583006","display_name":null,"funder_award_id":"19JCYBJC15600","funder_id":"https://openalex.org/F4320323993","funder_display_name":"Natural Science Foundation of Tianjin City"}],"funders":[{"id":"https://openalex.org/F4320323993","display_name":"Natural Science Foundation of Tianjin City","ror":null},{"id":"https://openalex.org/F4320324174","display_name":"Natural Science Foundation of Shandong Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W175750906","https://openalex.org/W177923765","https://openalex.org/W1556467653","https://openalex.org/W2047337856","https://openalex.org/W2080576537","https://openalex.org/W2087618018","https://openalex.org/W2092718714","https://openalex.org/W2099767163","https://openalex.org/W2116516955","https://openalex.org/W2140801466","https://openalex.org/W2146334809","https://openalex.org/W2186582707","https://openalex.org/W2194775991","https://openalex.org/W2214134199","https://openalex.org/W2239141610","https://openalex.org/W2314084222","https://openalex.org/W2518110751","https://openalex.org/W2549858646","https://openalex.org/W2592497314","https://openalex.org/W2592702372","https://openalex.org/W2766272105","https://openalex.org/W2784163702","https://openalex.org/W2885005742","https://openalex.org/W2889544113","https://openalex.org/W2901446695","https://openalex.org/W2910121883","https://openalex.org/W2936372954","https://openalex.org/W2936774411","https://openalex.org/W2939129695","https://openalex.org/W2939488497","https://openalex.org/W2959133507","https://openalex.org/W2962686539","https://openalex.org/W2963026686","https://openalex.org/W2972498864","https://openalex.org/W3011859875","https://openalex.org/W3097567450","https://openalex.org/W3100321043","https://openalex.org/W3103152812","https://openalex.org/W3138410940","https://openalex.org/W3159124063","https://openalex.org/W3178599867","https://openalex.org/W3196443845","https://openalex.org/W3197101920","https://openalex.org/W3198893858","https://openalex.org/W4214825215","https://openalex.org/W4288038809","https://openalex.org/W4289752563","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W2502115930","https://openalex.org/W4246396837","https://openalex.org/W2482350142","https://openalex.org/W3176240006","https://openalex.org/W3126451824","https://openalex.org/W2965546495","https://openalex.org/W1561927205","https://openalex.org/W3191453585","https://openalex.org/W4297672492","https://openalex.org/W2735297260"],"abstract_inverted_index":{"Currently,":[0],"speech":[1,55],"emotion":[2,56],"recognition":[3],"models":[4],"still":[5],"could":[6],"not":[7],"show":[8],"satisfactory":[9],"performance":[10],"due":[11],"to":[12,72,88,103,146],"the":[13,20,31,61,67,91,113,118,125,132,148,155,172,188],"complexity":[14],"of":[15,19,30,83,93,135],"emotions.":[16],"In":[17,37,121],"most":[18],"previous":[21],"studies,":[22],"there":[23],"is":[24,144],"a":[25,42,99],"common":[26],"problem":[27],"that":[28,182],"some":[29],"particular":[32],"emotions":[33,68],"are":[34,70,169],"severely":[35],"misclassified.":[36],"this":[38],"article,":[39],"we":[40,77,97],"propose":[41],"novel":[43],"framework":[44],"integrating":[45],"cascaded":[46,100],"attention":[47,101,110,127],"network":[48,102],"and":[49,81,175],"adversarial":[50,140,161],"joint":[51,141],"loss":[52,142],"strategy":[53,143],"for":[54],"recognition,":[57],"aiming":[58],"at":[59],"discriminating":[60],"confusions":[62],"by":[63,154],"emphasizing":[64],"more":[65],"on":[66,191],"which":[69],"difficult":[71],"be":[73],"correctly":[74],"classified.":[75],"First,":[76],"extract":[78,104],"log-Mels,":[79],"deltas":[80],"delta-deltas":[82],"log-Mels":[84],"as":[85],"3D":[86],"features":[87],"effectively":[89],"reduce":[90],"interference":[92],"external":[94],"factors.":[95],"Next,":[96],"introduce":[98],"effective":[105],"emotional":[106,115,149],"features,":[107],"where":[108],"spatiotemporal":[109],"selectively":[111],"locates":[112],"targeted":[114,123],"regions":[116],"from":[117],"input":[119],"features.":[120,137],"these":[122],"regions,":[124],"self":[126],"with":[128,151,171],"head":[129],"fusion":[130],"captures":[131],"long-distance":[133],"dependence":[134],"temporal":[136],"Finally,":[138],"an":[139,160],"proposed":[145,166,184],"distinguish":[147],"embeddings":[150],"high":[152],"similarity":[153],"generated":[156],"hard":[157],"triplets":[158],"in":[159],"fashion.":[162],"To":[163],"evaluate":[164],"our":[165,183],"method,":[167],"experiments":[168],"performed":[170],"IEMOCAP,":[173],"CASIA,":[174],"EMODB":[176],"corpora.":[177],"The":[178],"experimental":[179],"results":[180],"demonstrate":[181],"method":[185],"significantly":[186],"outperforms":[187],"state-of-the-art":[189],"approaches":[190],"all":[192],"datasets.":[193]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":17},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":1}],"updated_date":"2026-05-08T15:41:06.802602","created_date":"2025-10-10T00:00:00"}
