{"id":"https://openalex.org/W4312251832","doi":"https://doi.org/10.1587/transfun.2022eap1091","title":"A Multitask Learning Approach Based on Cascaded Attention Network and Self-Adaption Loss for Speech Emotion Recognition","display_name":"A Multitask Learning Approach Based on Cascaded Attention Network and Self-Adaption Loss for Speech Emotion Recognition","publication_year":2022,"publication_date":"2022-12-07","ids":{"openalex":"https://openalex.org/W4312251832","doi":"https://doi.org/10.1587/transfun.2022eap1091"},"language":"en","primary_location":{"id":"doi:10.1587/transfun.2022eap1091","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transfun.2022eap1091","pdf_url":"https://www.jstage.jst.go.jp/article/transfun/E106.A/6/E106.A_2022EAP1091/_pdf","source":{"id":"https://openalex.org/S166990724","display_name":"IEICE Transactions on Fundamentals of Electronics Communications and Computer Sciences","issn_l":"0916-8508","issn":["0916-8508","1745-1337"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Fundamentals of Electronics, Communications and Computer Sciences","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://www.jstage.jst.go.jp/article/transfun/E106.A/6/E106.A_2022EAP1091/_pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066331204","display_name":"Yang Liu","orcid":"https://orcid.org/0000-0002-9976-8671"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yang LIU","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058642737","display_name":"Yuqi Xia","orcid":"https://orcid.org/0000-0001-9485-6739"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuqi XIA","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035524175","display_name":"Haoqin Sun","orcid":"https://orcid.org/0000-0002-8554-8969"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoqin SUN","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033661018","display_name":"Xiaolei MENG","orcid":null},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaolei MENG","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016373821","display_name":"Jianxiong BAI","orcid":null},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianxiong BAI","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004108905","display_name":"Wenbo Guan","orcid":"https://orcid.org/0000-0002-6448-0387"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenbo GUAN","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100658759","display_name":"Zhen Zhao","orcid":"https://orcid.org/0000-0001-5825-5346"},"institutions":[{"id":"https://openalex.org/I143413998","display_name":"Qingdao University of Science and Technology","ror":"https://ror.org/041j8js14","country_code":"CN","type":"education","lineage":["https://openalex.org/I143413998"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhen ZHAO","raw_affiliation_strings":["School of Information Science and Technology, Qingdao University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, Qingdao University of Science and Technology","institution_ids":["https://openalex.org/I143413998"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030173820","display_name":"Yongwei LI","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongwei LI","raw_affiliation_strings":["National Laboratory of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5066331204"],"corresponding_institution_ids":["https://openalex.org/I143413998"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.17454345,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"E106.A","issue":"6","first_page":"876","last_page":"885"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9812999963760376,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7351152896881104},{"id":"https://openalex.org/keywords/multi-task-learning","display_name":"Multi-task learning","score":0.6577823162078857},{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.6034442186355591},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5604173541069031},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5526132583618164},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5008416175842285},{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.47679972648620605},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.46918749809265137},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4434191882610321},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35049235820770264},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.14486920833587646},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.0744161307811737}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7351152896881104},{"id":"https://openalex.org/C28006648","wikidata":"https://www.wikidata.org/wiki/Q6934509","display_name":"Multi-task learning","level":3,"score":0.6577823162078857},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.6034442186355591},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5604173541069031},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5526132583618164},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5008416175842285},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.47679972648620605},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.46918749809265137},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4434191882610321},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35049235820770264},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.14486920833587646},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0744161307811737},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1587/transfun.2022eap1091","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transfun.2022eap1091","pdf_url":"https://www.jstage.jst.go.jp/article/transfun/E106.A/6/E106.A_2022EAP1091/_pdf","source":{"id":"https://openalex.org/S166990724","display_name":"IEICE Transactions on Fundamentals of Electronics Communications and Computer Sciences","issn_l":"0916-8508","issn":["0916-8508","1745-1337"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Fundamentals of Electronics, Communications and Computer Sciences","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1587/transfun.2022eap1091","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transfun.2022eap1091","pdf_url":"https://www.jstage.jst.go.jp/article/transfun/E106.A/6/E106.A_2022EAP1091/_pdf","source":{"id":"https://openalex.org/S166990724","display_name":"IEICE Transactions on Fundamentals of Electronics Communications and Computer Sciences","issn_l":"0916-8508","issn":["0916-8508","1745-1337"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Fundamentals of Electronics, Communications and Computer Sciences","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.5199999809265137}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4312251832.pdf","grobid_xml":"https://content.openalex.org/works/W4312251832.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W2087618018","https://openalex.org/W2087750470","https://openalex.org/W2102953093","https://openalex.org/W2110052520","https://openalex.org/W2130427639","https://openalex.org/W2131537280","https://openalex.org/W2140801466","https://openalex.org/W2146334809","https://openalex.org/W2171728561","https://openalex.org/W2295001676","https://openalex.org/W2343758848","https://openalex.org/W2399733683","https://openalex.org/W2408520939","https://openalex.org/W2625297138","https://openalex.org/W2747506362","https://openalex.org/W2750666523","https://openalex.org/W2752782242","https://openalex.org/W2766272105","https://openalex.org/W2885005742","https://openalex.org/W2889374687","https://openalex.org/W2936113082","https://openalex.org/W2962815376","https://openalex.org/W2972602947","https://openalex.org/W3128401974"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4319309271","https://openalex.org/W4366320140","https://openalex.org/W2784094750","https://openalex.org/W4285160008","https://openalex.org/W1812322370","https://openalex.org/W2597787948","https://openalex.org/W3200098538","https://openalex.org/W3047894882","https://openalex.org/W3208584567"],"abstract_inverted_index":{"Speech":[0],"emotion":[1,49,61],"recognition":[2],"(SER)":[3],"has":[4],"been":[5],"a":[6,12,24,63,110,115],"complex":[7],"and":[8,34,100,143,154],"difficult":[9],"task":[10],"for":[11,37],"long":[13],"time":[14],"due":[15],"to":[16,44,57,120],"emotional":[17],"complexity.":[18],"In":[19],"this":[20],"paper,":[21],"we":[22],"propose":[23],"multitask":[25,111],"deep":[26],"learning":[27,112],"approach":[28],"based":[29],"on":[30,88,130],"cascaded":[31],"attention":[32,65,72],"network":[33,66],"self-adaption":[35,116],"loss":[36,117],"SER.":[38],"First,":[39],"non-personalized":[40],"features":[41],"are":[42],"extracted":[43],"represent":[45],"the":[46,76,86,92,96,122],"process":[47],"of":[48,78,103,124,141,150],"change":[50],"while":[51,83],"reducing":[52],"external":[53,89,104],"variables'":[54],"influence.":[55],"Second,":[56],"highlight":[58],"salient":[59],"speech":[60,79],"features,":[62],"cascade":[64],"is":[67,106,118],"proposed,":[68],"where":[69,114],"spatial":[70],"temporal":[71],"can":[73],"effectively":[74],"locate":[75],"regions":[77],"that":[80,134],"express":[81],"emotion,":[82],"self-attention":[84],"reduces":[85],"dependence":[87],"information.":[90],"Finally,":[91],"influence":[93],"brought":[94],"by":[95,108],"differences":[97],"in":[98,148],"gender":[99],"human":[101],"perception":[102],"information":[105],"alleviated":[107],"using":[109],"strategy,":[113],"introduced":[119],"determine":[121],"weights":[123],"different":[125],"tasks":[126],"dynamically.":[127],"Experimental":[128],"results":[129],"IEMOCAP":[131],"dataset":[132],"demonstrate":[133],"our":[135],"method":[136],"gains":[137],"an":[138],"absolute":[139],"improvement":[140],"1.97%":[142],"0.91%":[144],"over":[145],"state-of-the-art":[146],"strategies":[147],"terms":[149],"weighted":[151],"accuracy":[152,156],"(WA)":[153],"unweighted":[155],"(UA),":[157],"respectively.":[158]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
