{"id":"https://openalex.org/W4415709584","doi":"https://doi.org/10.1109/icme59968.2025.11209814","title":"DiBAN: Dual-Drive Broad Attentive Network for Speech Emotion Recognition","display_name":"DiBAN: Dual-Drive Broad Attentive Network for Speech Emotion Recognition","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4415709584","doi":"https://doi.org/10.1109/icme59968.2025.11209814"},"language":null,"primary_location":{"id":"doi:10.1109/icme59968.2025.11209814","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11209814","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109903598","display_name":"Gengbin ZHANG","orcid":null},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Gongli Zhang","raw_affiliation_strings":["South China University of Technology,School of Computer Science and Engineering,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100643265","display_name":"C. L. Philip Chen","orcid":"https://orcid.org/0000-0001-5451-7230"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"C. L. Philip Chen","raw_affiliation_strings":["South China University of Technology,School of Computer Science and Engineering,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101455067","display_name":"Tong Zhang","orcid":"https://orcid.org/0009-0001-9155-8178"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tong Zhang","raw_affiliation_strings":["South China University of Technology,School of Computer Science and Engineering,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029578429","display_name":"Zhulin Liu","orcid":"https://orcid.org/0000-0003-4145-823X"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhulin Liu","raw_affiliation_strings":["South China University of Technology,School of Computer Science and Engineering,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082022304","display_name":"Xiaoman Hu","orcid":"https://orcid.org/0000-0002-7222-0673"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoman Hu","raw_affiliation_strings":["South China University of Technology,School of Computer Science and Engineering,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I90610280"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108108538","display_name":"Bianna Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bianna Chen","raw_affiliation_strings":["South China University of Technology,School of Computer Science and Engineering,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"South China University of Technology,School of Computer Science and Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I90610280"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5109903598"],"corresponding_institution_ids":["https://openalex.org/I90610280"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.32192669,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9815999865531921,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9815999865531921,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.005100000184029341,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.0012000000569969416,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.6169999837875366},{"id":"https://openalex.org/keywords/knowledge-base","display_name":"Knowledge base","score":0.4147000014781952},{"id":"https://openalex.org/keywords/obstacle","display_name":"Obstacle","score":0.3862000107765198},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.3587999939918518},{"id":"https://openalex.org/keywords/base","display_name":"Base (topology)","score":0.3472999930381775},{"id":"https://openalex.org/keywords/decision-model","display_name":"Decision model","score":0.31949999928474426},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.31769999861717224},{"id":"https://openalex.org/keywords/supervised-learning","display_name":"Supervised learning","score":0.305400013923645}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7031999826431274},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.6169999837875366},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5730000138282776},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.46549999713897705},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.42320001125335693},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.4147000014781952},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.39500001072883606},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.3862000107765198},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.3587999939918518},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.3472999930381775},{"id":"https://openalex.org/C59594135","wikidata":"https://www.wikidata.org/wiki/Q5249242","display_name":"Decision model","level":2,"score":0.31949999928474426},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.31769999861717224},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.305400013923645},{"id":"https://openalex.org/C167981619","wikidata":"https://www.wikidata.org/wiki/Q1685498","display_name":"Cross entropy","level":3,"score":0.3046000003814697},{"id":"https://openalex.org/C163007329","wikidata":"https://www.wikidata.org/wiki/Q106679114","display_name":"Social emotional learning","level":2,"score":0.2896000146865845},{"id":"https://openalex.org/C6438553","wikidata":"https://www.wikidata.org/wiki/Q1185804","display_name":"Affective computing","level":2,"score":0.27959999442100525},{"id":"https://openalex.org/C2988148770","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion detection","level":3,"score":0.27619999647140503},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.26980000734329224},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.26159998774528503},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2599000036716461},{"id":"https://openalex.org/C206310091","wikidata":"https://www.wikidata.org/wiki/Q750859","display_name":"Emotion classification","level":2,"score":0.2542000114917755},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.25040000677108765}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme59968.2025.11209814","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11209814","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320309618","display_name":"Ministry of Science and Technology","ror":"https://ror.org/02b207r52"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null},{"id":"https://openalex.org/F4320337504","display_name":"Research and Development","ror":"https://ror.org/027s68j25"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W175750906","https://openalex.org/W2030931454","https://openalex.org/W2122111042","https://openalex.org/W2146334809","https://openalex.org/W2149706766","https://openalex.org/W2620962372","https://openalex.org/W2738226240","https://openalex.org/W2803098682","https://openalex.org/W2980520956","https://openalex.org/W3081192838","https://openalex.org/W3196974791","https://openalex.org/W3209059054","https://openalex.org/W3209984917","https://openalex.org/W4239510810","https://openalex.org/W4372266717","https://openalex.org/W4372269797","https://openalex.org/W4372341110","https://openalex.org/W4385245566","https://openalex.org/W4389459413","https://openalex.org/W4392309135","https://openalex.org/W4392903396","https://openalex.org/W4392904469","https://openalex.org/W4392931772","https://openalex.org/W4400762160"],"related_works":[],"abstract_inverted_index":{"Data-Knowledge":[0],"dual-driven":[1],"fashion":[2],"can":[3],"enhance":[4],"model":[5,76],"performance":[6],"by":[7],"complementing":[8],"data-driven":[9,25],"basis":[10],"with":[11],"expert":[12],"knowledge.":[13],"However,":[14],"cutting-edge":[15],"works":[16],"in":[17,24],"speech":[18],"emotion":[19],"recognition":[20],"(SER)":[21],"primarily":[22],"evolve":[23],"training,":[26],"failing":[27],"to":[28,32,41,59,81,94],"incorporate":[29],"prior":[30],"knowledge":[31],"form":[33],"a":[34,53],"closed":[35],"loop":[36],"and":[37,77,138],"posing":[38],"an":[39],"obstacle":[40],"capture":[42],"task-specific":[43],"details":[44],"when":[45],"used":[46],"independently.":[47],"In":[48],"this":[49],"paper,":[50],"we":[51],"propose":[52],"Dual-Drive":[54,68],"Broad":[55,108],"Attentive":[56],"Network":[57],"(DiBAN)":[58],"achieve":[60],"comprehensive":[61],"emotional":[62,84,98,117],"learning":[63],"for":[64],"SER.":[65],"Specifically,":[66],"the":[67,87,96,102,107,135],"Emotional":[69],"Modeling":[70],"module":[71,91,112],"incorporates":[72],"handcrafted":[73],"extractor,":[74],"pre-trained":[75],"tailored":[78],"base":[79,136],"models,":[80],"conduct":[82],"integral":[83],"modeling.":[85],"Subsequently,":[86],"Multi-Model":[88],"Attention-Aware":[89],"Learning":[90],"is":[92],"designed":[93],"refine":[95],"data-knowledge":[97],"disparities":[99],"based":[100],"on":[101,124],"attention-enhanced":[103],"entropy":[104],"loss.":[105],"Finally,":[106],"Adaptive":[109],"Decision":[110],"Fusion":[111],"performs":[113],"adaptive":[114],"fusion":[115],"of":[116],"decisions":[118],"from":[119],"different":[120],"drives.":[121],"Extensive":[122],"experiments":[123],"seven":[125],"SER":[126],"corpora":[127],"demonstrate":[128],"that":[129],"DiBAN":[130],"achieves":[131],"significant":[132],"improvements":[133],"over":[134],"models":[137],"outperforms":[139],"comparative":[140],"methods,":[141],"fully":[142],"showcasing":[143],"its":[144],"superiority.":[145]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-30T00:00:00"}
