{"id":"https://openalex.org/W4292980177","doi":"https://doi.org/10.1109/tcyb.2022.3195739","title":"AIA-Net: Adaptive Interactive Attention Network for Text\u2013Audio Emotion Recognition","display_name":"AIA-Net: Adaptive Interactive Attention Network for Text\u2013Audio Emotion Recognition","publication_year":2022,"publication_date":"2022-08-22","ids":{"openalex":"https://openalex.org/W4292980177","doi":"https://doi.org/10.1109/tcyb.2022.3195739","pmid":"https://pubmed.ncbi.nlm.nih.gov/35994535"},"language":"en","primary_location":{"id":"doi:10.1109/tcyb.2022.3195739","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2022.3195739","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100378800","display_name":"Tong Zhang","orcid":"https://orcid.org/0000-0002-7025-6365"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tong Zhang","raw_affiliation_strings":["School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","Brain and Affective Cognitive Research Center, Pazhou Lab, Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-7025-6365","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]},{"raw_affiliation_string":"Brain and Affective Cognitive Research Center, Pazhou Lab, Guangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027023224","display_name":"Shuzhen Li","orcid":"https://orcid.org/0000-0001-6847-6740"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuzhen Li","raw_affiliation_strings":["School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","Brain and Affective Cognitive Research Center, Pazhou Lab, Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-6847-6740","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]},{"raw_affiliation_string":"Brain and Affective Cognitive Research Center, Pazhou Lab, Guangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108108538","display_name":"Bianna Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bianna Chen","raw_affiliation_strings":["School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","Brain and Affective Cognitive Research Center, Pazhou Lab, Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-5451-7230","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]},{"raw_affiliation_string":"Brain and Affective Cognitive Research Center, Pazhou Lab, Guangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020996953","display_name":"Haozhang Yuan","orcid":null},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haozhang Yuan","raw_affiliation_strings":["School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","Brain and Affective Cognitive Research Center, Pazhou Lab, Guangzhou, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]},{"raw_affiliation_string":"Brain and Affective Cognitive Research Center, Pazhou Lab, Guangzhou, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100643265","display_name":"C. L. Philip Chen","orcid":"https://orcid.org/0000-0001-5451-7230"},"institutions":[{"id":"https://openalex.org/I90610280","display_name":"South China University of Technology","ror":"https://ror.org/0530pts50","country_code":"CN","type":"education","lineage":["https://openalex.org/I90610280"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"C. L. Philip Chen","raw_affiliation_strings":["School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","Brain and Affective Cognitive Research Center, Pazhou Lab, Guangzhou, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, South China University of Technology, Guangzhou, China","institution_ids":["https://openalex.org/I90610280"]},{"raw_affiliation_string":"Brain and Affective Cognitive Research Center, Pazhou Lab, Guangzhou, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":5.3514,"has_fulltext":false,"cited_by_count":38,"citation_normalized_percentile":{"value":0.96640267,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"53","issue":"12","first_page":"7659","last_page":"7671"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5810286998748779},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5012199878692627},{"id":"https://openalex.org/keywords/net","display_name":"Net (polyhedron)","score":0.45899444818496704},{"id":"https://openalex.org/keywords/audio-visual","display_name":"Audio visual","score":0.4152721166610718},{"id":"https://openalex.org/keywords/cognitive-psychology","display_name":"Cognitive psychology","score":0.35241878032684326},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.33080530166625977},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.3126738667488098},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0501399040222168}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5810286998748779},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5012199878692627},{"id":"https://openalex.org/C14166107","wikidata":"https://www.wikidata.org/wiki/Q253829","display_name":"Net (polyhedron)","level":2,"score":0.45899444818496704},{"id":"https://openalex.org/C3017588708","wikidata":"https://www.wikidata.org/wiki/Q758901","display_name":"Audio visual","level":2,"score":0.4152721166610718},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.35241878032684326},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.33080530166625977},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.3126738667488098},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0501399040222168},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000162","descriptor_name":"Acoustics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000162","descriptor_name":"Acoustics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000162","descriptor_name":"Acoustics","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D003199","descriptor_name":"Computer Systems","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003199","descriptor_name":"Computer Systems","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003199","descriptor_name":"Computer Systems","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004644","descriptor_name":"Emotions","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004644","descriptor_name":"Emotions","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004644","descriptor_name":"Emotions","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D006801","descriptor_name":"Humans","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D007858","descriptor_name":"Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1109/tcyb.2022.3195739","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2022.3195739","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},{"id":"pmid:35994535","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/35994535","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on cybernetics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.47999998927116394,"id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G1487701234","display_name":null,"funder_award_id":"62222603","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G420612141","display_name":null,"funder_award_id":"U1801262","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5197980865","display_name":null,"funder_award_id":"2019YFA0706200","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G5198162578","display_name":null,"funder_award_id":"62076102","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5750115239","display_name":null,"funder_award_id":"U1813203","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":80,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W1703987040","https://openalex.org/W1832693441","https://openalex.org/W1932847118","https://openalex.org/W2029996593","https://openalex.org/W2120615054","https://openalex.org/W2132860741","https://openalex.org/W2146334809","https://openalex.org/W2187089797","https://openalex.org/W2194775991","https://openalex.org/W2556418146","https://openalex.org/W2610961739","https://openalex.org/W2619383789","https://openalex.org/W2703895418","https://openalex.org/W2740550900","https://openalex.org/W2747664154","https://openalex.org/W2766272105","https://openalex.org/W2783274584","https://openalex.org/W2786768213","https://openalex.org/W2884561390","https://openalex.org/W2889325879","https://openalex.org/W2889374687","https://openalex.org/W2896457183","https://openalex.org/W2897132394","https://openalex.org/W2920885526","https://openalex.org/W2933138175","https://openalex.org/W2941503969","https://openalex.org/W2949391930","https://openalex.org/W2950978907","https://openalex.org/W2955084925","https://openalex.org/W2958722525","https://openalex.org/W2963686995","https://openalex.org/W2964010806","https://openalex.org/W2964051877","https://openalex.org/W2964300796","https://openalex.org/W2964346351","https://openalex.org/W2966140490","https://openalex.org/W2972463723","https://openalex.org/W2973049979","https://openalex.org/W2977752818","https://openalex.org/W2998470965","https://openalex.org/W3012721484","https://openalex.org/W3024507639","https://openalex.org/W3028041000","https://openalex.org/W3037572520","https://openalex.org/W3038471032","https://openalex.org/W3041730883","https://openalex.org/W3048195943","https://openalex.org/W3087647883","https://openalex.org/W3091972294","https://openalex.org/W3093043896","https://openalex.org/W3093051361","https://openalex.org/W3093400813","https://openalex.org/W3093434718","https://openalex.org/W3095251683","https://openalex.org/W3095334805","https://openalex.org/W3096164988","https://openalex.org/W3096690837","https://openalex.org/W3097571315","https://openalex.org/W3120680448","https://openalex.org/W3127474142","https://openalex.org/W3135148659","https://openalex.org/W3137536308","https://openalex.org/W3141688548","https://openalex.org/W3160574821","https://openalex.org/W3177085913","https://openalex.org/W3199305386","https://openalex.org/W3203395742","https://openalex.org/W3208639589","https://openalex.org/W4221154966","https://openalex.org/W4285149123","https://openalex.org/W6631190155","https://openalex.org/W6638667902","https://openalex.org/W6719057275","https://openalex.org/W6729831399","https://openalex.org/W6739901393","https://openalex.org/W6752724743","https://openalex.org/W6766673545","https://openalex.org/W6767287485","https://openalex.org/W6769196770"],"related_works":["https://openalex.org/W2271369634","https://openalex.org/W3147472394","https://openalex.org/W2047100085","https://openalex.org/W2350550760","https://openalex.org/W578794879","https://openalex.org/W2625296515","https://openalex.org/W3137890128","https://openalex.org/W1984634519","https://openalex.org/W4245955731","https://openalex.org/W2393726419"],"abstract_inverted_index":{"Emotion":[0],"recognition":[1,66],"based":[2,74],"on":[3,75,139,187],"text-audio":[4],"modalities":[5,52],"is":[6,67,95,103],"the":[7,60,76,140,156,161,178,192,196,200],"core":[8],"technology":[9],"for":[10,146],"transforming":[11],"a":[12,17,24,98,124],"graphical":[13],"user":[14,19],"interface":[15],"into":[16],"voice":[18],"interface,":[20],"and":[21,101,111,117,177],"it":[22],"plays":[23],"vital":[25],"role":[26],"in":[27,56,63,123,153],"natural":[28],"human-computer":[29],"interaction":[30],"systems.":[31],"Currently,":[32],"mainstream":[33],"multimodal":[34,64,175],"learning":[35,168],"research":[36],"has":[37],"designed":[38],"various":[39],"fusion":[40,72],"strategies":[41],"to":[42,69,109,137],"learn":[43],"intermodality":[44],"interactions":[45,176],"but":[46],"hardly":[47],"considers":[48],"that":[49,143],"not":[50],"all":[51],"play":[53],"equal":[54],"roles":[55],"emotion":[57,65],"recognition.":[58],"Therefore,":[59],"main":[61],"challenge":[62],"how":[68],"implement":[70],"effective":[71,145],"algorithms":[73],"auxiliary":[77,105],"structure.":[78],"To":[79],"address":[80],"this":[81,83],"problem,":[82],"article":[84],"proposes":[85],"an":[86,104],"adaptive":[87],"interactive":[88,121,129,134],"attention":[89,135],"network":[90],"(AIA-Net).":[91],"In":[92],"AIA-Net,":[93],"text":[94],"treated":[96],"as":[97,133],"primary":[99],"modality,":[100],"audio":[102],"modality.":[106],"AIA-Net":[107,150,172],"adapts":[108],"textual":[110,147,157],"acoustic":[112,141,162],"features":[113,142],"with":[114,160],"different":[115],"dimensions":[116],"learns":[118],"their":[119],"dynamic":[120],"relations":[122,130],"more":[125],"flexible":[126],"way.":[127],"The":[128],"are":[131,144],"encoded":[132],"weights":[136],"focus":[138],"emotional":[148,158,163,183],"representations.":[149,184],"performs":[151],"well":[152],"adaptively":[154],"assisting":[155],"representation":[159],"information.":[164],"Moreover,":[165],"multiple":[166,174],"collaborative":[167],"(co-learning)":[169],"layers":[170],"of":[171,182,195],"achieve":[173],"deep":[179],"bottom-up":[180],"evolution":[181],"Experimental":[185],"results":[186],"three":[188],"benchmark":[189],"datasets":[190],"demonstrate":[191],"great":[193],"effectiveness":[194],"proposed":[197],"method":[198],"over":[199],"state-of-the-art":[201],"methods.":[202]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":14},{"year":2024,"cited_by_count":16},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
