{"id":"https://openalex.org/W3120680448","doi":"https://doi.org/10.1109/taslp.2021.3049898","title":"CTNet: Conversational Transformer Network for Emotion Recognition","display_name":"CTNet: Conversational Transformer Network for Emotion Recognition","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3120680448","doi":"https://doi.org/10.1109/taslp.2021.3049898","mag":"3120680448"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2021.3049898","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3049898","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001973434","display_name":"Zheng Lian","orcid":"https://orcid.org/0000-0001-9477-0599"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zheng Lian","raw_affiliation_strings":["National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100395562","display_name":"Bin Liu","orcid":"https://orcid.org/0000-0003-1529-1552"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Liu","raw_affiliation_strings":["National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112613657","display_name":"Jianhua Tao","orcid":"https://orcid.org/0000-0002-9344-6428"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210097554","display_name":"Center for Excellence in Brain Science and Intelligence Technology","ror":"https://ror.org/00vpwhm04","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210097554"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianhua Tao","raw_affiliation_strings":["CAS Center for Excellence in Brain Science and Intelligence Technology, Beijing, China","National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"CAS Center for Excellence in Brain Science and Intelligence Technology, Beijing, China","institution_ids":["https://openalex.org/I4210097554"]},{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5001973434"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210100255","https://openalex.org/I4210112150","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":34.1266,"has_fulltext":false,"cited_by_count":269,"citation_normalized_percentile":{"value":0.99880502,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"29","issue":null,"first_page":"985","last_page":"1000"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8065599799156189},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.6322242617607117},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6322143077850342},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6007729172706604},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.5909513831138611},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.580984354019165},{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.5564005374908447},{"id":"https://openalex.org/keywords/emotion-recognition","display_name":"Emotion recognition","score":0.504546046257019},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5035783648490906},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4973657429218292},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.08790373802185059}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8065599799156189},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.6322242617607117},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6322143077850342},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6007729172706604},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.5909513831138611},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.580984354019165},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.5564005374908447},{"id":"https://openalex.org/C2777438025","wikidata":"https://www.wikidata.org/wiki/Q1339090","display_name":"Emotion recognition","level":2,"score":0.504546046257019},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5035783648490906},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4973657429218292},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.08790373802185059},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2021.3049898","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3049898","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.699999988079071,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G5381013183","display_name":null,"funder_award_id":"61831022","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7264488544","display_name":null,"funder_award_id":"61771472","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8374701036","display_name":null,"funder_award_id":"61901473","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G953811167","display_name":null,"funder_award_id":"61773379","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":90,"referenced_works":["https://openalex.org/W22229905","https://openalex.org/W43346191","https://openalex.org/W123007118","https://openalex.org/W1524333225","https://openalex.org/W1651753422","https://openalex.org/W1663973292","https://openalex.org/W1793121960","https://openalex.org/W1973453096","https://openalex.org/W2009086942","https://openalex.org/W2041823554","https://openalex.org/W2064675550","https://openalex.org/W2085662862","https://openalex.org/W2095705004","https://openalex.org/W2097998348","https://openalex.org/W2109743529","https://openalex.org/W2114535528","https://openalex.org/W2116341502","https://openalex.org/W2117671523","https://openalex.org/W2129999749","https://openalex.org/W2138611879","https://openalex.org/W2144760012","https://openalex.org/W2146334809","https://openalex.org/W2147800946","https://openalex.org/W2148146486","https://openalex.org/W2150769028","https://openalex.org/W2150906796","https://openalex.org/W2157331557","https://openalex.org/W2194775991","https://openalex.org/W2239141610","https://openalex.org/W2314395941","https://openalex.org/W2402144811","https://openalex.org/W2404617565","https://openalex.org/W2470413457","https://openalex.org/W2523856713","https://openalex.org/W2533262878","https://openalex.org/W2608438166","https://openalex.org/W2619383789","https://openalex.org/W2740550900","https://openalex.org/W2748488820","https://openalex.org/W2749891261","https://openalex.org/W2767249564","https://openalex.org/W2772633765","https://openalex.org/W2787581402","https://openalex.org/W2805662932","https://openalex.org/W2890964092","https://openalex.org/W2891359673","https://openalex.org/W2897337310","https://openalex.org/W2937584914","https://openalex.org/W2949391930","https://openalex.org/W2951008357","https://openalex.org/W2952307697","https://openalex.org/W2953384591","https://openalex.org/W2953739332","https://openalex.org/W2962718314","https://openalex.org/W2963045354","https://openalex.org/W2963403868","https://openalex.org/W2963647655","https://openalex.org/W2963667932","https://openalex.org/W2963686995","https://openalex.org/W2963873807","https://openalex.org/W2964010806","https://openalex.org/W2964015378","https://openalex.org/W2964051877","https://openalex.org/W2964266095","https://openalex.org/W2964300796","https://openalex.org/W2964346351","https://openalex.org/W2965453734","https://openalex.org/W2966518489","https://openalex.org/W2972965453","https://openalex.org/W2985882473","https://openalex.org/W3015707499","https://openalex.org/W3205498744","https://openalex.org/W4206192903","https://openalex.org/W4297801177","https://openalex.org/W4385245566","https://openalex.org/W6601784809","https://openalex.org/W6605010638","https://openalex.org/W6631362777","https://openalex.org/W6638318767","https://openalex.org/W6674330103","https://openalex.org/W6674385629","https://openalex.org/W6681923411","https://openalex.org/W6713134421","https://openalex.org/W6726873649","https://openalex.org/W6739901393","https://openalex.org/W6748148878","https://openalex.org/W6748304040","https://openalex.org/W6748551036","https://openalex.org/W6765690761","https://openalex.org/W6780226713"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W1968552888","https://openalex.org/W2374116601","https://openalex.org/W3093134843","https://openalex.org/W1511346092","https://openalex.org/W1527532029","https://openalex.org/W2529301793","https://openalex.org/W3133700904","https://openalex.org/W3105646692","https://openalex.org/W4387914125"],"abstract_inverted_index":{"Emotion":[0],"recognition":[1,21,27],"in":[2,12,64,129],"conversation":[3],"is":[4],"a":[5,79],"crucial":[6],"topic":[7],"for":[8,83],"its":[9],"widespread":[10],"applications":[11],"the":[13,36,52,66,97,120,130,143,156,162,165],"field":[14],"of":[15,22,39,55,164],"human-computer":[16],"interactions.":[17,70],"Unlike":[18],"vanilla":[19],"emotion":[20,26,85],"individual":[23],"utterances,":[24],"conversational":[25,84,88],"requires":[28],"modeling":[29,65],"both":[30],"context-sensitive":[31,135],"and":[32,68,103,115,136,150,158],"speaker-sensitive":[33,137],"dependencies.":[34],"Despite":[35],"promising":[37],"results":[38,154],"recent":[40],"works,":[41],"they":[42,61],"generally":[43],"do":[44],"not":[45],"leverage":[46],"advanced":[47],"fusion":[48],"techniques":[49],"to":[50,73,95,100,125,133,141],"generate":[51],"multimodal":[53,80,107],"representations":[54],"an":[56,171],"utterance.":[57,131],"In":[58,71],"this":[59],"way,":[60],"have":[62],"limitations":[63],"intra-modal":[67,102],"cross-modal":[69,104],"order":[72],"address":[74],"these":[75],"problems,":[76],"we":[77,93,110,139],"propose":[78,94,140],"learning":[81],"framework":[82],"recognition,":[86],"called":[87],"transformer":[89],"network":[90],"(CTNet).":[91],"Specifically,":[92],"use":[96,142],"transformer-based":[98],"structure":[99],"model":[101,134],"interactions":[105],"among":[106],"features.":[108],"Meanwhile,":[109],"utilize":[111],"word-level":[112],"lexical":[113],"features":[114,118],"segment-level":[116],"acoustic":[117],"as":[119],"inputs,":[121],"thus":[122],"enabling":[123],"us":[124],"capture":[126],"temporal":[127],"information":[128],"Additionally,":[132],"dependencies,":[138],"multihead":[144],"attention":[145],"based":[146],"bi-directional":[147],"GRU":[148],"component":[149],"speaker":[151],"embeddings.":[152],"Experimental":[153],"on":[155,176],"IEMOCAP":[157],"MELD":[159],"datasets":[160],"demonstrate":[161],"effectiveness":[163],"proposed":[166],"method.":[167],"Our":[168],"method":[169],"shows":[170],"absolute":[172],"2.1~6.2%":[173],"performance":[174],"improvement":[175],"weighted":[177],"average":[178],"F1":[179],"over":[180],"state-of-the-art":[181],"strategies.":[182]},"counts_by_year":[{"year":2026,"cited_by_count":9},{"year":2025,"cited_by_count":74},{"year":2024,"cited_by_count":66},{"year":2023,"cited_by_count":67},{"year":2022,"cited_by_count":37},{"year":2021,"cited_by_count":16}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
