{"id":"https://openalex.org/W3141688548","doi":"https://doi.org/10.1109/taslp.2021.3068598","title":"Analyzing Multimodal Sentiment Via Acoustic- and Visual-LSTM With Channel-Aware Temporal Convolution Network","display_name":"Analyzing Multimodal Sentiment Via Acoustic- and Visual-LSTM With Channel-Aware Temporal Convolution Network","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3141688548","doi":"https://doi.org/10.1109/taslp.2021.3068598","mag":"3141688548"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2021.3068598","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3068598","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010270301","display_name":"Sijie Mai","orcid":"https://orcid.org/0000-0001-9763-375X"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Sijie Mai","raw_affiliation_strings":["School of Electronics and Information Technology, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Information Technology, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051867844","display_name":"Songlong Xing","orcid":"https://orcid.org/0000-0002-2734-1695"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Songlong Xing","raw_affiliation_strings":["School of Electronics and Information Technology, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Information Technology, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056953478","display_name":"Haifeng Hu","orcid":"https://orcid.org/0000-0002-4884-323X"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haifeng Hu","raw_affiliation_strings":["School of Electronics and Information Technology, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Information Technology, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5010270301"],"corresponding_institution_ids":["https://openalex.org/I157773358"],"apc_list":null,"apc_paid":null,"fwci":12.2929,"has_fulltext":false,"cited_by_count":84,"citation_normalized_percentile":{"value":0.99074589,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"29","issue":null,"first_page":"1424","last_page":"1437"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8051124811172485},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.7324830889701843},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.558853268623352},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5494120717048645},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.5081989765167236},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.4801318347454071},{"id":"https://openalex.org/keywords/multimodal-learning","display_name":"Multimodal learning","score":0.4725648760795593},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.47101888060569763},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.45102399587631226},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.4351637065410614},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.42932701110839844},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.40871667861938477},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.36348316073417664},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.2387763261795044}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8051124811172485},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.7324830889701843},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.558853268623352},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5494120717048645},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.5081989765167236},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.4801318347454071},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.4725648760795593},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.47101888060569763},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.45102399587631226},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4351637065410614},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.42932701110839844},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.40871667861938477},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.36348316073417664},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2387763261795044},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/taslp.2021.3068598","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2021.3068598","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6600000262260437}],"awards":[{"id":"https://openalex.org/G4228998522","display_name":null,"funder_award_id":"2017A030311029","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G8307738215","display_name":null,"funder_award_id":"62076262","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321921","display_name":"Natural Science Foundation of Guangdong Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":105,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1614298861","https://openalex.org/W1983364832","https://openalex.org/W1995562189","https://openalex.org/W2029996593","https://openalex.org/W2061116763","https://openalex.org/W2064675550","https://openalex.org/W2079725295","https://openalex.org/W2085662862","https://openalex.org/W2095176743","https://openalex.org/W2099355420","https://openalex.org/W2117671523","https://openalex.org/W2146334809","https://openalex.org/W2149359396","https://openalex.org/W2157331557","https://openalex.org/W2158899491","https://openalex.org/W2168465881","https://openalex.org/W2194775991","https://openalex.org/W2250539671","https://openalex.org/W2519091744","https://openalex.org/W2519656895","https://openalex.org/W2533262878","https://openalex.org/W2546919788","https://openalex.org/W2556418146","https://openalex.org/W2583643061","https://openalex.org/W2587019100","https://openalex.org/W2613904329","https://openalex.org/W2619383789","https://openalex.org/W2740550900","https://openalex.org/W2767249564","https://openalex.org/W2772633765","https://openalex.org/W2787581402","https://openalex.org/W2792764867","https://openalex.org/W2798330760","https://openalex.org/W2808359495","https://openalex.org/W2883409523","https://openalex.org/W2886193235","https://openalex.org/W2891369367","https://openalex.org/W2896457183","https://openalex.org/W2896528354","https://openalex.org/W2937484199","https://openalex.org/W2949391930","https://openalex.org/W2952230511","https://openalex.org/W2958722525","https://openalex.org/W2962718314","https://openalex.org/W2962931510","https://openalex.org/W2963016848","https://openalex.org/W2963063161","https://openalex.org/W2963128932","https://openalex.org/W2963285578","https://openalex.org/W2963317470","https://openalex.org/W2963341956","https://openalex.org/W2963403868","https://openalex.org/W2963420686","https://openalex.org/W2963685106","https://openalex.org/W2963710346","https://openalex.org/W2963840672","https://openalex.org/W2963983719","https://openalex.org/W2964010806","https://openalex.org/W2964051877","https://openalex.org/W2964059481","https://openalex.org/W2964121744","https://openalex.org/W2964158702","https://openalex.org/W2964216663","https://openalex.org/W2964265128","https://openalex.org/W2964266095","https://openalex.org/W2964286182","https://openalex.org/W2964346351","https://openalex.org/W2970309699","https://openalex.org/W2970972665","https://openalex.org/W2971004099","https://openalex.org/W2971050617","https://openalex.org/W2972460025","https://openalex.org/W2997573100","https://openalex.org/W3034897750","https://openalex.org/W3108764796","https://openalex.org/W4294555862","https://openalex.org/W4385245566","https://openalex.org/W6631190155","https://openalex.org/W6636510571","https://openalex.org/W6674902714","https://openalex.org/W6683738474","https://openalex.org/W6685562342","https://openalex.org/W6696085341","https://openalex.org/W6720905350","https://openalex.org/W6726977916","https://openalex.org/W6729014267","https://openalex.org/W6733081445","https://openalex.org/W6737778391","https://openalex.org/W6739901393","https://openalex.org/W6744073670","https://openalex.org/W6748551036","https://openalex.org/W6748726628","https://openalex.org/W6749825310","https://openalex.org/W6750417760","https://openalex.org/W6751495912","https://openalex.org/W6752724743","https://openalex.org/W6753277404","https://openalex.org/W6754823179","https://openalex.org/W6755207826","https://openalex.org/W6755868333","https://openalex.org/W6762250955","https://openalex.org/W6767287485","https://openalex.org/W6780493881","https://openalex.org/W6786244873"],"related_works":["https://openalex.org/W4283320496","https://openalex.org/W3157841754","https://openalex.org/W4381827277","https://openalex.org/W4390136517","https://openalex.org/W2895918973","https://openalex.org/W4387316634","https://openalex.org/W3167558523","https://openalex.org/W3120825179","https://openalex.org/W4285815173","https://openalex.org/W2946165673"],"abstract_inverted_index":{"The":[0],"emotion":[1,156],"of":[2,21,109],"human":[3,13],"is":[4,50,89],"always":[5],"expressed":[6],"in":[7,24,66,102],"a":[8,67,85],"multimodal":[9,12,28,152],"perspective.":[10],"Analyzing":[11],"sentiment":[14,153],"remains":[15],"challenging":[16],"due":[17],"to":[18,32,37,91,118,125,143],"the":[19,22,44,47,55,93,97,103,144],"difficulties":[20],"interpretation":[23],"inter-modality":[25,39,64],"dynamics.":[26],"Mainstream":[27],"learning":[29,106],"architectures":[30],"tend":[31],"design":[33],"various":[34],"fusion":[35],"strategies":[36],"learn":[38,63],"interactions,":[40],"which":[41],"barely":[42],"consider":[43],"fact":[45],"that":[46,135],"language":[48,75,94],"modality":[49,124],"far":[51],"more":[52],"important":[53],"than":[54],"acoustic":[56],"and":[57,72,129,155],"visual":[58],"modalities.":[59],"In":[60],"contrast,":[61],"we":[62,112],"dynamics":[65],"different":[68],"perspective":[69],"via":[70,96],"acoustic-":[71],"visual-LSTMs":[73],"where":[74],"features":[76],"play":[77],"dominant":[78],"role.":[79],"Specifically,":[80],"inside":[81],"each":[82,123],"LSTM":[83],"variant,":[84],"well-designed":[86],"gating":[87],"mechanism":[88],"introduced":[90],"enhance":[92],"representation":[95,105],"corresponding":[98],"auxiliary":[99],"modality.":[100],"Furthermore,":[101],"unimodal":[104],"stage,":[107],"instead":[108],"using":[110],"RNNs,":[111],"introduce":[113],"`channel-aware'":[114],"temporal":[115,128],"convolution":[116],"network":[117],"extract":[119],"high-level":[120],"representations":[121],"for":[122,151],"explore":[126],"both":[127],"channel-wise":[130],"interdependencies.":[131],"Extensive":[132],"experiments":[133],"demonstrate":[134],"our":[136],"approach":[137],"achieves":[138],"very":[139],"competitive":[140],"performance":[141],"compared":[142],"state-of-the-art":[145],"methods":[146],"on":[147],"three":[148],"widely-used":[149],"benchmarks":[150],"analysis":[154],"recognition.":[157]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":13},{"year":2024,"cited_by_count":19},{"year":2023,"cited_by_count":21},{"year":2022,"cited_by_count":21},{"year":2021,"cited_by_count":6}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
