{"id":"https://openalex.org/W4387814637","doi":"https://doi.org/10.1145/3606039.3613113","title":"Multimodal Sentiment Analysis via Efficient Multimodal Transformer and Modality-Aware Adaptive Training Strategy","display_name":"Multimodal Sentiment Analysis via Efficient Multimodal Transformer and Modality-Aware Adaptive Training Strategy","publication_year":2023,"publication_date":"2023-10-20","ids":{"openalex":"https://openalex.org/W4387814637","doi":"https://doi.org/10.1145/3606039.3613113"},"language":"en","primary_location":{"id":"doi:10.1145/3606039.3613113","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3606039.3613113","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 4th on Multimodal Sentiment Analysis Challenge and Workshop: Mimicked Emotions, Humour and Personalisation","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032101339","display_name":"Chaoyue Ding","orcid":"https://orcid.org/0009-0000-0161-4838"},"institutions":[{"id":"https://openalex.org/I4210128910","display_name":"Group Sense (China)","ror":"https://ror.org/036wd5777","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210128910"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chaoyue Ding","raw_affiliation_strings":["SenseTime Research, Beijing, China"],"affiliations":[{"raw_affiliation_string":"SenseTime Research, Beijing, China","institution_ids":["https://openalex.org/I4210128910"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004411500","display_name":"Daoming Zong","orcid":"https://orcid.org/0009-0004-8109-2943"},"institutions":[{"id":"https://openalex.org/I4210128910","display_name":"Group Sense (China)","ror":"https://ror.org/036wd5777","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210128910"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Daoming Zong","raw_affiliation_strings":["SenseTime Research, Beijing, China"],"affiliations":[{"raw_affiliation_string":"SenseTime Research, Beijing, China","institution_ids":["https://openalex.org/I4210128910"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003607066","display_name":"Baoxiang Li","orcid":"https://orcid.org/0009-0009-4490-2157"},"institutions":[{"id":"https://openalex.org/I4210128910","display_name":"Group Sense (China)","ror":"https://ror.org/036wd5777","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210128910"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Baoxiang Li","raw_affiliation_strings":["SenseTime Research, Beijing, China"],"affiliations":[{"raw_affiliation_string":"SenseTime Research, Beijing, China","institution_ids":["https://openalex.org/I4210128910"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061720532","display_name":"Song Zhang","orcid":"https://orcid.org/0009-0004-5856-9969"},"institutions":[{"id":"https://openalex.org/I4210128910","display_name":"Group Sense (China)","ror":"https://ror.org/036wd5777","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210128910"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Song Zhang","raw_affiliation_strings":["SenseTime Research, Beijing, China"],"affiliations":[{"raw_affiliation_string":"SenseTime Research, Beijing, China","institution_ids":["https://openalex.org/I4210128910"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056940037","display_name":"Xiaoxu Zhu","orcid":"https://orcid.org/0009-0004-3562-4507"},"institutions":[{"id":"https://openalex.org/I4210128910","display_name":"Group Sense (China)","ror":"https://ror.org/036wd5777","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210128910"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoxu Zhu","raw_affiliation_strings":["SenseTime Research, Beijing, China"],"affiliations":[{"raw_affiliation_string":"SenseTime Research, Beijing, China","institution_ids":["https://openalex.org/I4210128910"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101456431","display_name":"Guiping Zhong","orcid":"https://orcid.org/0009-0004-1530-0783"},"institutions":[{"id":"https://openalex.org/I4210128910","display_name":"Group Sense (China)","ror":"https://ror.org/036wd5777","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210128910"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guiping Zhong","raw_affiliation_strings":["SenseTime Research, Beijing, China"],"affiliations":[{"raw_affiliation_string":"SenseTime Research, Beijing, China","institution_ids":["https://openalex.org/I4210128910"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002904368","display_name":"Dinghao Zhou","orcid":"https://orcid.org/0009-0000-8519-4630"},"institutions":[{"id":"https://openalex.org/I4210128910","display_name":"Group Sense (China)","ror":"https://ror.org/036wd5777","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210128910"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dinghao Zhou","raw_affiliation_strings":["SenseTime Research, Beijing, China"],"affiliations":[{"raw_affiliation_string":"SenseTime Research, Beijing, China","institution_ids":["https://openalex.org/I4210128910"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5032101339"],"corresponding_institution_ids":["https://openalex.org/I4210128910"],"apc_list":null,"apc_paid":null,"fwci":0.5232,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.68800609,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"11","last_page":"17"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7940952181816101},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.6968938708305359},{"id":"https://openalex.org/keywords/multimodal-learning","display_name":"Multimodal learning","score":0.5965667366981506},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5913280248641968},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.5238801836967468},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5173794031143188}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7940952181816101},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.6968938708305359},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.5965667366981506},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5913280248641968},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.5238801836967468},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5173794031143188},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3606039.3613113","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3606039.3613113","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 4th on Multimodal Sentiment Analysis Challenge and Workshop: Mimicked Emotions, Humour and Personalisation","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W2003948868","https://openalex.org/W2239141610","https://openalex.org/W2341528187","https://openalex.org/W2619383789","https://openalex.org/W2742542661","https://openalex.org/W2746419079","https://openalex.org/W3011574394","https://openalex.org/W3035333188","https://openalex.org/W3036601975","https://openalex.org/W3088409176","https://openalex.org/W3094918372","https://openalex.org/W3100676321","https://openalex.org/W3101998545","https://openalex.org/W3159481202","https://openalex.org/W3179103990","https://openalex.org/W3206776536","https://openalex.org/W3209059054","https://openalex.org/W4221145199","https://openalex.org/W4224916413","https://openalex.org/W4291741556","https://openalex.org/W4297510486","https://openalex.org/W4297510548","https://openalex.org/W4297510847","https://openalex.org/W4361994820","https://openalex.org/W4376455521","https://openalex.org/W4387814874","https://openalex.org/W6784910987","https://openalex.org/W6844956273"],"related_works":["https://openalex.org/W73545470","https://openalex.org/W4224266612","https://openalex.org/W2383394264","https://openalex.org/W4320153225","https://openalex.org/W4293261942","https://openalex.org/W3125968744","https://openalex.org/W203959209","https://openalex.org/W2167701463","https://openalex.org/W2110287964","https://openalex.org/W4307407935"],"abstract_inverted_index":{"In":[0,34],"this":[1],"paper,":[2],"we":[3,37,84],"present":[4],"the":[5,8,12,23,76,124],"solution":[6],"to":[7,21,62,97],"MuSe-Mimic":[9],"subchallenge":[10],"of":[11,25,43,54,118,129,137],"4th":[13],"Multimodal":[14],"Sentiment":[15],"Analysis":[16],"Challenge.":[17],"This":[18,106],"sub-challenge":[19],"aims":[20],"predict":[22],"level":[24],"approval,":[26],"disappointment":[27],"and":[28],"uncertainty":[29],"in":[30,51,110],"user-generated":[31],"video":[32],"clips.":[33],"our":[35],"experiments,":[36],"found":[38],"that":[39],"naive":[40],"joint":[41,100],"training":[42,95,101],"multiple":[44],"modalities":[45,59],"by":[46],"late":[47],"fusion":[48],"would":[49],"result":[50,136],"insufficient":[52],"learning":[53,117],"unimodal":[55,71,119],"features.":[56,120],"Moreover,":[57],"different":[58],"contribute":[60],"differently":[61],"MuSe-Mimic.":[63],"Relying":[64],"solely":[65],"on":[66,102],"multimodal":[67,88,103],"features":[68,72],"or":[69],"treating":[70],"equally":[73],"may":[74],"limit":[75],"model's":[77],"generalization":[78],"performance.":[79],"To":[80],"address":[81],"these":[82],"challenges,":[83],"propose":[85],"an":[86],"efficient":[87],"transformer":[89],"equipped":[90],"with":[91],"a":[92],"modality-aware":[93],"adaptive":[94],"strategy":[96],"facilitate":[98],"optimal":[99],"sequence":[104],"inputs.":[105],"framework":[107],"holds":[108],"promise":[109],"leveraging":[111],"cross-modal":[112],"interactions":[113],"while":[114],"ensuring":[115],"adequate":[116],"Our":[121,139],"model":[122],"achieves":[123],"mean":[125],"Pearson's":[126],"Correlation":[127],"Coefficient":[128],".729":[130],"(ranking":[131],"2nd),":[132],"outperforming":[133],"official":[134],"baseline":[135],".473.":[138],"code":[140],"is":[141],"available":[142],"at":[143],"https://github.com/dingchaoyue/Multimodal-Emotion-Recognition-MER-and-MuSe-2023-Challenges.":[144]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
