{"id":"https://openalex.org/W4387698231","doi":"https://doi.org/10.1145/3607865.3613181","title":"First-order Multi-label Learning with Cross-modal Interactions for Multimodal Emotion Recognition","display_name":"First-order Multi-label Learning with Cross-modal Interactions for Multimodal Emotion Recognition","publication_year":2023,"publication_date":"2023-10-17","ids":{"openalex":"https://openalex.org/W4387698231","doi":"https://doi.org/10.1145/3607865.3613181"},"language":"en","primary_location":{"id":"doi:10.1145/3607865.3613181","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3607865.3613181","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3607865.3613181","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st International Workshop on Multimodal and Responsible Affective Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3607865.3613181","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004864776","display_name":"Yunrui Cai","orcid":"https://orcid.org/0009-0009-4431-2886"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yunrui Cai","raw_affiliation_strings":["Tsinghua University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0009-0009-4431-2886","affiliations":[{"raw_affiliation_string":"Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055370974","display_name":"Jingran Xie","orcid":"https://orcid.org/0009-0007-2050-263X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingran Xie","raw_affiliation_strings":["Tsinghua University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0009-0007-2050-263X","affiliations":[{"raw_affiliation_string":"Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025022632","display_name":"Boshi Tang","orcid":"https://orcid.org/0009-0007-6786-4806"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Boshi Tang","raw_affiliation_strings":["Tsinghua University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0009-0007-6786-4806","affiliations":[{"raw_affiliation_string":"Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031375380","display_name":"Yuanyuan Wang","orcid":"https://orcid.org/0009-0005-8766-3118"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanyuan Wang","raw_affiliation_strings":["Tsinghua University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0009-0005-8766-3118","affiliations":[{"raw_affiliation_string":"Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100450139","display_name":"Jun Chen","orcid":"https://orcid.org/0000-0001-7201-1989"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Chen","raw_affiliation_strings":["Tsinghua University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-7201-1989","affiliations":[{"raw_affiliation_string":"Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102788950","display_name":"Haiwei Xue","orcid":"https://orcid.org/0000-0001-7318-9682"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haiwei Xue","raw_affiliation_strings":["Tsinghua University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-7318-9682","affiliations":[{"raw_affiliation_string":"Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102869280","display_name":"Zhiyong Wu","orcid":"https://orcid.org/0000-0001-8533-0524"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Wu","raw_affiliation_strings":["Tsinghua University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-8533-0524","affiliations":[{"raw_affiliation_string":"Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5004864776"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.1704,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.57336764,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"13","last_page":"20"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.74979567527771},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6706880927085876},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6644818186759949},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6098648309707642},{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.5048502087593079},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4637598991394043},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.45672377943992615},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.44544944167137146},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.41905325651168823},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3761371970176697},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09792327880859375}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.74979567527771},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6706880927085876},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6644818186759949},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6098648309707642},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.5048502087593079},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4637598991394043},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.45672377943992615},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.44544944167137146},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.41905325651168823},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3761371970176697},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09792327880859375},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3607865.3613181","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3607865.3613181","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3607865.3613181","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st International Workshop on Multimodal and Responsible Affective Computing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3607865.3613181","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3607865.3613181","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3607865.3613181","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 1st International Workshop on Multimodal and Responsible Affective Computing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2603945996","display_name":null,"funder_award_id":"62076144","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387698231.pdf","grobid_xml":"https://content.openalex.org/works/W4387698231.grobid-xml"},"referenced_works_count":30,"referenced_works":["https://openalex.org/W1998839399","https://openalex.org/W2041616772","https://openalex.org/W2114315281","https://openalex.org/W2123217057","https://openalex.org/W2156935079","https://openalex.org/W2194775991","https://openalex.org/W2584561145","https://openalex.org/W2738672149","https://openalex.org/W2789758093","https://openalex.org/W2803098682","https://openalex.org/W2947476638","https://openalex.org/W2963104701","https://openalex.org/W3169320628","https://openalex.org/W3176382883","https://openalex.org/W3179103990","https://openalex.org/W3185864054","https://openalex.org/W3206603478","https://openalex.org/W3206842948","https://openalex.org/W3207379732","https://openalex.org/W4235788770","https://openalex.org/W4287119707","https://openalex.org/W4297510543","https://openalex.org/W6600721412","https://openalex.org/W6649806852","https://openalex.org/W6677222910","https://openalex.org/W6677758222","https://openalex.org/W6678975374","https://openalex.org/W6739901393","https://openalex.org/W6755182888","https://openalex.org/W6779740423"],"related_works":["https://openalex.org/W3000097931","https://openalex.org/W2354322770","https://openalex.org/W4237547500","https://openalex.org/W1570848052","https://openalex.org/W2373192430","https://openalex.org/W4239268388","https://openalex.org/W4243305035","https://openalex.org/W1537496349","https://openalex.org/W2379407973","https://openalex.org/W2350267540"],"abstract_inverted_index":{"Multimodal":[0,131],"emotion":[1],"recognition":[2],"(MER)":[3],"is":[4,24],"essential":[5],"for":[6],"the":[7,41,52,103,106,116,119,123,127,140,150,156],"machine":[8],"to":[9,27,80,101,113],"fully":[10],"understand":[11],"human":[12],"intentions.":[13],"Various":[14],"deep":[15],"neural":[16],"network":[17],"based":[18,64],"models":[19],"are":[20],"proposed":[21,124,145],"but":[22],"it":[23],"still":[25],"challenging":[26],"better":[28],"model":[29,63],"and":[30,68,71,84],"fuse":[31],"multimodal":[32,61],"features.":[33],"In":[34,55],"addition,":[35],"recent":[36],"studies":[37],"have":[38],"focused":[39],"on":[40,65,126,155],"classification":[42],"task":[43],"of":[44,51,77,95,105,118,130,143,153],"predicting":[45],"discrete":[46,82],"labels,":[47],"while":[48],"lacking":[49],"consideration":[50],"dimension":[53,85],"value.":[54],"this":[56],"paper,":[57],"we":[58,109],"propose":[59,90],"a":[60,73,91],"fusion":[62],"Transformer":[66],"architecture":[67],"cross-modal":[69],"interactions,":[70],"adopt":[72],"multi-label":[74],"learning":[75,93,112],"algorithm":[76],"first-order":[78],"strategy":[79],"predict":[81],"labels":[83],"values":[86],"respectively.":[87],"We":[88,121],"also":[89],"semi-supervised":[92],"method":[94,125],"moment":[96],"injection":[97],"with":[98],"unlabeled":[99],"data":[100],"enhance":[102],"robustness":[104],"model.":[107,120],"Finally,":[108],"use":[110],"ensemble":[111],"further":[114],"improve":[115],"performance":[117,142],"evaluate":[122],"MER-MULTI":[128],"sub-challenge":[129],"Emotion":[132],"Recognition":[133],"Challenge":[134],"(MER":[135],"2023).":[136],"Experimental":[137],"results":[138],"demonstrate":[139],"promising":[141],"our":[144],"method,":[146],"which":[147],"can":[148],"achieve":[149],"evaluation":[151],"metric":[152],"0.6765":[154],"test":[157],"set.":[158]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
