{"id":"https://openalex.org/W4415708829","doi":"https://doi.org/10.1109/icme59968.2025.11210029","title":"Multimodal Conversatioal Emotion Analysis with Robustness to Incomplete Modality Details","display_name":"Multimodal Conversatioal Emotion Analysis with Robustness to Incomplete Modality Details","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4415708829","doi":"https://doi.org/10.1109/icme59968.2025.11210029"},"language":null,"primary_location":{"id":"doi:10.1109/icme59968.2025.11210029","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11210029","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078148438","display_name":"Sidharth Anand","orcid":"https://orcid.org/0000-0001-5750-6860"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sidharth Anand","raw_affiliation_strings":["The State University of New York,Buffalo,NY,USA"],"affiliations":[{"raw_affiliation_string":"The State University of New York,Buffalo,NY,USA","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025882712","display_name":"Chaitanya Sai Chandu Yendru","orcid":null},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chaitanya Sai Chandu Yendru","raw_affiliation_strings":["The State University of New York,Buffalo,NY,USA"],"affiliations":[{"raw_affiliation_string":"The State University of New York,Buffalo,NY,USA","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102791840","display_name":"Sreyasee Das Bhattacharjee","orcid":"https://orcid.org/0000-0001-5393-0840"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sreyasee Das Bhattacharjee","raw_affiliation_strings":["The State University of New York,Buffalo,NY,USA"],"affiliations":[{"raw_affiliation_string":"The State University of New York,Buffalo,NY,USA","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085245110","display_name":"Junsong Yuan","orcid":"https://orcid.org/0000-0002-7901-8793"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Junsong Yuan","raw_affiliation_strings":["The State University of New York,Buffalo,NY,USA"],"affiliations":[{"raw_affiliation_string":"The State University of New York,Buffalo,NY,USA","institution_ids":["https://openalex.org/I63190737"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5078148438"],"corresponding_institution_ids":["https://openalex.org/I63190737"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.34408708,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.988099992275238,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.988099992275238,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.004699999932199717,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.000699999975040555,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7208999991416931},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.7116000056266785},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5432000160217285},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.5062000155448914},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.3935000002384186},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.37700000405311584},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.37059998512268066}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7732999920845032},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7208999991416931},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.7116000056266785},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5432000160217285},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5246000289916992},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.5062000155448914},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4034000039100647},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.3935000002384186},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.37700000405311584},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.37059998512268066},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.3481000065803528},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.34119999408721924},{"id":"https://openalex.org/C71611378","wikidata":"https://www.wikidata.org/wiki/Q5165191","display_name":"Contextual design","level":3,"score":0.3165000081062317},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.30649998784065247},{"id":"https://openalex.org/C113336015","wikidata":"https://www.wikidata.org/wiki/Q574010","display_name":"Complete information","level":2,"score":0.29409998655319214},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.28839999437332153},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.2872999906539917},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.2718000113964081},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2603999972343445},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.25679999589920044},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2531999945640564}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme59968.2025.11210029","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11210029","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1595942023","https://openalex.org/W2146334809","https://openalex.org/W2546919788","https://openalex.org/W2593116425","https://openalex.org/W2963686995","https://openalex.org/W2963710346","https://openalex.org/W2997258743","https://openalex.org/W3098556456","https://openalex.org/W3120680448","https://openalex.org/W4221147459","https://openalex.org/W4281701185","https://openalex.org/W4312619379","https://openalex.org/W4312706447","https://openalex.org/W4312866014","https://openalex.org/W4313531231","https://openalex.org/W4321022102","https://openalex.org/W4360930863","https://openalex.org/W4385570058","https://openalex.org/W4385573848","https://openalex.org/W4386057714","https://openalex.org/W4386071994","https://openalex.org/W4387967914","https://openalex.org/W4391558025","https://openalex.org/W4393146934","https://openalex.org/W4394862741","https://openalex.org/W4404781709","https://openalex.org/W4411245083"],"related_works":[],"abstract_inverted_index":{"Emotion":[0],"recognition\u2019s":[1],"efficacy":[2],"for":[3],"individual":[4],"and":[5,18,172,185,222],"group":[6],"conversations":[7],"hinges":[8],"upon":[9],"integrating":[10],"data":[11,26],"from":[12],"diverse":[13],"modalities":[14,54,100,209],"(e.g.,":[15],"text,":[16],"audio,":[17],"video).":[19],"However,":[20],"the":[21,30,50,55,75,166,196,232],"intrinsic":[22],"heterogeneity":[23],"of":[24,52,86,99,115,136,175,231],"these":[25],"sources,":[27],"coupled":[28],"with":[29,132,207],"interpersonal":[31],"contextual":[32],"influences":[33],"in":[34,80,113,191],"groups,":[35],"present":[36,102],"significant":[37],"challenges":[38],"to":[39,73,130,155,168,195,213,227],"accurately":[40],"identifying":[41],"emotion.":[42],"Furthermore,":[43],"during":[44,103],"inference":[45],"most":[46],"applications":[47],"cannot":[48],"guarantee":[49],"presence":[51,114],"all":[53],"model":[56,167],"was":[57],"trained":[58],"on.":[59],"Towards":[60],"this,":[61],"we":[62],"propose":[63],"Missing":[64],"Information":[65],"robust":[66],"Joint":[67],"Transformer":[68],"(MIJoT),":[69],"which":[70,89,217],"is":[71,101],"designed":[72],"capture":[74],"extensive":[76],"cross-modal":[77],"spatio-temporal":[78],"context":[79],"a":[81,84,92,96,133,143,152],"dialogue.":[82],"Unlike":[83],"majority":[85],"existing":[87,214],"works,":[88],"rely":[90],"on":[91,151,158],"fundamental":[93],"assumption":[94],"that":[95,147],"full":[97],"set":[98],"inference,":[104],"MIJoT\u2019s":[105],"Masked":[106],"Mode-specific":[107],"Data":[108],"Modelling":[109],"ensures":[110],"consistent":[111],"performance":[112,157,188,212],"partial":[116,228],"modality":[117,138],"details.":[118],"By":[119],"enabling":[120],"powerful":[121],"masked":[122],"modeling":[123],"pretraining,":[124],"MIJoT":[125,206],"delivers":[126],"an":[127,181],"impressive":[128],"ability":[129],"deal":[131],"wide":[134],"range":[135],"incomplete":[137,208],"scenarios.":[139],"We":[140],"also":[141],"utilize":[142],"Contrastive":[144],"Imbalance":[145],"Loss":[146],"maximizes":[148],"inter-class":[149],"distance":[150],"high-dimensional":[153],"hyper-sphere,":[154],"improve":[156],"minority":[159],"classes.":[160],"An":[161],"effective":[162],"multimodal":[163],"fusion":[164],"enables":[165],"analyze":[169],"both":[170],"utterances":[171],"dialogue":[173],"(sequence":[174],"utterances)":[176],"between":[177],"multiple":[178],"people":[179],"within":[180],"integrated":[182],"computation":[183],"framework":[184],"deliver":[186],"superior":[187],"(4-12%)":[189],"improvement":[190],"weighted-F1":[192],"scores)":[193],"compared":[194],"current":[197],"best-performing":[198],"methods":[199],"across":[200],"several":[201],"large-scale":[202],"public":[203],"datasets.":[204],"Additionally,":[205],"report":[210],"comparable":[211],"state-of-the-art":[215],"techniques":[216],"use":[218],"complete":[219],"multi-mode":[220],"information,":[221],"thereby":[223],"demonstrate":[224],"its":[225],"robustness":[226],"mode":[229],"information":[230],"queries.":[233]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-30T00:00:00"}
