{"id":"https://openalex.org/W7106708167","doi":"https://doi.org/10.48550/arxiv.2511.18751","title":"Robust Multimodal Sentiment Analysis of Image-Text Pairs by Distribution-Based Feature Recovery and Fusion","display_name":"Robust Multimodal Sentiment Analysis of Image-Text Pairs by Distribution-Based Feature Recovery and Fusion","publication_year":2025,"publication_date":"2025-11-24","ids":{"openalex":"https://openalex.org/W7106708167","doi":"https://doi.org/10.48550/arxiv.2511.18751"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2511.18751","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.18751","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2511.18751","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Wu, Daiqing","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wu, Daiqing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Yang, Dongbao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Dongbao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhou, Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Yu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Ma, Can","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Can","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9107999801635742,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9107999801635742,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.021400000900030136,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.011599999852478504,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.7644000053405762},{"id":"https://openalex.org/keywords/sentiment-analysis","display_name":"Sentiment analysis","score":0.6996999979019165},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6460999846458435},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.5799999833106995},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.5253999829292297},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.38260000944137573}],"concepts":[{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.7644000053405762},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7623999714851379},{"id":"https://openalex.org/C66402592","wikidata":"https://www.wikidata.org/wiki/Q2271421","display_name":"Sentiment analysis","level":2,"score":0.6996999979019165},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6718999743461609},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6460999846458435},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.5799999833106995},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.5253999829292297},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4334999918937683},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.38260000944137573},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3497999906539917},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3416000008583069},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3066999912261963},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.299699991941452},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.29589998722076416},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.27709999680519104},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.2732999920845032},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.2574999928474426}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2511.18751","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.18751","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2511.18751","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.18751","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.6995483040809631,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"As":[0],"posts":[1],"on":[2,128,181],"social":[3],"media":[4],"increase":[5],"rapidly,":[6],"analyzing":[7],"the":[8,38,120,129,146,169,189],"sentiments":[9],"embedded":[10],"in":[11,20,29,108,163,174,205],"image-text":[12,82,185],"pairs":[13],"has":[14],"become":[15],"a":[16,68,87,109],"popular":[17],"research":[18],"topic":[19],"recent":[21],"years.":[22],"Although":[23],"existing":[24],"works":[25],"achieve":[26],"impressive":[27],"accomplishments":[28],"simultaneously":[30,102],"harnessing":[31],"image":[32],"and":[33,43,72,105,142,159,171],"text":[34],"information,":[35],"they":[36],"lack":[37],"considerations":[39],"of":[40,61,81,192],"possible":[41],"low-quality":[42,104,113,170],"missing":[44,106,132,147,172],"modalities.":[45],"In":[46,152],"real-world":[47,176],"applications,":[48],"these":[49],"issues":[50],"might":[51],"frequently":[52],"occur,":[53],"leading":[54],"to":[55,93,119,167,195],"urgent":[56],"needs":[57],"for":[58,76,90],"models":[59],"capable":[60],"predicting":[62],"sentiment":[63,79,208],"robustly.":[64],"Therefore,":[65],"we":[66,85,100,115,134,187],"propose":[67],"Distribution-based":[69],"feature":[70,88,96],"Recovery":[71],"Fusion":[73],"(DRF)":[74],"method":[75],"robust":[77,206],"multimodal":[78,207],"analysis":[80],"pairs.":[83],"Specifically,":[84],"maintain":[86],"queue":[89],"each":[91],"modality":[92,125],"approximate":[94],"their":[95,117],"distributions,":[97,143],"through":[98],"which":[99],"can":[101],"handle":[103],"modalities":[107,148,162,173],"unified":[110],"framework.":[111],"For":[112,131],"modalities,":[114,133],"reduce":[116],"contributions":[118],"fusion":[121],"by":[122,140],"quantitatively":[123],"estimating":[124],"qualities":[126],"based":[127],"distributions.":[130],"build":[135],"inter-modal":[136],"mapping":[137],"relationships":[138],"supervised":[139],"samples":[141,164],"thereby":[144],"recovering":[145],"from":[149],"available":[150,184],"ones.":[151],"experiments,":[153],"two":[154,200],"disruption":[155],"strategies":[156],"that":[157],"corrupt":[158],"discard":[160],"some":[161],"are":[165],"adopted":[166],"mimic":[168],"various":[175],"scenarios.":[177],"Through":[178],"comprehensive":[179],"experiments":[180],"three":[182],"publicly":[183],"datasets,":[186],"demonstrate":[188],"universal":[190],"improvements":[191],"DRF":[193],"compared":[194],"SOTA":[196],"methods":[197],"under":[198],"both":[199],"strategies,":[201],"validating":[202],"its":[203],"effectiveness":[204],"analysis.":[209]},"counts_by_year":[],"updated_date":"2025-12-05T23:21:25.405358","created_date":"2025-11-27T00:00:00"}
