{"id":"https://openalex.org/W7125930945","doi":"https://doi.org/10.1109/smc58881.2025.11343481","title":"Revisiting Multi-Modal Alignment: In Distribution View","display_name":"Revisiting Multi-Modal Alignment: In Distribution View","publication_year":2025,"publication_date":"2025-10-05","ids":{"openalex":"https://openalex.org/W7125930945","doi":"https://doi.org/10.1109/smc58881.2025.11343481"},"language":null,"primary_location":{"id":"doi:10.1109/smc58881.2025.11343481","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11343481","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5104263476","display_name":"Weikai Li","orcid":null},"institutions":[{"id":"https://openalex.org/I63371133","display_name":"Chongqing Jiaotong University","ror":"https://ror.org/01t001k65","country_code":"CN","type":"education","lineage":["https://openalex.org/I63371133"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weikai Li","raw_affiliation_strings":["Chongqing Jiaotong University,School of Mathematics and Statistics,Chongqing,China,400074"],"affiliations":[{"raw_affiliation_string":"Chongqing Jiaotong University,School of Mathematics and Statistics,Chongqing,China,400074","institution_ids":["https://openalex.org/I63371133"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123774305","display_name":"Nan Tian","orcid":null},"institutions":[{"id":"https://openalex.org/I63371133","display_name":"Chongqing Jiaotong University","ror":"https://ror.org/01t001k65","country_code":"CN","type":"education","lineage":["https://openalex.org/I63371133"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nan Tian","raw_affiliation_strings":["Chongqing Jiaotong University,School of Mathematics and Statistics,Chongqing,China,400074"],"affiliations":[{"raw_affiliation_string":"Chongqing Jiaotong University,School of Mathematics and Statistics,Chongqing,China,400074","institution_ids":["https://openalex.org/I63371133"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101768855","display_name":"Yuan Li","orcid":"https://orcid.org/0000-0001-6824-4122"},"institutions":[{"id":"https://openalex.org/I4210109416","display_name":"Anhui Science and Technology University","ror":"https://ror.org/01pn91c28","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210109416"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuan Li","raw_affiliation_strings":["China Science IntelliCloud Technology, Co., Ltd.,Anhui,China,230000"],"affiliations":[{"raw_affiliation_string":"China Science IntelliCloud Technology, Co., Ltd.,Anhui,China,230000","institution_ids":["https://openalex.org/I4210109416"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5124103484","display_name":"Ying Tang","orcid":null},"institutions":[{"id":"https://openalex.org/I44265643","display_name":"Rowan University","ror":"https://ror.org/049v69k10","country_code":"US","type":"education","lineage":["https://openalex.org/I44265643"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ying Tang","raw_affiliation_strings":["Rowan University,Department of Electrical and Computer Engineering,Glassboro,NJ,USA,08028"],"affiliations":[{"raw_affiliation_string":"Rowan University,Department of Electrical and Computer Engineering,Glassboro,NJ,USA,08028","institution_ids":["https://openalex.org/I44265643"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5104263476"],"corresponding_institution_ids":["https://openalex.org/I63371133"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.68628188,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"6325","last_page":"6330"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.30880001187324524,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.30880001187324524,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.1647000014781952,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.11810000240802765,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/covariance","display_name":"Covariance","score":0.7073000073432922},{"id":"https://openalex.org/keywords/outlier","display_name":"Outlier","score":0.6937999725341797},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.492900013923645},{"id":"https://openalex.org/keywords/vulnerability","display_name":"Vulnerability (computing)","score":0.4643999934196472},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.3995000123977661},{"id":"https://openalex.org/keywords/distribution","display_name":"Distribution (mathematics)","score":0.3833000063896179},{"id":"https://openalex.org/keywords/probability-distribution","display_name":"Probability distribution","score":0.3785000145435333},{"id":"https://openalex.org/keywords/statistical-model","display_name":"Statistical model","score":0.37229999899864197},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.33550000190734863}],"concepts":[{"id":"https://openalex.org/C178650346","wikidata":"https://www.wikidata.org/wiki/Q201984","display_name":"Covariance","level":2,"score":0.7073000073432922},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.6937999725341797},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5622000098228455},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.492900013923645},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4677000045776367},{"id":"https://openalex.org/C95713431","wikidata":"https://www.wikidata.org/wiki/Q631425","display_name":"Vulnerability (computing)","level":2,"score":0.4643999934196472},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40639999508857727},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.3995000123977661},{"id":"https://openalex.org/C110121322","wikidata":"https://www.wikidata.org/wiki/Q865811","display_name":"Distribution (mathematics)","level":2,"score":0.3833000063896179},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.3785000145435333},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.37229999899864197},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.33550000190734863},{"id":"https://openalex.org/C2986587452","wikidata":"https://www.wikidata.org/wiki/Q938438","display_name":"Statistical analysis","level":2,"score":0.31790000200271606},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.31130000948905945},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.30160000920295715},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.2994999885559082},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2976999878883362},{"id":"https://openalex.org/C180877172","wikidata":"https://www.wikidata.org/wiki/Q5401390","display_name":"Estimation of covariance matrices","level":3,"score":0.2935999929904938},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.29170000553131104},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.28299999237060547},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.2809000015258789},{"id":"https://openalex.org/C32230216","wikidata":"https://www.wikidata.org/wiki/Q7882499","display_name":"Uncertainty quantification","level":2,"score":0.273499995470047},{"id":"https://openalex.org/C148043351","wikidata":"https://www.wikidata.org/wiki/Q4456944","display_name":"Current (fluid)","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C137250428","wikidata":"https://www.wikidata.org/wiki/Q5178897","display_name":"Covariance function","level":3,"score":0.2630999982357025},{"id":"https://openalex.org/C119340705","wikidata":"https://www.wikidata.org/wiki/Q1628597","display_name":"Analysis of covariance","level":2,"score":0.26269999146461487},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.26159998774528503},{"id":"https://openalex.org/C2776289891","wikidata":"https://www.wikidata.org/wiki/Q1931511","display_name":"Neglect","level":2,"score":0.2565000057220459},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.2563000023365021},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2558000087738037},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.25429999828338623},{"id":"https://openalex.org/C2983787585","wikidata":"https://www.wikidata.org/wiki/Q93586","display_name":"Feature matching","level":3,"score":0.25429999828338623},{"id":"https://openalex.org/C185142706","wikidata":"https://www.wikidata.org/wiki/Q1134404","display_name":"Covariance matrix","level":2,"score":0.2533000111579895},{"id":"https://openalex.org/C96608239","wikidata":"https://www.wikidata.org/wiki/Q1199823","display_name":"Statistical power","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/smc58881.2025.11343481","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc58881.2025.11343481","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320324805","display_name":"Chongqing Municipal Education Commission","ror":"https://ror.org/031nm5713"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W12634471","https://openalex.org/W1977295328","https://openalex.org/W2017814585","https://openalex.org/W2047643928","https://openalex.org/W2108598243","https://openalex.org/W2138011018","https://openalex.org/W2155904486","https://openalex.org/W2533598788","https://openalex.org/W2964194231","https://openalex.org/W2964288524","https://openalex.org/W3035524453","https://openalex.org/W3198377975","https://openalex.org/W4312956471","https://openalex.org/W4386071547","https://openalex.org/W4390660439","https://openalex.org/W4390872745","https://openalex.org/W4402704633","https://openalex.org/W4402727764","https://openalex.org/W4402753597","https://openalex.org/W4402754214","https://openalex.org/W4403726563","https://openalex.org/W4404612908","https://openalex.org/W4413146712","https://openalex.org/W4413147831","https://openalex.org/W4415798716"],"related_works":[],"abstract_inverted_index":{"Current":[0],"Multi-Modal":[1],"Large":[2],"language":[3],"Models":[4],"(MMLMs)":[5],"primarily":[6],"rely":[7],"on":[8,97],"instance-level":[9],"feature":[10],"statistics":[11],"for":[12,80,120],"cross-modal":[13,53,81,121],"alignment.":[14,63,82],"However,":[15],"they":[16],"commonly":[17],"suffer":[18],"three":[19],"inherent":[20],"limitations":[21,37],"including":[22],"vulnerability":[23],"to":[24],"outlier":[25],"perturbations,":[26],"neglect":[27],"of":[28,49,85,92,112],"inter-feature":[29],"covariance":[30],"structures,":[31],"and":[32],"local":[33],"optimum":[34],"trapping.":[35],"These":[36],"stem":[38],"from":[39],"a":[40],"critical":[41,110],"oversight\u2014existing":[42],"approaches":[43],"disregard":[44],"the":[45,90,109],"global":[46],"statistical":[47],"structure":[48],"multi-modal":[50],"data,":[51],"treating":[52],"alignment":[54,58,79,114],"as":[55],"isolated":[56],"feature-level":[57],"rather":[59],"than":[60],"systematic":[61],"distribution-level":[62,78,113],"To":[64],"address":[65],"these":[66],"issues,":[67],"this":[68],"paper":[69],"proposes":[70],"Layer-wise":[71],"Covariance":[72],"Alignment":[73],"(LCA),":[74],"which":[75],"first":[76],"leverages":[77],"The":[83],"effectiveness":[84],"LCA":[86],"is":[87],"validated":[88],"through":[89],"use":[91],"parameter-efficient":[93],"Low-Rank":[94],"Adaptation":[95],"(LoRA)":[96],"CLIP":[98],"architectures.":[99],"Experimental":[100],"validation":[101],"across":[102],"eight":[103],"benchmarks":[104],"demonstrates":[105],"state-of-the-art":[106],"performance,":[107],"confirming":[108],"role":[111],"in":[115],"overcoming":[116],"sample-level":[117],"optimization":[118],"constraints":[119],"learning.":[122]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2026-01-29T00:00:00"}
