{"id":"https://openalex.org/W4411635553","doi":"https://doi.org/10.1145/3731715.3733423","title":"RobustPT: Dynamic Disentanglement Prompt Tuning in Vision-Language Models with Missing Modalities","display_name":"RobustPT: Dynamic Disentanglement Prompt Tuning in Vision-Language Models with Missing Modalities","publication_year":2025,"publication_date":"2025-06-25","ids":{"openalex":"https://openalex.org/W4411635553","doi":"https://doi.org/10.1145/3731715.3733423"},"language":"en","primary_location":{"id":"doi:10.1145/3731715.3733423","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3731715.3733423","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040004253","display_name":"Ruiting Dai","orcid":"https://orcid.org/0000-0002-8944-6759"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ruiting Dai","raw_affiliation_strings":["University of Electronic Science and Technology of China, ChengDu, China"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, ChengDu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053871882","display_name":"Yuqiao Tan","orcid":"https://orcid.org/0009-0009-0693-5230"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuqiao Tan","raw_affiliation_strings":["University of Electronic Science and Technology of China, ChengDu, China"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, ChengDu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099043577","display_name":"Lisi Mo","orcid":"https://orcid.org/0009-0008-4742-4456"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lisi Mo","raw_affiliation_strings":["University of Electronic Science and Technology of China, ChengDu, China"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, ChengDu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100761497","display_name":"Tao He","orcid":"https://orcid.org/0000-0001-8676-7429"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tao He","raw_affiliation_strings":["University of Electronic Science and Technology of China, ChengDu, China"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, ChengDu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070150374","display_name":"Ke Qin","orcid":"https://orcid.org/0000-0001-6174-3877"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ke Qin","raw_affiliation_strings":["University of Electronic Science and Technology of China, ChengDu, China"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, ChengDu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016843517","display_name":"Shuang Liang","orcid":"https://orcid.org/0000-0001-7387-2801"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuang Liang","raw_affiliation_strings":["University of Electronic Science and Technology of China, ChengDu, China"],"affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, ChengDu, China","institution_ids":["https://openalex.org/I150229711"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5040004253"],"corresponding_institution_ids":["https://openalex.org/I150229711"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.12577569,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"164","last_page":"172"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.7678877711296082},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7387092113494873},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47385767102241516},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3881130814552307},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.344768226146698}],"concepts":[{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.7678877711296082},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7387092113494873},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47385767102241516},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3881130814552307},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.344768226146698},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3731715.3733423","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3731715.3733423","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7699999809265137,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[{"id":"https://openalex.org/G933148648","display_name":null,"funder_award_id":"62306064","funder_id":"https://openalex.org/F4320323817","funder_display_name":"Universitas Brawijaya"}],"funders":[{"id":"https://openalex.org/F4320323817","display_name":"Universitas Brawijaya","ror":"https://ror.org/01wk3d929"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2194775991","https://openalex.org/W2296448531","https://openalex.org/W2910191085","https://openalex.org/W2957186196","https://openalex.org/W2966683369","https://openalex.org/W2971014764","https://openalex.org/W3134912427","https://openalex.org/W3173882198","https://openalex.org/W3194841206","https://openalex.org/W3198377975","https://openalex.org/W4312310776","https://openalex.org/W4312651322","https://openalex.org/W4385782081","https://openalex.org/W4386057714","https://openalex.org/W4386071547","https://openalex.org/W4399418463","https://openalex.org/W4411631883","https://openalex.org/W6872102093"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Recently,":[0],"prompt":[1,101],"tuning":[2,102,134],"has":[3],"garnered":[4],"considerable":[5],"attention":[6],"due":[7,32],"to":[8,29,33,52,78,84,105,122,147,163],"its":[9,89],"success":[10],"across":[11,185],"various":[12],"Vision-Language":[13],"(VL)":[14],"tasks.":[15],"However,":[16],"unimodal":[17],"prompts,":[18,20],"coupled":[19],"and":[21,38,87,125,135,168],"joint":[22],"prompts":[23,139],"in":[24,35,43,145],"these":[25,48],"models":[26,58,111],"often":[27],"lead":[28],"suboptimal":[30],"performance":[31],"differences":[34],"information":[36,166],"density":[37],"complexity":[39],"between":[40],"modalities.":[41],"Particularly,":[42],"scenarios":[44],"with":[45],"missing":[46,114],"modalities,":[47],"prompt-based":[49],"approaches":[50],"tend":[51],"exacerbate":[53],"'Channel":[54],"Bias'-a":[55],"phonomenon":[56],"where":[57,138],"overly":[59],"rely":[60],"on":[61],"specific":[62],"feature":[63],"(such":[64],"as":[65],"unmissing-modal":[66],"feature)":[67],"channels":[68],"from":[69],"the":[70,75,107,182],"base":[71],"tasks,":[72],"thereby":[73],"undermining":[74],"model's":[76],"ability":[77],"capture":[79],"crucial":[80],"shared":[81],"knowledge":[82],"applicable":[83],"new":[85],"tasks":[86],"affecting":[88],"generalizability.":[90],"To":[91],"address":[92],"this":[93],"challenge,":[94],"we":[95],"propose":[96],"RobustPT,":[97],"a":[98,118,159],"dynamic":[99],"disentanglement":[100],"model":[103],"designed":[104],"enhance":[106,169],"robustness":[108],"of":[109],"VL":[110],"under":[112],"modality":[113,142],"conditions.":[115],"RobustPT":[116,129,177],"utilizes":[117],"multi-channel":[119],"prompting":[120],"mechanism":[121],"dynamically":[123],"disentangle":[124],"align":[126],"prompts.":[127],"Specifically,":[128],"is":[130],"divided":[131],"into":[132,150],"single-channel":[133],"alignment-channel":[136],"tuning,":[137],"for":[140],"each":[141],"run":[143],"independently":[144],"sequence":[146],"delve":[148],"deeply":[149],"their":[151],"intrinsic":[152],"characteristics,":[153],"followed":[154],"by":[155],"an":[156],"integration":[157],"through":[158],"non-strong":[160],"coupling":[161],"strategy":[162],"effectively":[164],"balance":[165],"contributions":[167],"overall":[170],"performance.":[171],"Extensive":[172],"experiments":[173],"demonstrate":[174],"that":[175],"our":[176],"achieve":[178],"significant":[179],"improvements":[180],"over":[181],"current":[183],"state-of-the-art":[184],"all":[186],"benchmark":[187],"datasets.":[188],"Our":[189],"codes":[190],"are":[191],"available":[192],"at":[193],"https://github.com/Trae1ounG/RobustPT.":[194]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
