{"id":"https://openalex.org/W4386075505","doi":"https://doi.org/10.1109/cvpr52729.2023.02318","title":"MixPHM: Redundancy-Aware Parameter-Efficient Tuning for Low-Resource Visual Question Answering","display_name":"MixPHM: Redundancy-Aware Parameter-Efficient Tuning for Low-Resource Visual Question Answering","publication_year":2023,"publication_date":"2023-06-01","ids":{"openalex":"https://openalex.org/W4386075505","doi":"https://doi.org/10.1109/cvpr52729.2023.02318"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr52729.2023.02318","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52729.2023.02318","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101477192","display_name":"Jingjing Jiang","orcid":"https://orcid.org/0000-0002-8241-4877"},"institutions":[{"id":"https://openalex.org/I4210105595","display_name":"Institute of Art","ror":"https://ror.org/017fyx225","country_code":"PL","type":"facility","lineage":["https://openalex.org/I4210105595","https://openalex.org/I99542240"]}],"countries":["PL"],"is_corresponding":true,"raw_author_name":"Jingjing Jiang","raw_affiliation_strings":["Institute of Artificial Intelligence and Robotics, Xi&#x0027;an Jiaotong University"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence and Robotics, Xi&#x0027;an Jiaotong University","institution_ids":["https://openalex.org/I4210105595"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047405956","display_name":"Nanning Zheng","orcid":"https://orcid.org/0000-0003-1608-8257"},"institutions":[{"id":"https://openalex.org/I4210105595","display_name":"Institute of Art","ror":"https://ror.org/017fyx225","country_code":"PL","type":"facility","lineage":["https://openalex.org/I4210105595","https://openalex.org/I99542240"]}],"countries":["PL"],"is_corresponding":false,"raw_author_name":"Nanning Zheng","raw_affiliation_strings":["Institute of Artificial Intelligence and Robotics, Xi&#x0027;an Jiaotong University"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence and Robotics, Xi&#x0027;an Jiaotong University","institution_ids":["https://openalex.org/I4210105595"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5101477192"],"corresponding_institution_ids":["https://openalex.org/I4210105595"],"apc_list":null,"apc_paid":null,"fwci":2.4597,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.91089962,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"24203","last_page":"24213"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8016939759254456},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.7587201595306396},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.7493190765380859},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5250741839408875},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5072171688079834},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.47121232748031616},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.45550537109375},{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.4481639862060547},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.34918850660324097},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3200390338897705},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.10743710398674011}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8016939759254456},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.7587201595306396},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.7493190765380859},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5250741839408875},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5072171688079834},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.47121232748031616},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.45550537109375},{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.4481639862060547},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34918850660324097},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3200390338897705},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.10743710398674011},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvpr52729.2023.02318","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52729.2023.02318","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8","score":0.49000000953674316}],"awards":[{"id":"https://openalex.org/G3833898155","display_name":null,"funder_award_id":"62088102","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":100,"referenced_works":["https://openalex.org/W1933349210","https://openalex.org/W2009284521","https://openalex.org/W2560730294","https://openalex.org/W2887997457","https://openalex.org/W2947312908","https://openalex.org/W2963518342","https://openalex.org/W2964184826","https://openalex.org/W2964303773","https://openalex.org/W2970231061","https://openalex.org/W3035688398","https://openalex.org/W3040573126","https://openalex.org/W3092642435","https://openalex.org/W3094491777","https://openalex.org/W3120074043","https://openalex.org/W3126337491","https://openalex.org/W3126792443","https://openalex.org/W3130089296","https://openalex.org/W3143320354","https://openalex.org/W3147874613","https://openalex.org/W3153675281","https://openalex.org/W3164972323","https://openalex.org/W3167118264","https://openalex.org/W3168867926","https://openalex.org/W3170796112","https://openalex.org/W3173220247","https://openalex.org/W3173777717","https://openalex.org/W3173788106","https://openalex.org/W3174770825","https://openalex.org/W3176693010","https://openalex.org/W3176828726","https://openalex.org/W3184735396","https://openalex.org/W3184784418","https://openalex.org/W3193402170","https://openalex.org/W3196642073","https://openalex.org/W3199693760","https://openalex.org/W3205949070","https://openalex.org/W3205972749","https://openalex.org/W3206816211","https://openalex.org/W3207493267","https://openalex.org/W3214685499","https://openalex.org/W4200634402","https://openalex.org/W4205991051","https://openalex.org/W4206178588","https://openalex.org/W4221155125","https://openalex.org/W4221160818","https://openalex.org/W4226052861","https://openalex.org/W4226182655","https://openalex.org/W4226375166","https://openalex.org/W4281633595","https://openalex.org/W4286856918","https://openalex.org/W4287113019","https://openalex.org/W4287121196","https://openalex.org/W4287122891","https://openalex.org/W4287391717","https://openalex.org/W4292779060","https://openalex.org/W4293718192","https://openalex.org/W4312238277","https://openalex.org/W4312563428","https://openalex.org/W4312784228","https://openalex.org/W4312884055","https://openalex.org/W4385572073","https://openalex.org/W4385573610","https://openalex.org/W4386212021","https://openalex.org/W6732520560","https://openalex.org/W6754278344","https://openalex.org/W6759579507","https://openalex.org/W6777155081","https://openalex.org/W6778883912","https://openalex.org/W6779473860","https://openalex.org/W6780805062","https://openalex.org/W6784001418","https://openalex.org/W6788237939","https://openalex.org/W6788811087","https://openalex.org/W6789753369","https://openalex.org/W6789909235","https://openalex.org/W6790003725","https://openalex.org/W6790019176","https://openalex.org/W6791404205","https://openalex.org/W6793102544","https://openalex.org/W6795933390","https://openalex.org/W6796159650","https://openalex.org/W6796487566","https://openalex.org/W6796710205","https://openalex.org/W6796854725","https://openalex.org/W6797716411","https://openalex.org/W6798805250","https://openalex.org/W6800139874","https://openalex.org/W6800480908","https://openalex.org/W6802290083","https://openalex.org/W6802744804","https://openalex.org/W6804095316","https://openalex.org/W6804126242","https://openalex.org/W6805239564","https://openalex.org/W6810127701","https://openalex.org/W6810471247","https://openalex.org/W6810921705","https://openalex.org/W6811013733","https://openalex.org/W6811138465","https://openalex.org/W6839015040","https://openalex.org/W6843742964"],"related_works":["https://openalex.org/W4362597605","https://openalex.org/W1574414179","https://openalex.org/W4297676672","https://openalex.org/W3009056573","https://openalex.org/W2922073769","https://openalex.org/W4281702477","https://openalex.org/W2490526372","https://openalex.org/W4376166922","https://openalex.org/W4378510483","https://openalex.org/W4221142204"],"abstract_inverted_index":{"Recently,":[0],"finetuning":[1,79],"pretrained":[2],"vision-language":[3],"models":[4],"(VLMs)":[5],"has":[6],"been":[7],"a":[8,37,58,71,86,94,106],"prevailing":[9],"paradigm":[10],"for":[11,36],"achieving":[12],"state-of-the-art":[13,160],"performance":[14,60],"in":[15,40,80,93,105],"VQA.":[16,82],"However,":[17],"as":[18],"VLMs":[19],"scale,":[20],"it":[21],"becomes":[22],"computationally":[23],"expensive,":[24],"storage":[25],"inefficient,":[26],"and":[27,109,116,149,163],"prone":[28],"to":[29,135],"overfitting":[30],"when":[31],"tuning":[32,46,74],"full":[33,63,78,170],"model":[34],"parameters":[35],"specific":[38],"task":[39],"low-resource":[41,81,153],"settings.":[42],"Although":[43],"current":[44],"parameter-efficient":[45,73,161],"methods":[47,162],"dramatically":[48],"reduce":[49,98,136],"the":[50,113,165],"number":[51],"of":[52,112,125],"tunable":[53],"parameters,":[54],"there":[55],"still":[56],"exists":[57],"significant":[59],"gap":[61],"with":[62,151],"finetuning.":[64,171],"In":[65],"this":[66],"paper,":[67],"we":[68,101,128],"propose":[69,129],"MixPHM,":[70],"redundancy-aware":[72],"method":[75],"that":[76,156],"outperforms":[77,159],"Specifically,":[83],"MixPHM":[84,134,158],"is":[85,164],"lightweight":[87],"module":[88],"implemented":[89],"by":[90],"multiple":[91],"PHM-experts":[92],"mixture-of-experts":[95],"manner.":[96],"To":[97],"parameter":[99],"redundancy,":[100,127],"reparameterize":[102],"expert":[103],"weights":[104,114],"low-rank":[107],"subspace":[108],"share":[110],"part":[111],"inside":[115],"across":[117],"MixPHM.":[118],"Moreover,":[119],"based":[120],"on":[121,145],"our":[122,157],"quantitative":[123],"analysis":[124],"representation":[126],"Redundancy":[130],"Regularization,":[131],"which":[132],"facilitates":[133],"task-irrelevant":[137],"redundancy":[138],"while":[139],"promoting":[140],"task-relevant":[141],"correlation.":[142],"Experiments":[143],"conducted":[144],"VQA":[146],"v2,":[147],"GQA,":[148],"OK-VQA":[150],"different":[152],"settings":[154],"show":[155],"only":[166],"one":[167],"consistently":[168],"surpassing":[169]},"counts_by_year":[{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":8},{"year":2023,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
