{"id":"https://openalex.org/W7134228070","doi":"https://doi.org/10.48550/arxiv.2603.06270","title":"HiPP-Prune: Hierarchical Preference-Conditioned Structured Pruning for Vision-Language Models","display_name":"HiPP-Prune: Hierarchical Preference-Conditioned Structured Pruning for Vision-Language Models","publication_year":2026,"publication_date":"2026-03-06","ids":{"openalex":"https://openalex.org/W7134228070","doi":"https://doi.org/10.48550/arxiv.2603.06270"},"language":"en","primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.06270","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128393563","display_name":"Lincen Bai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bai, Lincen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107633038","display_name":"Hedi Tabia","orcid":"https://orcid.org/0000-0002-1827-7150"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tabia, Hedi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5124004944","display_name":"Raul Santos-Rodriguez","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Santos-Rodriguez, Raul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9254999756813049,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9254999756813049,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.017400000244379044,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.013500000350177288,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5990999937057495},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.5115000009536743},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4124999940395355},{"id":"https://openalex.org/keywords/budget-constraint","display_name":"Budget constraint","score":0.31049999594688416},{"id":"https://openalex.org/keywords/conditional-independence","display_name":"Conditional independence","score":0.2892000079154968},{"id":"https://openalex.org/keywords/proxy","display_name":"Proxy (statistics)","score":0.288100004196167}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7365999817848206},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5990999937057495},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5568000078201294},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5526999831199646},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.5115000009536743},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4124999940395355},{"id":"https://openalex.org/C8505890","wikidata":"https://www.wikidata.org/wiki/Q605095","display_name":"Budget constraint","level":2,"score":0.31049999594688416},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.29109999537467957},{"id":"https://openalex.org/C79772020","wikidata":"https://www.wikidata.org/wiki/Q5159264","display_name":"Conditional independence","level":2,"score":0.2892000079154968},{"id":"https://openalex.org/C2780148112","wikidata":"https://www.wikidata.org/wiki/Q1432581","display_name":"Proxy (statistics)","level":2,"score":0.288100004196167},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.27480000257492065},{"id":"https://openalex.org/C144986985","wikidata":"https://www.wikidata.org/wiki/Q871236","display_name":"Hierarchical database model","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.263700008392334},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.2614000141620636},{"id":"https://openalex.org/C10347200","wikidata":"https://www.wikidata.org/wiki/Q1960297","display_name":"Hindsight bias","level":2,"score":0.2567000091075897}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.06270","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"pmh:oai:HAL:hal-05551618v1","is_oa":false,"landing_page_url":"https://hal.science/hal-05551618","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2026","raw_type":"Preprints, Working Papers, ..."},{"id":"doi:10.48550/arxiv.2603.06270","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.06270","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.06270","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Pruning":[0],"vision-language":[1],"models":[2],"(VLMs)":[3],"for":[4,85],"efficient":[5],"deployment":[6],"is":[7],"challenging":[8],"because":[9],"compression":[10],"can":[11],"affect":[12],"not":[13],"only":[14],"task":[15,134],"utility":[16],"but":[17],"also":[18],"visual":[19,94],"grounding,":[20],"often":[21],"amplifying":[22],"object":[23],"hallucinations":[24],"even":[25],"at":[26],"the":[27],"same":[28],"sparsity":[29,69,174],"level.":[30],"We":[31,117],"present":[32],"HiPP-Prune,":[33],"a":[34,54,59,72,79,93,129,141],"hierarchical":[35],"preference-conditioned":[36],"structured":[37],"pruning":[38,42,61,119,165],"framework":[39],"that":[40,113,132,160],"treats":[41],"as":[43],"conditional":[44],"resource":[45],"allocation":[46],"under":[47,128,172],"multiple":[48],"objectives.":[49],"HiPP-Prune":[50,161],"makes":[51],"plan-level":[52,122],"decisions:":[53],"single":[55],"policy":[56,90],"invocation":[57],"outputs":[58],"global":[60],"blueprint":[62],"by":[63],"factorizing":[64],"decisions":[65],"into":[66],"an":[67],"overall":[68],"budget":[70],"and":[71,104,140,157,167],"layer-wise":[73],"allocation,":[74],"enabling":[75],"queryable":[76],"trade-offs":[77,171],"via":[78],"user-specified":[80],"preference":[81],"vector.":[82],"To":[83],"account":[84],"VLM-specific":[86],"failure":[87],"modes,":[88],"our":[89],"state":[91],"integrates":[92],"sensitivity":[95],"signal":[96],"derived":[97],"from":[98],"attention":[99],"flow":[100],"between":[101],"vision":[102],"tokens":[103],"language":[105],"hidden":[106],"states,":[107],"discouraging":[108],"over-pruning":[109],"of":[110],"vision-critical":[111],"layers":[112],"facilitate":[114],"cross-modal":[115],"fusion.":[116],"optimize":[118],"plans":[120,166],"with":[121,155],"Group":[123],"Relative":[124],"Policy":[125],"Optimization":[126],"(GRPO)":[127],"multi-objective":[130],"return":[131],"combines":[133],"utility,":[135],"hallucination":[136],"robustness":[137],"(POPE),":[138],"compression,":[139],"synaptic-flow-inspired":[142],"stability":[143],"proxy":[144],"to":[145],"reduce":[146],"unproductive":[147],"exploration":[148],"in":[149],"high-sparsity":[150],"regimes.":[151],"Experiments":[152],"on":[153],"LLaVA":[154],"POPE":[156],"ScienceQA":[158],"demonstrate":[159],"discovers":[162],"diverse":[163],"non-dominated":[164],"provides":[168],"controllable":[169],"robustness--utility":[170],"matched":[173],"budgets.":[175]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-10T00:00:00"}
