{"id":"https://openalex.org/W7130684282","doi":"https://doi.org/10.48550/arxiv.2602.17196","title":"EntropyPrune: Matrix Entropy Guided Visual Token Pruning for Multimodal Large Language Models","display_name":"EntropyPrune: Matrix Entropy Guided Visual Token Pruning for Multimodal Large Language Models","publication_year":2026,"publication_date":"2026-02-19","ids":{"openalex":"https://openalex.org/W7130684282","doi":"https://doi.org/10.48550/arxiv.2602.17196"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.17196","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.17196","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.17196","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126494083","display_name":"Yahong Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Yahong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103268881","display_name":"Jiande Wu","orcid":"https://orcid.org/0000-0003-2780-4925"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Juncheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032273272","display_name":"Zhangkai Ni","orcid":"https://orcid.org/0000-0003-3682-6288"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ni, Zhangkai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126465263","display_name":"Chengmei Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Chengmei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126515235","display_name":"Yihang Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yihang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085584344","display_name":"Longzhen Yang","orcid":"https://orcid.org/0000-0002-5791-145X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Longzhen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126447215","display_name":"Yuyin Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Yuyin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126479282","display_name":"Ying Wen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen, Ying","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"He, Lianghua","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Lianghua","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5126494083"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8718000054359436,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8718000054359436,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.048500001430511475,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.017799999564886093,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.6995000243186951},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.5625},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.526199996471405},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.47440001368522644},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4731999933719635},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.45010000467300415},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.44510000944137573},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4431000053882599}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7904999852180481},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.6995000243186951},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.5625},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5457000136375427},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.526199996471405},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5206999778747559},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.47440001368522644},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4731999933719635},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.45010000467300415},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.44510000944137573},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4431000053882599},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.4196000099182129},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.39820000529289246},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.39719998836517334},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.35109999775886536},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.2921999990940094},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.28200000524520874},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.2718000113964081},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.2655999958515167},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.25290000438690186}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.17196","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.17196","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.17196","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.17196","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multimodal":[0],"large":[1],"language":[2],"models":[3],"(MLLMs)":[4],"incur":[5],"substantial":[6],"inference":[7],"cost":[8],"due":[9],"to":[10,33,124,146,191],"the":[11,70,89,107,130,138,184,197],"processing":[12],"of":[13,15,73,110,133,140,183],"hundreds":[14],"visual":[16,74,112],"tokens":[17,113],"per":[18],"image.":[19],"Although":[20],"token":[21,102],"pruning":[22,90,103,163],"has":[23],"proven":[24],"effective":[25],"for":[26,87],"accelerating":[27],"inference,":[28],"determining":[29],"when":[30],"and":[31,50,62,79,114,143,168,193,200],"where":[32,69],"prune":[34],"remains":[35],"largely":[36],"heuristic.":[37],"Existing":[38],"approaches":[39],"typically":[40],"rely":[41],"on":[42,93,120,153],"static,":[43],"empirically":[44],"selected":[45],"layers,":[46],"which":[47,82],"limit":[48],"interpretability":[49],"transferability":[51],"across":[52],"models.":[53],"In":[54],"this":[55,94],"work,":[56],"we":[57,96,128],"introduce":[58],"a":[59,77,84,99,147,175],"matrix-entropy":[60],"perspective":[61],"identify":[63],"an":[64],"\"Entropy":[65],"Collapse":[66],"Layer\"":[67],"(ECL),":[68],"information":[71,108],"content":[72],"representations":[75],"exhibits":[76],"sharp":[78],"consistent":[80],"drop,":[81],"provides":[83],"principled":[85],"criterion":[86],"selecting":[88],"stage.":[91],"Building":[92],"observation,":[95],"propose":[97],"EntropyPrune,":[98],"novel":[100],"matrix-entropy-guided":[101],"framework":[104],"that":[105,158],"quantifies":[106],"value":[109],"individual":[111],"prunes":[115],"redundant":[116],"ones":[117],"without":[118],"relying":[119],"attention":[121],"maps.":[122],"Moreover,":[123],"enable":[125],"efficient":[126],"computation,":[127],"exploit":[129],"spectral":[131],"equivalence":[132],"dual":[134],"Gram":[135],"matrices,":[136],"reducing":[137],"complexity":[139],"entropy":[141],"computation":[142],"yielding":[144],"up":[145],"64x":[148],"theoretical":[149],"speedup.":[150],"Extensive":[151],"experiments":[152],"diverse":[154],"multimodal":[155],"benchmarks":[156],"demonstrate":[157],"EntropyPrune":[159,188],"consistently":[160],"outperforms":[161],"state-of-the-art":[162],"methods":[164],"in":[165,178,202],"both":[166],"accuracy":[167],"efficiency.":[169],"On":[170],"LLaVA-1.5-7B,":[171],"our":[172],"method":[173],"achieves":[174],"68.2%":[176],"reduction":[177],"FLOPs":[179],"while":[180],"preserving":[181],"96.0%":[182],"original":[185],"performance.":[186],"Furthermore,":[187],"generalizes":[189],"effectively":[190],"high-resolution":[192],"video-based":[194],"models,":[195],"highlighting":[196],"strong":[198],"robustness":[199],"scalability":[201],"practical":[203],"MLLM":[204],"acceleration.":[205],"The":[206],"code":[207],"will":[208],"be":[209],"publicly":[210],"available":[211],"at":[212],"https://github.com/YahongWang1/EntropyPrune.":[213]},"counts_by_year":[],"updated_date":"2026-03-25T23:56:10.502304","created_date":"2026-02-21T00:00:00"}
