{"id":"https://openalex.org/W4414693319","doi":"https://doi.org/10.1109/tpami.2025.3616854","title":"CAIT: Triple-Win <u>C</u> ompression Toward High <u>A</u> ccuracy, Fast <u>I</u> nference, and Favorable <u>T</u> ransferability for ViTs","display_name":"CAIT: Triple-Win <u>C</u> ompression Toward High <u>A</u> ccuracy, Fast <u>I</u> nference, and Favorable <u>T</u> ransferability for ViTs","publication_year":2025,"publication_date":"2025-10-01","ids":{"openalex":"https://openalex.org/W4414693319","doi":"https://doi.org/10.1109/tpami.2025.3616854","pmid":"https://pubmed.ncbi.nlm.nih.gov/41032537"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2025.3616854","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3616854","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086294753","display_name":"Ao Wang","orcid":"https://orcid.org/0000-0003-0030-551X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ao Wang","raw_affiliation_strings":["BNRist, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"BNRist, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100334231","display_name":"Hui Chen","orcid":"https://orcid.org/0000-0003-4180-5801"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hui Chen","raw_affiliation_strings":["BNRist, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"BNRist, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077882811","display_name":"Zijia Lin","orcid":"https://orcid.org/0000-0002-1390-7424"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zijia Lin","raw_affiliation_strings":["School of Software, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Software, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051149140","display_name":"Sicheng Zhao","orcid":"https://orcid.org/0000-0001-5843-6411"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sicheng Zhao","raw_affiliation_strings":["BNRist, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"BNRist, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046605531","display_name":"Jungong Han","orcid":"https://orcid.org/0000-0003-4361-956X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jungong Han","raw_affiliation_strings":["Department of Automation, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Automation, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057732142","display_name":"Guiguang Ding","orcid":"https://orcid.org/0000-0003-0137-9975"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guiguang Ding","raw_affiliation_strings":["BNRist, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"BNRist, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5086294753"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":2.3568,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.91251655,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"48","issue":"2","first_page":"1373","last_page":"1389"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.7664999961853027,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.7664999961853027,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11032","display_name":"VLSI and Analog Circuit Testing","score":0.7275999784469604,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.6766999959945679,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.6953999996185303},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6047999858856201},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.4690000116825104},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4657999873161316},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.430400013923645},{"id":"https://openalex.org/keywords/spatial-analysis","display_name":"Spatial analysis","score":0.3910999894142151},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.36230000853538513},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.3257000148296356}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8256000280380249},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.6953999996185303},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6047999858856201},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.524399995803833},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4690000116825104},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4657999873161316},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.430400013923645},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.3910999894142151},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.36230000853538513},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3402999937534332},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3257000148296356},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3257000148296356},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2978000044822693},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.29179999232292175},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2888999879360199},{"id":"https://openalex.org/C13481523","wikidata":"https://www.wikidata.org/wiki/Q412438","display_name":"Image compression","level":4,"score":0.27059999108314514},{"id":"https://openalex.org/C5339829","wikidata":"https://www.wikidata.org/wiki/Q1425977","display_name":"Machine vision","level":2,"score":0.2680000066757202},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2671000063419342},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.2637999951839447},{"id":"https://openalex.org/C147764199","wikidata":"https://www.wikidata.org/wiki/Q6865248","display_name":"Minification","level":2,"score":0.2630999982357025},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.262800008058548},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.26080000400543213},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2531000077724457},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.2506999969482422}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2025.3616854","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3616854","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:41032537","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41032537","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2365988345","display_name":null,"funder_award_id":"62525103","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G338250432","display_name":null,"funder_award_id":"62441235","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4144755178","display_name":null,"funder_award_id":"62571294","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5950249341","display_name":null,"funder_award_id":"624B2082","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G826746073","display_name":null,"funder_award_id":"62271281","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":65,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W1935978687","https://openalex.org/W2008359794","https://openalex.org/W2108598243","https://openalex.org/W2737258237","https://openalex.org/W2804047627","https://openalex.org/W2807961551","https://openalex.org/W2808168148","https://openalex.org/W2884822772","https://openalex.org/W2910628332","https://openalex.org/W2928560789","https://openalex.org/W2955994610","https://openalex.org/W2963150697","https://openalex.org/W2963420272","https://openalex.org/W2989676862","https://openalex.org/W2997286550","https://openalex.org/W3035022492","https://openalex.org/W3121523901","https://openalex.org/W3131500599","https://openalex.org/W3138516171","https://openalex.org/W3151130473","https://openalex.org/W3159481202","https://openalex.org/W3165924482","https://openalex.org/W3170841864","https://openalex.org/W3171125843","https://openalex.org/W3171516518","https://openalex.org/W3172801447","https://openalex.org/W3172942063","https://openalex.org/W3188427387","https://openalex.org/W3193895134","https://openalex.org/W3216553632","https://openalex.org/W4213019189","https://openalex.org/W4214588794","https://openalex.org/W4214624153","https://openalex.org/W4214736485","https://openalex.org/W4226013274","https://openalex.org/W4226066935","https://openalex.org/W4226359564","https://openalex.org/W4283023197","https://openalex.org/W4285541168","https://openalex.org/W4293680532","https://openalex.org/W4295903508","https://openalex.org/W4312340826","https://openalex.org/W4312769570","https://openalex.org/W4312796067","https://openalex.org/W4312815172","https://openalex.org/W4312820606","https://openalex.org/W4312910119","https://openalex.org/W4312950730","https://openalex.org/W4313145913","https://openalex.org/W4313156423","https://openalex.org/W4313166619","https://openalex.org/W4319300502","https://openalex.org/W4327808545","https://openalex.org/W4366352791","https://openalex.org/W4385245566","https://openalex.org/W4386066311","https://openalex.org/W4386076539","https://openalex.org/W4386076556","https://openalex.org/W4388145401","https://openalex.org/W4388284323","https://openalex.org/W4390873017","https://openalex.org/W4390874575","https://openalex.org/W4391021637","https://openalex.org/W6902762063"],"related_works":[],"abstract_inverted_index":{"Vision":[0],"Transformers":[1],"(ViTs)":[2],"have":[3,27],"emerged":[4],"as":[5,87],"state-of-the-art":[6,202],"models":[7,74],"for":[8,20,36,101],"various":[9,205],"vision":[10,77],"tasks":[11,78],"recently.":[12],"However,":[13,38],"their":[14],"heavy":[15],"computation":[16],"costs":[17],"remain":[18],"daunting":[19],"resource-limited":[21],"devices.":[22],"To":[23,90],"address":[24],"this,":[25],"researchers":[26],"dedicated":[28],"themselves":[29],"to":[30,58,75,117,129,162,170],"compressing":[31],"redundant":[32,44,138],"information":[33,140],"in":[34,167,174],"ViTs":[35,102,179],"acceleration.":[37],"existing":[39],"approaches":[40],"generally":[41],"sparsely":[42],"drop":[43],"image":[45],"tokens":[46],"by":[47,54],"token":[48,125,139],"pruning":[49,159],"or":[50],"brutally":[51],"remove":[52],"channels":[53,166,173],"channel":[55,158],"pruning,":[56],"leading":[57],"a":[59,97,105,155],"sub-optimal":[60],"balance":[61],"between":[62],"model":[63,187],"performance":[64,203],"and":[65,114],"inference":[66,112],"speed.":[67],"Moreover,":[68],"they":[69],"struggle":[70],"when":[71],"transferring":[72],"compressed":[73],"downstream":[76,118],"that":[79,103,196],"require":[80],"the":[81,143,186],"spatial":[82,144],"structure":[83,145],"of":[84,108,146,150,178],"images,":[85],"such":[86],"semantic":[88],"segmentation.":[89],"tackle":[91],"these":[92],"issues,":[93],"we":[94,121,152],"propose":[95],"CAIT,":[96],"joint":[98],"compression":[99],"method":[100,199],"achieves":[104],"harmonious":[106],"blend":[107],"high":[109],"accuracy,":[110],"fast":[111],"speed,":[113],"favorable":[115],"transferability":[116],"tasks.":[119],"Specifically,":[120],"introduce":[122],"an":[123],"asymmetric":[124],"merging":[126],"(ATME)":[127],"strategy":[128,161],"effectively":[130],"integrate":[131],"neighboring":[132],"tokens.":[133],"It":[134],"can":[135,180,200],"successfully":[136],"compress":[137],"while":[141],"preserving":[142],"images.":[147],"On":[148],"top":[149],"it,":[151],"further":[153],"design":[154],"consistent":[156],"dynamic":[157],"(CDCP)":[160],"dynamically":[163],"prune":[164],"unimportant":[165],"ViTs.":[168,206],"Thanks":[169],"CDCP,":[171],"insignificant":[172],"multi-head":[175],"self-attention":[176],"modules":[177],"be":[181],"pruned":[182],"uniformly,":[183],"significantly":[184],"enhancing":[185],"compression.":[188],"Extensive":[189],"experiments":[190],"on":[191],"multiple":[192],"benchmark":[193],"datasets":[194],"show":[195],"our":[197],"proposed":[198],"achieve":[201],"across":[204]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-01T00:00:00"}
