{"id":"https://openalex.org/W4416252325","doi":"https://doi.org/10.1109/ijcnn64981.2025.11229197","title":"Efficient Framework with Pruning and Factorization for Vision Transformer","display_name":"Efficient Framework with Pruning and Factorization for Vision Transformer","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4416252325","doi":"https://doi.org/10.1109/ijcnn64981.2025.11229197"},"language":null,"primary_location":{"id":"doi:10.1109/ijcnn64981.2025.11229197","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn64981.2025.11229197","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101431252","display_name":"Yipeng Chen","orcid":"https://orcid.org/0000-0001-6281-9183"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yipeng Chen","raw_affiliation_strings":["University of Science and Technology Beijing,Collaborative Innovation Center of Steel Technology"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology Beijing,Collaborative Innovation Center of Steel Technology","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101940716","display_name":"Ke Xu","orcid":"https://orcid.org/0000-0003-1809-7413"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ke Xu","raw_affiliation_strings":["University of Science and Technology Beijing,Collaborative Innovation Center of Steel Technology"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology Beijing,Collaborative Innovation Center of Steel Technology","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009624071","display_name":"Xiaojuan Ban","orcid":"https://orcid.org/0000-0001-9142-3276"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaojuan Ban","raw_affiliation_strings":["University of Science and Technology Beijing,School of Computer and Communication Engineering"],"affiliations":[{"raw_affiliation_string":"University of Science and Technology Beijing,School of Computer and Communication Engineering","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076174605","display_name":"Jingyu Liu","orcid":"https://orcid.org/0000-0002-1646-637X"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingyu Liu","raw_affiliation_strings":["Beijing Institute of Technology,School of Medical Technology"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology,School of Medical Technology","institution_ids":["https://openalex.org/I125839683"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101431252"],"corresponding_institution_ids":["https://openalex.org/I92403157"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.36560221,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.36250001192092896,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.36250001192092896,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.17000000178813934,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.09679999947547913,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.7497000098228455},{"id":"https://openalex.org/keywords/factorization","display_name":"Factorization","score":0.5115000009536743},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.47609999775886536},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.3799999952316284},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.321399986743927},{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.3086000084877014}],"concepts":[{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.7497000098228455},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6420999765396118},{"id":"https://openalex.org/C187834632","wikidata":"https://www.wikidata.org/wiki/Q188804","display_name":"Factorization","level":2,"score":0.5115000009536743},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5037000179290771},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.48089998960494995},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.47609999775886536},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.3799999952316284},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.321399986743927},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3199000060558319},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.3086000084877014},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3061999976634979},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2824999988079071},{"id":"https://openalex.org/C86037889","wikidata":"https://www.wikidata.org/wiki/Q4330127","display_name":"Learning to rank","level":3,"score":0.25519999861717224},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.25130000710487366}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn64981.2025.11229197","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn64981.2025.11229197","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W2963363373","https://openalex.org/W2965862774","https://openalex.org/W3138516171","https://openalex.org/W3170841864","https://openalex.org/W3200980014","https://openalex.org/W4285601701","https://openalex.org/W4309125142","https://openalex.org/W4312333591","https://openalex.org/W4312412889","https://openalex.org/W4312422436","https://openalex.org/W4312677967","https://openalex.org/W4313007769","https://openalex.org/W4313069943","https://openalex.org/W4385801313","https://openalex.org/W4386065441","https://openalex.org/W4386071535","https://openalex.org/W4386072014","https://openalex.org/W4386076571","https://openalex.org/W4390873673","https://openalex.org/W4393147495","https://openalex.org/W4409366412","https://openalex.org/W4409367143","https://openalex.org/W4415798884"],"related_works":[],"abstract_inverted_index":{"Vision":[0],"Transformers":[1],"(ViTs)":[2],"have":[3],"demonstrated":[4],"impressive":[5],"performance":[6],"across":[7],"various":[8],"vision":[9],"tasks.":[10],"However,":[11],"these":[12],"models":[13],"usually":[14],"suffer":[15],"from":[16],"intensive":[17],"computational":[18],"costs":[19],"and":[20,83,93,150,165],"excessive":[21],"memory":[22],"requirements,":[23],"making":[24],"them":[25],"impractical":[26],"for":[27,102,122],"deployment.":[28],"In":[29],"this":[30,44],"paper,":[31],"we":[32,46,78,110,130],"propose":[33,79],"a":[34,80],"post-training":[35],"pruning":[36,86,117],"method":[37],"specially":[38],"tailored":[39],"to":[40,118,135],"ViTs.":[41],"To":[42],"achieve":[43],"goal,":[45],"underline":[47],"two":[48],"important":[49,97],"facts:":[50],"i)":[51],"the":[52,59,62,75,87,90,96,107,137,145,157],"importance":[53],"of":[54,61,128,147,172],"weights":[55,66,88],"heavily":[56],"relies":[57],"on":[58,168],"attributes":[60],"sample;":[63],"ii)":[64],"some":[65],"show":[67],"minor":[68],"contributions":[69],"in":[70],"feed-forward":[71],"calculation.":[72],"Motivated":[73,105],"by":[74,106],"first":[76],"observation,":[77,109],"weight":[81,98],"selection":[82],"recovery":[84],"mechanism,":[85],"with":[89,114],"lowest":[91],"score":[92],"then":[94],"recovering":[95],"via":[99],"calibration":[100],"samples":[101],"layer-wise":[103],"tuning.":[104],"second":[108],"explore":[111],"rank":[112],"values":[113],"search":[115],"space":[116],"accelerate":[119],"low-rank":[120],"factorization":[121],"more":[123],"effective":[124],"compression.":[125],"On":[126],"top":[127],"these,":[129],"further":[131],"conduct":[132],"hardware":[133],"optimization":[134],"support":[136],"pruned":[138],"models.":[139],"Promisingly,":[140],"three":[141],"designs":[142],"could":[143],"promote":[144],"effectiveness":[146],"each":[148],"other":[149],"finally":[151],"form":[152],"an":[153],"overall":[154],"framework.":[155],"Using":[156],"DeiT":[158],"benchmarks,":[159],"our":[160],"framework":[161],"achieves":[162],"competitive":[163],"acceleration":[164],"accuracy":[166],"conditioned":[167],"using":[169],"1%":[170],"data":[171],"ImageNet-1K.":[173]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-14T00:00:00"}
