{"id":"https://openalex.org/W4415428974","doi":"https://doi.org/10.3233/faia250834","title":"GCQ-ViT: Group-Aware Collaborative Post-Training Quantization for Vision Transformers","display_name":"GCQ-ViT: Group-Aware Collaborative Post-Training Quantization for Vision Transformers","publication_year":2025,"publication_date":"2025-10-21","ids":{"openalex":"https://openalex.org/W4415428974","doi":"https://doi.org/10.3233/faia250834"},"language":null,"primary_location":{"id":"doi:10.3233/faia250834","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia250834","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.3233/faia250834","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112112665","display_name":"Peng Pan","orcid":"https://orcid.org/0009-0003-8351-4671"},"institutions":[{"id":"https://openalex.org/I189210763","display_name":"Yunnan University","ror":"https://ror.org/0040axw97","country_code":"CN","type":"education","lineage":["https://openalex.org/I189210763"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Pan Peng","raw_affiliation_strings":["School of Software and AI, Yunnan University, Kunming, China"],"affiliations":[{"raw_affiliation_string":"School of Software and AI, Yunnan University, Kunming, China","institution_ids":["https://openalex.org/I189210763"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060805967","display_name":"Wenbin Guo","orcid":"https://orcid.org/0000-0002-7341-9203"},"institutions":[{"id":"https://openalex.org/I189210763","display_name":"Yunnan University","ror":"https://ror.org/0040axw97","country_code":"CN","type":"education","lineage":["https://openalex.org/I189210763"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenbin Guo","raw_affiliation_strings":["School of Software and AI, Yunnan University, Kunming, China"],"affiliations":[{"raw_affiliation_string":"School of Software and AI, Yunnan University, Kunming, China","institution_ids":["https://openalex.org/I189210763"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113987537","display_name":"Wei Ping","orcid":"https://orcid.org/0000-0002-8852-6618"},"institutions":[{"id":"https://openalex.org/I189210763","display_name":"Yunnan University","ror":"https://ror.org/0040axw97","country_code":"CN","type":"education","lineage":["https://openalex.org/I189210763"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ping Wei","raw_affiliation_strings":["School of Software and AI, Yunnan University, Kunming, China"],"affiliations":[{"raw_affiliation_string":"School of Software and AI, Yunnan University, Kunming, China","institution_ids":["https://openalex.org/I189210763"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005510423","display_name":"Wei Zhou","orcid":"https://orcid.org/0000-0001-5956-0684"},"institutions":[{"id":"https://openalex.org/I189210763","display_name":"Yunnan University","ror":"https://ror.org/0040axw97","country_code":"CN","type":"education","lineage":["https://openalex.org/I189210763"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Zhou","raw_affiliation_strings":["School of Software and AI, Yunnan University, Kunming, China"],"affiliations":[{"raw_affiliation_string":"School of Software and AI, Yunnan University, Kunming, China","institution_ids":["https://openalex.org/I189210763"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5112112665"],"corresponding_institution_ids":["https://openalex.org/I189210763"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.67205584,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9825000166893005,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9825000166893005,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.9753000140190125,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9151999950408936,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.7554000020027161},{"id":"https://openalex.org/keywords/vector-quantization","display_name":"Vector quantization","score":0.4417000114917755},{"id":"https://openalex.org/keywords/histogram","display_name":"Histogram","score":0.3662000000476837},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.350600004196167},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.34200000762939453},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.3334999978542328},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.32589998841285706},{"id":"https://openalex.org/keywords/mura","display_name":"Mura","score":0.29739999771118164}],"concepts":[{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.7554000020027161},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6287000179290771},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4650000035762787},{"id":"https://openalex.org/C199833920","wikidata":"https://www.wikidata.org/wiki/Q612536","display_name":"Vector quantization","level":2,"score":0.4417000114917755},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3732999861240387},{"id":"https://openalex.org/C53533937","wikidata":"https://www.wikidata.org/wiki/Q185020","display_name":"Histogram","level":3,"score":0.3662000000476837},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3634999990463257},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.350600004196167},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.34200000762939453},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.3334999978542328},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.32589998841285706},{"id":"https://openalex.org/C2776147852","wikidata":"https://www.wikidata.org/wiki/Q6937160","display_name":"Mura","level":3,"score":0.29739999771118164},{"id":"https://openalex.org/C58166","wikidata":"https://www.wikidata.org/wiki/Q224821","display_name":"Fuzzy logic","level":2,"score":0.29330000281333923},{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.2800000011920929},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.27090001106262207},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.2671000063419342},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.2671000063419342},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2612999975681305},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.260699987411499},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.2563000023365021},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.2556000053882599},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.2547999918460846}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/faia250834","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia250834","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.3233/faia250834","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia250834","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Post-training":[0],"quantization":[1,25,59,106,153],"(PTQ)":[2],"is":[3],"widely":[4],"utilized":[5],"in":[6,29,35,136],"Vision":[7],"Transformers":[8],"(ViTs)":[9],"for":[10,54,192],"its":[11],"computational":[12],"efficiency":[13,93],"and":[14,92,130,175],"retraining":[15],"elimination.":[16],"However,":[17],"the":[18,39,46,80,90,183],"unique":[19],"architecture":[20],"of":[21,42,49,67,94,139],"ViTs":[22],"introduces":[23],"significant":[24],"challenges.":[26],"Dynamic":[27],"fluctuations":[28],"channel":[30,156],"activations,":[31],"particularly":[32],"post-LayerNorm,":[33],"result":[34],"distributional":[36,110],"mismatches.":[37],"Additionally,":[38,142],"heavy-tailed":[40],"nature":[41],"post-Softmax":[43,140],"activations":[44],"compromises":[45],"accurate":[47],"representation":[48,135],"critical":[50],"attention":[51],"regions,":[52],"vital":[53],"ViT":[55,95,193],"performance.":[56],"Moreover,":[57],"weight":[58],"at":[60],"low":[61],"bit-widths":[62],"leads":[63],"to":[64,108,133,151],"a":[65,101,121,145,159,189],"loss":[66],"structural":[68],"information,":[69],"degrading":[70],"global":[71],"feature":[72,166],"representation.":[73],"To":[74],"address":[75],"these":[76],"challenges,":[77],"we":[78,143],"introduce":[79],"Group-aware":[81],"Collaborative":[82],"Quantization":[83],"framework":[84,99],"(GCQ-ViT),":[85],"which":[86],"significantly":[87],"improves":[88],"both":[89],"accuracy":[91],"quantization.":[96,194],"The":[97],"GCQ-ViT":[98,181],"integrates":[100],"novel":[102],"dynamic":[103,146],"perception":[104],"grouping":[105],"mechanism":[107],"ensure":[109],"consistency":[111],"within":[112],"groups,":[113],"thus":[114],"reducing":[115],"hardware":[116],"expense.":[117],"It":[118],"also":[119],"utilizes":[120],"self-adaptive":[122],"displaced":[123],"uniform":[124],"log2":[125],"quantizer,":[126],"optimizing":[127],"shift":[128],"factors":[129],"nonlinear":[131],"intervals":[132],"enhance":[134],"high-density":[137],"regions":[138],"activations.":[141],"propose":[144],"dimension-aware":[147],"error":[148],"compensation":[149,162],"method":[150],"correct":[152],"errors":[154],"across":[155],"dimensions":[157],"using":[158],"residual":[160],"mean":[161],"skill,":[163],"ensuring":[164],"robust":[165],"preservation.":[167],"Extensive":[168],"experiments":[169],"on":[170],"image":[171],"classification,":[172],"object":[173],"detection,":[174],"instance":[176],"segmentation":[177],"tasks":[178],"demonstrate":[179],"that":[180],"outperforms":[182],"current":[184],"leading":[185],"PTQ":[186],"methods,":[187],"setting":[188],"new":[190],"benchmark":[191]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-24T00:00:00"}
