{"id":"https://openalex.org/W4413147408","doi":"https://doi.org/10.1109/cvpr52734.2025.00387","title":"Data-Free Group-Wise Fully Quantized Winograd Convolution via Learnable Scales","display_name":"Data-Free Group-Wise Fully Quantized Winograd Convolution via Learnable Scales","publication_year":2025,"publication_date":"2025-06-10","ids":{"openalex":"https://openalex.org/W4413147408","doi":"https://doi.org/10.1109/cvpr52734.2025.00387"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr52734.2025.00387","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52734.2025.00387","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008056593","display_name":"Shirui Pan","orcid":"https://orcid.org/0000-0003-0794-527X"},"institutions":[{"id":"https://openalex.org/I4210156213","display_name":"American Rock Mechanics Association","ror":"https://ror.org/05vfrxy92","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210156213"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Shuokai Pan","raw_affiliation_strings":["Arm Inc"],"affiliations":[{"raw_affiliation_string":"Arm Inc","institution_ids":["https://openalex.org/I4210156213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115728504","display_name":"Gerti Tuzi","orcid":null},"institutions":[{"id":"https://openalex.org/I4210156213","display_name":"American Rock Mechanics Association","ror":"https://ror.org/05vfrxy92","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210156213"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gerti Tuzi","raw_affiliation_strings":["Arm Inc"],"affiliations":[{"raw_affiliation_string":"Arm Inc","institution_ids":["https://openalex.org/I4210156213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115728505","display_name":"Sudarshan Sreeram","orcid":null},"institutions":[{"id":"https://openalex.org/I4210156213","display_name":"American Rock Mechanics Association","ror":"https://ror.org/05vfrxy92","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210156213"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sudarshan Sreeram","raw_affiliation_strings":["Arm Inc"],"affiliations":[{"raw_affiliation_string":"Arm Inc","institution_ids":["https://openalex.org/I4210156213"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078130628","display_name":"Dibakar Gope","orcid":null},"institutions":[{"id":"https://openalex.org/I4210156213","display_name":"American Rock Mechanics Association","ror":"https://ror.org/05vfrxy92","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210156213"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dibakar Gope","raw_affiliation_strings":["Arm Inc"],"affiliations":[{"raw_affiliation_string":"Arm Inc","institution_ids":["https://openalex.org/I4210156213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5008056593"],"corresponding_institution_ids":["https://openalex.org/I4210156213"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.24133182,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4091","last_page":"4100"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9013000130653381,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9013000130653381,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.7089030146598816},{"id":"https://openalex.org/keywords/group","display_name":"Group (periodic table)","score":0.6168140769004822},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.448588103055954},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4296822249889374},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4223648011684418},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.3226620852947235},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.27002567052841187},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.13443195819854736}],"concepts":[{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.7089030146598816},{"id":"https://openalex.org/C2781311116","wikidata":"https://www.wikidata.org/wiki/Q83306","display_name":"Group (periodic table)","level":2,"score":0.6168140769004822},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.448588103055954},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4296822249889374},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4223648011684418},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.3226620852947235},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27002567052841187},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.13443195819854736},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvpr52734.2025.00387","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52734.2025.00387","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W1979597421","https://openalex.org/W2007980826","https://openalex.org/W2051487156","https://openalex.org/W2061531152","https://openalex.org/W3002753104","https://openalex.org/W2077600819","https://openalex.org/W2142036596","https://openalex.org/W2072657027","https://openalex.org/W2962838298"],"abstract_inverted_index":{"Despite":[0],"the":[1,72,88,94,114,126,142,152,161,170,177,181,201,215,232,238,258,271],"revolutionary":[2],"breakthroughs":[3],"of":[4,26,66,76,92,116,120,128,160,180,204,240,261],"large-scale":[5,109],"text-to-image":[6,212],"diffusion":[7,27,69,134,206,218,263],"models":[8,28,101,207],"for":[9,57,62,98,108,244],"complex":[10],"vision":[11],"and":[12,19,39,90,226,278,286],"downstream":[13],"tasks,":[14],"their":[15,23],"extremely":[16],"high":[17],"computational":[18],"storage":[20],"costs":[21,38],"limit":[22],"usability.":[24],"Quantization":[25],"has":[29],"been":[30],"explored":[31],"in":[32,68,122,132,156,169,229,280],"recent":[33],"works":[34],"to":[35,102,149,231,257],"reduce":[36,166],"compute":[37],"memory":[40],"bandwidth":[41],"usage.":[42],"To":[43,165],"further":[44],"improve":[45],"inference":[46],"time,":[47],"fast":[48],"convolution":[49,58,259],"algorithms":[50],"such":[51,99],"as":[52],"Winograd":[53,79,95,145,162,171,182,273,290],"can":[54,139],"be":[55],"used":[56],"layers,":[59],"which":[60],"account":[61],"a":[63,117,157,262],"significant":[64,73],"portion":[65,159],"computations":[67],"models.":[70,111,135],"However,":[71],"quality":[74,224],"loss":[75],"fully":[77,143,246],"quantized":[78,144,205,247],"using":[80,186],"existing":[81],"coarser-grained":[82],"post-training":[83],"quantization":[84,131,138],"methods,":[85],"combined":[86],"with":[87,151,220,237,289],"complexity":[89],"cost":[91],"finetuning":[93,175],"transformation":[96],"matrices":[97,184],"large":[100,118,153],"recover":[103],"quality,":[104],"makes":[105],"them":[106],"unsuitable":[107],"foundation":[110],"Motivated":[112],"by":[113,253,276],"presence":[115],"range":[119,167],"values":[121],"them,":[123],"we":[124,173],"investigate":[125],"impact":[127],"finer-grained":[129],"group-wise":[130,137,245],"quantizing":[133],"While":[136],"largely":[140],"handle":[141],"convolution,":[146],"it":[147],"struggles":[148],"deal":[150],"distribution":[154],"imbalance":[155],"sizable":[158],"domain":[163],"computation.":[164],"differences":[168],"domain,":[172],"propose":[174],"only":[176],"scale":[178],"parameters":[179],"transform":[183],"without":[185],"any":[187,198],"domain-specific":[188],"training":[189,199],"data.":[190],"Because":[191],"our":[192,268],"method":[193,269,275],"does":[194],"not":[195],"depend":[196],"on":[197,284],"data,":[200],"generalization":[202],"performance":[203],"is":[208],"safely":[209],"guaranteed.":[210],"For":[211,265],"generation":[213],"task,":[214],"8-bit":[216],"fully-quantized":[217],"model":[219],"Wino-grad":[221],"provides":[222],"near-lossless":[223],"(FID":[225],"CLIP":[227],"scores)":[228],"comparison":[230],"full-precision":[233],"model.":[234,264],"This,":[235],"coupled":[236],"development":[239],"highly":[241],"optimized":[242],"kernels":[243],"Winograd,":[248],"improves":[249],"CPU":[250],"wall-clock":[251],"time":[252],"31.3%":[254],"when":[255],"compared":[256],"layers":[260],"image":[266],"classification,":[267],"outperforms":[270],"state-of-the-art":[272],"PTQ":[274],"1.62%":[277],"2.56%":[279],"top-1":[281],"ImageNet":[282],"accuracy":[283],"ResNet-18":[285],"ResNet-34,":[287],"respectively,":[288],"F(6,":[291],"3).":[292]},"counts_by_year":[],"updated_date":"2025-12-19T19:40:27.379048","created_date":"2025-10-10T00:00:00"}
