{"id":"https://openalex.org/W4414427347","doi":"https://doi.org/10.1109/iccv51701.2025.02123","title":"Task-Specific Zero-Shot Quantization-Aware Training for Object Detection","display_name":"Task-Specific Zero-Shot Quantization-Aware Training for Object Detection","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4414427347","doi":"https://doi.org/10.1109/iccv51701.2025.02123"},"language":"en","primary_location":{"id":"doi:10.1109/iccv51701.2025.02123","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.02123","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2507.16782","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001748944","display_name":"C. Li","orcid":"https://orcid.org/0000-0003-0850-8987"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Changhao Li","raw_affiliation_strings":["School of Computational Science and Engineering, Georgia Institute of Technology,Atlanta,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computational Science and Engineering, Georgia Institute of Technology,Atlanta,USA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046671377","display_name":"Xinrui Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I3131625388","display_name":"University Town of Shenzhen","ror":"https://ror.org/05f5j6225","country_code":"CN","type":"education","lineage":["https://openalex.org/I3131625388"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinrui Chen","raw_affiliation_strings":["Shenzhen International Graduate School, Tsinghua University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shenzhen International Graduate School, Tsinghua University,China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009827642","display_name":"Ji Wang","orcid":"https://orcid.org/0000-0002-4536-6044"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ji Wang","raw_affiliation_strings":["School of Software, Tsinghua University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Software, Tsinghua University,China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039040895","display_name":"Kang Zhao","orcid":"https://orcid.org/0000-0003-4767-6561"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kang Zhao","raw_affiliation_strings":["Institute for AI, Tsinghua-Bosch Joint ML Center, Tsinghua University,Dept. of Comp. Sci. and Tech.,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for AI, Tsinghua-Bosch Joint ML Center, Tsinghua University,Dept. of Comp. Sci. and Tech.,Beijing,China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055874248","display_name":"Jianfei Chen","orcid":"https://orcid.org/0000-0001-9291-5926"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianfei Chen","raw_affiliation_strings":["Institute for AI, Tsinghua-Bosch Joint ML Center, Tsinghua University,Dept. of Comp. Sci. and Tech.,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for AI, Tsinghua-Bosch Joint ML Center, Tsinghua University,Dept. of Comp. Sci. and Tech.,Beijing,China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.2150579,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"22868","last_page":"22878"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9818999767303467,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12389","display_name":"Infrared Target Detection Methodologies","score":0.9746999740600586,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.6793000102043152},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.6717000007629395},{"id":"https://openalex.org/keywords/pascal","display_name":"Pascal (unit)","score":0.6069999933242798},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4925999939441681},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.45509999990463257},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.413100004196167},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.4088999927043915},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.38040000200271606}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7527999877929688},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.6793000102043152},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.6717000007629395},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6136000156402588},{"id":"https://openalex.org/C75608658","wikidata":"https://www.wikidata.org/wiki/Q44395","display_name":"Pascal (unit)","level":2,"score":0.6069999933242798},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4925999939441681},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.45509999990463257},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.43479999899864197},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.413100004196167},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.4088999927043915},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.39079999923706055},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.38670000433921814},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.38040000200271606},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34209999442100525},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.335999995470047},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3285999894142151},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.3237000107765198},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.3125},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.30809998512268066},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.3057999908924103},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.26930001378059387},{"id":"https://openalex.org/C182521987","wikidata":"https://www.wikidata.org/wiki/Q2493877","display_name":"Viola\u2013Jones object detection framework","level":5,"score":0.25870001316070557}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iccv51701.2025.02123","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.02123","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2507.16782","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.16782","pdf_url":"https://arxiv.org/pdf/2507.16782","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2507.16782","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.16782","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2507.16782","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.16782","pdf_url":"https://arxiv.org/pdf/2507.16782","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7525196029","display_name":null,"funder_award_id":"62376131","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Quantization":[0,43],"is":[1,32,181],"a":[2,18,96,114,123],"key":[3],"technique":[4],"to":[5,27,36,67,88,121,152],"reduce":[6],"network":[7,15],"size":[8],"and":[9,117,135,166,173],"computational":[10],"complexity":[11],"by":[12,47],"representing":[13],"the":[14,56,80,128,148,154,164,171],"parameters":[16],"with":[17],"lower":[19],"precision.":[20],"Traditional":[21],"quantization":[22],"methods":[23,72],"rely":[24],"on":[25,163],"access":[26],"original":[28],"training":[29,60,146],"data,":[30],"which":[31,105],"often":[33],"restricted":[34],"due":[35],"privacy":[37],"concerns":[38],"or":[39],"security":[40],"challenges.":[41],"Zero-shot":[42],"(ZSQ)":[44],"addresses":[45],"this":[46,92],"using":[48],"synthetic":[49,76],"data":[50],"generated":[51],"from":[52,127],"pre-trained":[53,129],"models,":[54],"eliminating":[55],"need":[57],"for":[58,84,101],"real":[59],"data.":[61],"Recently,":[62],"ZSQ":[63,99],"has":[64],"been":[65],"extended":[66],"object":[68,85,102,132],"detection.":[69],"However,":[70],"existing":[71],"use":[73],"unlabeled":[74],"task-agnostic":[75],"images":[77],"that":[78],"lack":[79],"specific":[81],"information":[82],"required":[83],"detection,":[86],"leading":[87],"suboptimal":[89],"performance.":[90],"In":[91],"paper,":[93],"we":[94,112,143],"propose":[95],"novel":[97],"task-specific":[98,124,145],"framework":[100],"detection":[103,158],"networks,":[104],"consists":[106],"of":[107,156,176],"two":[108],"main":[109],"stages.":[110],"First,":[111],"introduce":[113],"bounding":[115],"box":[116],"category":[118,136],"sampling":[119],"strategy":[120],"synthesize":[122],"calibration":[125],"set":[126],"network,":[130],"reconstructing":[131],"locations,":[133],"sizes,":[134],"distributions":[137],"without":[138],"any":[139],"prior":[140],"knowledge.":[141],"Second,":[142],"integrate":[144],"into":[147],"knowledge":[149],"distillation":[150],"process":[151],"restore":[153],"performance":[155,175],"quantized":[157],"networks.":[159],"Extensive":[160],"experiments":[161],"conducted":[162],"MS-COCO":[165],"Pascal":[167],"VOC":[168],"datasets":[169],"demonstrate":[170],"efficiency":[172],"state-of-the-art":[174],"our":[177],"method.":[178],"Our":[179],"code":[180],"publicly":[182],"available":[183],"at:":[184],"https://github.com/DFQ-Dojo/dfq-toolkit":[185],".":[186]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
