{"id":"https://openalex.org/W4415193100","doi":"https://doi.org/10.1109/iccv51701.2025.00288","title":"Fewer Denoising Steps or Cheaper Per-Step Inference: Towards Compute-Optimal Diffusion Model Deployment","display_name":"Fewer Denoising Steps or Cheaper Per-Step Inference: Towards Compute-Optimal Diffusion Model Deployment","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4415193100","doi":"https://doi.org/10.1109/iccv51701.2025.00288"},"language":"en","primary_location":{"id":"doi:10.1109/iccv51701.2025.00288","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.00288","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2508.06160","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079778367","display_name":"Zhenbang Du","orcid":"https://orcid.org/0000-0002-1386-8381"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhenbang Du","raw_affiliation_strings":["Georgia Institute of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061572132","display_name":"Yonggan Fu","orcid":"https://orcid.org/0000-0002-7483-2921"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yonggan Fu","raw_affiliation_strings":["Georgia Institute of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076449077","display_name":"Lifu Wang","orcid":"https://orcid.org/0000-0002-3206-4928"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lifu Wang","raw_affiliation_strings":["Georgia Institute of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077756951","display_name":"Jiayi Qian","orcid":"https://orcid.org/0000-0002-7112-9931"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiayi Qian","raw_affiliation_strings":["Georgia Institute of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038978057","display_name":"Xiao Luo","orcid":"https://orcid.org/0000-0002-3649-9785"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiao Luo","raw_affiliation_strings":["Georgia Institute of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"last","author":{"id":null,"display_name":"Yingyan Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yingyan Lin","raw_affiliation_strings":["Georgia Institute of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology","institution_ids":["https://openalex.org/I130701444"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I130701444"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.2053528,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"3001","last_page":"3010"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9648000001907349,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9648000001907349,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12603","display_name":"NMR spectroscopy and applications","score":0.9136000275611877,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.6826000213623047},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.6349999904632568},{"id":"https://openalex.org/keywords/reuse","display_name":"Reuse","score":0.6043999791145325},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4415000081062317},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.4316999912261963},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.4049000144004822},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.3950999975204468}],"concepts":[{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.6826000213623047},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6801999807357788},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.6349999904632568},{"id":"https://openalex.org/C206588197","wikidata":"https://www.wikidata.org/wiki/Q846574","display_name":"Reuse","level":2,"score":0.6043999791145325},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4415000081062317},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.4316999912261963},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.4049000144004822},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.3950999975204468},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3474000096321106},{"id":"https://openalex.org/C30814859","wikidata":"https://www.wikidata.org/wiki/Q4119603","display_name":"Video denoising","level":5,"score":0.3357999920845032},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31360000371932983},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.31200000643730164},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.3068000078201294},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2937999963760376},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.27459999918937683},{"id":"https://openalex.org/C57691317","wikidata":"https://www.wikidata.org/wiki/Q1289248","display_name":"Scalar (mathematics)","level":2,"score":0.2565999925136566},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.25290000438690186}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iccv51701.2025.00288","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.00288","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2508.06160","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.06160","pdf_url":"https://arxiv.org/pdf/2508.06160","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2508.06160","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2508.06160","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2508.06160","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.06160","pdf_url":"https://arxiv.org/pdf/2508.06160","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3406327847","display_name":null,"funder_award_id":"2016727,2048183","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Diffusion":[0],"models":[1,108],"have":[2],"shown":[3],"remarkable":[4],"success":[5],"across":[6,67,169],"generative":[7],"tasks,":[8],"yet":[9],"their":[10],"high":[11],"computational":[12],"demands":[13],"challenge":[14],"deployment":[15],"on":[16,135],"resource-limited":[17],"platforms.":[18],"This":[19],"paper":[20],"investigates":[21],"a":[22,31,50,101,121,130,161],"critical":[23],"question":[24],"for":[25,104],"compute-optimal":[26],"diffusion":[27,107,189],"model":[28,71],"deployment:":[29],"Under":[30],"post-training":[32,90,122],"setting":[33],"without":[34],"fine-tuning,":[35],"is":[36,205,218],"it":[37],"more":[38,72,79,92,207],"effective":[39,208],"to":[40,48,74,166,193],"reduce":[41],"the":[42,56,62,65,70,83,114,125,136,156,184,211],"number":[43,57,212],"of":[44,58,64,187,213],"denoising":[45,59,80,132,144,170,214],"steps":[46,60,81,145],"or":[47],"use":[49],"cheaper":[51],"per-step":[52,202],"inference?":[53],"Intuitively,":[54],"reducing":[55,110,139,201,210],"increases":[61],"variability":[63],"distributions":[66],"steps,":[68],"making":[69,89],"sensitive":[73],"compression.":[75],"In":[76],"contrast,":[77],"keeping":[78],"makes":[82],"differences":[84],"smaller,":[85],"preserving":[86],"redundancy,":[87],"and":[88,117,150,174,191],"compression":[91],"feasible.":[93],"To":[94],"systematically":[95],"examine":[96],"this,":[97],"we":[98,128,159],"propose":[99,129],"PostDiff,":[100],"training-free":[102],"framework":[103],"accelerating":[105],"pre-trained":[106],"by":[109],"redundancy":[111],"at":[112,220],"both":[113],"input":[115,126],"level":[116,119],"module":[118,157,163],"in":[120,142],"manner.":[123],"At":[124,155],"level,":[127,158],"mixed-resolution":[131],"scheme":[133],"based":[134],"insight":[137],"that":[138,178],"generation":[140,153,199],"resolution":[141],"early":[143],"can":[146,181],"enhance":[147],"low-frequency":[148],"components":[149],"improve":[151,183],"final":[152],"fidelity.":[154],"employ":[160],"hybrid":[162],"caching":[164],"strategy":[165],"reuse":[167],"computations":[168],"steps.":[171,215],"Extensive":[172],"experiments":[173],"ablation":[175],"studies":[176],"demonstrate":[177],"(1)":[179],"PostDiff":[180],"significantly":[182],"fidelity-efficiency":[185],"trade-off":[186],"state-of-the-art":[188],"models,":[190],"(2)":[192],"boost":[194],"efficiency":[195],"while":[196],"maintaining":[197],"decent":[198],"fidelity,":[200],"inference":[203],"cost":[204],"often":[206],"than":[209],"Our":[216],"code":[217],"available":[219],"https://github.com/GATECH-EIC/PostDiff.":[221]},"counts_by_year":[],"updated_date":"2026-07-01T08:55:40.977307","created_date":"2025-10-15T00:00:00"}
