{"id":"https://openalex.org/W7110015622","doi":"https://doi.org/10.1145/3757377.3763979","title":"HiWave: Training-Free High-Resolution Image Generation via Wavelet-Based Diffusion Sampling","display_name":"HiWave: Training-Free High-Resolution Image Generation via Wavelet-Based Diffusion Sampling","publication_year":2025,"publication_date":"2025-12-08","ids":{"openalex":"https://openalex.org/W7110015622","doi":"https://doi.org/10.1145/3757377.3763979"},"language":null,"primary_location":{"id":"doi:10.1145/3757377.3763979","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3757377.3763979","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SIGGRAPH Asia 2025 Conference Papers","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Tobias Vontobel","orcid":"https://orcid.org/0009-0008-7579-0613"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":true,"raw_author_name":"Tobias Vontobel","raw_affiliation_strings":["ETH Z\u00fcrich, Z\u00fcrich, Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Z\u00fcrich, Z\u00fcrich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Seyedmorteza Sadat","orcid":"https://orcid.org/0009-0003-4668-5703"},"institutions":[{"id":"https://openalex.org/I35440088","display_name":"ETH Zurich","ror":"https://ror.org/05a28rw58","country_code":"CH","type":"education","lineage":["https://openalex.org/I2799323385","https://openalex.org/I35440088"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Seyedmorteza Sadat","raw_affiliation_strings":["ETH Z\u00fcrich, Z\u00fcrich, Switzerland and Disney Research Studios, Z\u00fcrich, Switzerland"],"affiliations":[{"raw_affiliation_string":"ETH Z\u00fcrich, Z\u00fcrich, Switzerland and Disney Research Studios, Z\u00fcrich, Switzerland","institution_ids":["https://openalex.org/I35440088"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Farnood Salehi","orcid":"https://orcid.org/0000-0002-9222-4727"},"institutions":[{"id":"https://openalex.org/I4210137357","display_name":"Walt Disney (Switzerland)","ror":"https://ror.org/04h1x1p54","country_code":"CH","type":"company","lineage":["https://openalex.org/I4210137357","https://openalex.org/I4210142140"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Farnood Salehi","raw_affiliation_strings":["Disney Research Studios, Z\u00fcrich, Switzerland"],"affiliations":[{"raw_affiliation_string":"Disney Research Studios, Z\u00fcrich, Switzerland","institution_ids":["https://openalex.org/I4210137357"]}]},{"author_position":"last","author":{"id":null,"display_name":"Romann Weber","orcid":"https://orcid.org/0000-0003-1196-5425"},"institutions":[{"id":"https://openalex.org/I4210137357","display_name":"Walt Disney (Switzerland)","ror":"https://ror.org/04h1x1p54","country_code":"CH","type":"company","lineage":["https://openalex.org/I4210137357","https://openalex.org/I4210142140"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Romann Weber","raw_affiliation_strings":["Disney Research Studios, Z\u00fcrich, Switzerland"],"affiliations":[{"raw_affiliation_string":"Disney Research Studios, Z\u00fcrich, Switzerland","institution_ids":["https://openalex.org/I4210137357"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I35440088"],"apc_list":null,"apc_paid":null,"fwci":1.3104,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.86797435,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"11"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7513999938964844,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7513999938964844,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.0917000025510788,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.02459999918937683,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/fidelity","display_name":"Fidelity","score":0.6384000182151794},{"id":"https://openalex.org/keywords/coherence","display_name":"Coherence (philosophical gambling strategy)","score":0.47350001335144043},{"id":"https://openalex.org/keywords/inversion","display_name":"Inversion (geology)","score":0.3785000145435333},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.365200012922287},{"id":"https://openalex.org/keywords/base","display_name":"Base (topology)","score":0.35569998621940613},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.35569998621940613},{"id":"https://openalex.org/keywords/image-processing","display_name":"Image processing","score":0.34470000863075256},{"id":"https://openalex.org/keywords/image-synthesis","display_name":"Image synthesis","score":0.33169999718666077}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6909000277519226},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.6384000182151794},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6118999719619751},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5989000201225281},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.47350001335144043},{"id":"https://openalex.org/C1893757","wikidata":"https://www.wikidata.org/wiki/Q3653001","display_name":"Inversion (geology)","level":3,"score":0.3785000145435333},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.365200012922287},{"id":"https://openalex.org/C42058472","wikidata":"https://www.wikidata.org/wiki/Q810214","display_name":"Base (topology)","level":2,"score":0.35569998621940613},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.35569998621940613},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.34470000863075256},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3418000042438507},{"id":"https://openalex.org/C2989087649","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Image synthesis","level":3,"score":0.33169999718666077},{"id":"https://openalex.org/C203504353","wikidata":"https://www.wikidata.org/wiki/Q4765461","display_name":"Anisotropic diffusion","level":3,"score":0.3312000036239624},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.3310999870300293},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.32989999651908875},{"id":"https://openalex.org/C2779606619","wikidata":"https://www.wikidata.org/wiki/Q17092524","display_name":"Interchangeability","level":2,"score":0.3255999982357025},{"id":"https://openalex.org/C35772409","wikidata":"https://www.wikidata.org/wiki/Q1323086","display_name":"Image noise","level":3,"score":0.3124000132083893},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.31209999322891235},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.31040000915527344},{"id":"https://openalex.org/C125045340","wikidata":"https://www.wikidata.org/wiki/Q6002224","display_name":"Image formation","level":3,"score":0.2863999903202057},{"id":"https://openalex.org/C50494287","wikidata":"https://www.wikidata.org/wiki/Q658467","display_name":"Texture synthesis","level":5,"score":0.2734000086784363},{"id":"https://openalex.org/C106430172","wikidata":"https://www.wikidata.org/wiki/Q6002272","display_name":"Image restoration","level":4,"score":0.2612999975681305},{"id":"https://openalex.org/C113364801","wikidata":"https://www.wikidata.org/wiki/Q26674","display_name":"High fidelity","level":2,"score":0.257999986410141}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3757377.3763979","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3757377.3763979","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SIGGRAPH Asia 2025 Conference Papers","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W2073075511","https://openalex.org/W3212516020","https://openalex.org/W4224035735","https://openalex.org/W4288099666","https://openalex.org/W4308163867","https://openalex.org/W4312933868","https://openalex.org/W4319989813","https://openalex.org/W4320853729","https://openalex.org/W4383472654","https://openalex.org/W4386065807","https://openalex.org/W4386071957","https://openalex.org/W4389115686","https://openalex.org/W4390872297","https://openalex.org/W4402667895","https://openalex.org/W4403841908","https://openalex.org/W4409262753"],"related_works":[],"abstract_inverted_index":{"Diffusion":[0,152],"models":[1,19],"have":[2],"emerged":[3],"as":[4],"the":[5,83,116,130,181],"leading":[6],"approach":[7,55],"for":[8,31,193],"image":[9,66,81,132,196],"synthesis,":[10],"demonstrating":[11],"exceptional":[12],"photorealism":[13],"and":[14,26,43,61,93,146],"diversity.":[15],"However,":[16],"training":[17,35],"diffusion":[18,70],"at":[20],"high":[21],"resolutions":[22,36],"remains":[23],"computationally":[24],"prohibitive,":[25],"existing":[27],"zero-shot":[28,54],"generation":[29],"techniques":[30],"synthesizing":[32],"images":[33],"beyond":[34],"often":[37],"produce":[38],"artifacts,":[39],"including":[40],"object":[41],"duplication":[42],"spatial":[44],"incoherence.":[45],"In":[46],"this":[47],"paper,":[48],"we":[49,101],"introduce":[50],"HiWave,":[51],"a":[52,75,79,88,94],"training-free,":[53],"that":[56,111,155],"substantially":[57],"enhances":[58],"visual":[59,160],"fidelity":[60],"structural":[62,135],"coherence":[63,114],"in":[64,163,184],"ultra-high-resolution":[65,195],"synthesis":[67,197],"using":[68,150],"pretrained":[69,84],"models.":[71],"Our":[72],"method":[73],"employs":[74],"two-stage":[76],"pipeline:":[77],"generating":[78],"base":[80,117,131],"from":[82,115,129],"model":[85],"followed":[86],"by":[87],"patch-wise":[89],"DDIM":[90],"inversion":[91,104],"step":[92],"novel":[95],"wavelet-based":[96],"detail":[97,124],"enhancer":[98,125],"module.":[99],"Specifically,":[100],"first":[102],"utilize":[103],"methods":[105],"to":[106,133,142],"derive":[107],"initial":[108],"noise":[109],"vectors":[110],"preserve":[112],"global":[113],"image.":[118],"Subsequently,":[119],"during":[120],"sampling,":[121],"our":[122],"wavelet-domain":[123],"retains":[126],"low-frequency":[127],"components":[128,141],"ensure":[134],"consistency,":[136],"while":[137],"selectively":[138],"guiding":[139],"high-frequency":[140],"enrich":[143],"fine":[144],"details":[145],"textures.":[147],"Extensive":[148],"evaluations":[149],"Stable":[151],"XL":[153],"demonstrate":[154],"HiWave":[156],"effectively":[157],"mitigates":[158],"common":[159],"artifacts":[161],"seen":[162],"prior":[164],"methods,":[165],"achieving":[166],"superior":[167],"perceptual":[168],"quality.":[169],"A":[170],"user":[171],"study":[172],"confirmed":[173],"HiWave\u2019s":[174],"performance,":[175],"where":[176],"it":[177],"was":[178],"preferred":[179],"over":[180],"state-of-the-art":[182],"alternative":[183],"more":[185],"than":[186],"80%":[187],"of":[188],"comparisons,":[189],"highlighting":[190],"its":[191],"effectiveness":[192],"high-quality,":[194],"without":[198],"requiring":[199],"retraining":[200],"or":[201],"architectural":[202],"modifications.":[203]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-10T02:45:41.426853","created_date":"2025-12-08T00:00:00"}
