{"id":"https://openalex.org/W4414982526","doi":"https://doi.org/10.1109/wacv61042.2026.00422","title":"Fine-grained Defocus Blur Control for Generative Image Models","display_name":"Fine-grained Defocus Blur Control for Generative Image Models","publication_year":2026,"publication_date":"2026-03-06","ids":{"openalex":"https://openalex.org/W4414982526","doi":"https://doi.org/10.1109/wacv61042.2026.00422"},"language":"en","primary_location":{"id":"doi:10.1109/wacv61042.2026.00422","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv61042.2026.00422","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2510.06215","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5062122421","display_name":"Ayush Shrivastava","orcid":null},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ayush Shrivastava","raw_affiliation_strings":["University of Michigan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Michigan","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083898813","display_name":"Connelly Barnes","orcid":null},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Connelly Barnes","raw_affiliation_strings":["Adobe Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adobe Research","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045095414","display_name":"Xuaner Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xuaner Zhang","raw_affiliation_strings":["Adobe Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adobe Research","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100683340","display_name":"Lingzhi Zhang","orcid":"https://orcid.org/0000-0002-8348-5618"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lingzhi Zhang","raw_affiliation_strings":["Adobe Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adobe Research","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103210329","display_name":"Andrew Owens","orcid":"https://orcid.org/0000-0002-3535-025X"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrew Owens","raw_affiliation_strings":["University of Michigan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Michigan","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042253371","display_name":"Sohrab Amirghodsi","orcid":null},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sohrab Amirghodsi","raw_affiliation_strings":["Adobe Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adobe Research","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024777042","display_name":"Eli Shechtman","orcid":"https://orcid.org/0000-0002-6783-1795"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Eli Shechtman","raw_affiliation_strings":["Adobe Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Adobe Research","institution_ids":["https://openalex.org/I1306409833"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5062122421"],"corresponding_institution_ids":["https://openalex.org/I27837315"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.00550629,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4335","last_page":"4344"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9785000085830688,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9767000079154968,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.7200000286102295},{"id":"https://openalex.org/keywords/autofocus","display_name":"Autofocus","score":0.6182000041007996},{"id":"https://openalex.org/keywords/lens","display_name":"Lens (geology)","score":0.5843999981880188},{"id":"https://openalex.org/keywords/monocular","display_name":"Monocular","score":0.5439000129699707},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5223000049591064},{"id":"https://openalex.org/keywords/camera-lens","display_name":"Camera lens","score":0.49639999866485596},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4830000102519989},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.42309999465942383},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.41929998993873596}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7348999977111816},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.7200000286102295},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7160999774932861},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6873000264167786},{"id":"https://openalex.org/C103764139","wikidata":"https://www.wikidata.org/wiki/Q210008","display_name":"Autofocus","level":3,"score":0.6182000041007996},{"id":"https://openalex.org/C15336307","wikidata":"https://www.wikidata.org/wiki/Q1766051","display_name":"Lens (geology)","level":2,"score":0.5843999981880188},{"id":"https://openalex.org/C65909025","wikidata":"https://www.wikidata.org/wiki/Q1945033","display_name":"Monocular","level":2,"score":0.5439000129699707},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5223000049591064},{"id":"https://openalex.org/C2778022956","wikidata":"https://www.wikidata.org/wiki/Q192234","display_name":"Camera lens","level":3,"score":0.49639999866485596},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4830000102519989},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.42309999465942383},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.41929998993873596},{"id":"https://openalex.org/C202615002","wikidata":"https://www.wikidata.org/wiki/Q783507","display_name":"Differentiable function","level":2,"score":0.3977999985218048},{"id":"https://openalex.org/C78336883","wikidata":"https://www.wikidata.org/wiki/Q4779385","display_name":"Aperture (computer memory)","level":2,"score":0.38530001044273376},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.34439998865127563},{"id":"https://openalex.org/C125045340","wikidata":"https://www.wikidata.org/wiki/Q6002224","display_name":"Image formation","level":3,"score":0.3443000018596649},{"id":"https://openalex.org/C119657128","wikidata":"https://www.wikidata.org/wiki/Q11633","display_name":"Photography","level":2,"score":0.3244999945163727},{"id":"https://openalex.org/C177454536","wikidata":"https://www.wikidata.org/wiki/Q578290","display_name":"Emphasis (telecommunications)","level":2,"score":0.31459999084472656},{"id":"https://openalex.org/C106430172","wikidata":"https://www.wikidata.org/wiki/Q6002272","display_name":"Image restoration","level":4,"score":0.31040000915527344},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.2937000095844269},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.2809999883174896},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.27219998836517334},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.26930001378059387},{"id":"https://openalex.org/C2777708103","wikidata":"https://www.wikidata.org/wiki/Q852589","display_name":"Motion blur","level":3,"score":0.2533999979496002},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.25279998779296875},{"id":"https://openalex.org/C146044194","wikidata":"https://www.wikidata.org/wiki/Q5157334","display_name":"Computational photography","level":4,"score":0.25049999356269836}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/wacv61042.2026.00422","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv61042.2026.00422","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2510.06215","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.06215","pdf_url":"https://arxiv.org/pdf/2510.06215","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2510.06215","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.06215","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2510.06215","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.06215","pdf_url":"https://arxiv.org/pdf/2510.06215","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4414982526.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Current":[0],"text-to-image":[1,30],"diffusion":[2,31,147],"models":[3],"excel":[4],"at":[5],"generating":[6,51,65],"diverse,":[7],"high-quality":[8],"images,":[9],"yet":[10],"they":[11],"struggle":[12],"to":[13,107,112],"incorporate":[14],"fine-grained":[15,157],"camera":[16,35],"metadata":[17],"such":[18],"as":[19],"precise":[20,130],"aperture":[21],"settings.":[22],"In":[23],"this":[24,102,128],"work,":[25],"we":[26],"introduce":[27],"a":[28,74,79,87],"novel":[29,80],"framework":[32],"that":[33,152],"leverages":[34],"metadata,":[36],"or":[37],"EXIF":[38,123],"data,":[39],"which":[40,141],"is":[41,142],"often":[42],"embedded":[43],"in":[44],"image":[45,60,89],"files,":[46],"with":[47,78,90,145],"an":[48,66,91],"emphasis":[49],"on":[50,117],"controllable":[52],"lens":[53,94],"blur.":[54],"Our":[55],"method":[56],"mimics":[57],"the":[58,121,161],"physical":[59],"formation":[61],"process":[62],"by":[63],"first":[64],"all-in-focus":[67],"image,":[68],"estimating":[69],"its":[70],"monocular":[71],"depth,":[72],"predicting":[73],"plausible":[75],"focus":[76,81],"distance":[77,82],"transformer,":[83],"and":[84,120],"then":[85],"forming":[86],"defocused":[88],"existing":[92,146],"differentiable":[93],"blur":[95],"model":[96,154],"[32].":[97],"Gradients":[98],"flow":[99],"backwards":[100],"through":[101],"whole":[103],"process,":[104],"allowing":[105],"us":[106],"learn":[108],"without":[109,159],"explicit":[110],"supervision":[111],"generate":[113],"defocus":[114,135],"effects":[115,136],"based":[116],"content":[118],"elements":[119],"provided":[122],"data.":[124],"At":[125],"inference":[126],"time,":[127],"enables":[129,155],"interactive":[131],"user":[132],"control":[133,158],"over":[134],"while":[137],"preserving":[138],"scene":[139],"contents,":[140],"not":[143],"achievable":[144],"models.":[148],"Experimental":[149],"results":[150],"demonstrate":[151],"our":[153],"superior":[156],"altering":[160],"depicted":[162],"scene.":[163]},"counts_by_year":[],"updated_date":"2026-05-07T06:04:25.777469","created_date":"2025-10-10T00:00:00"}
