{"id":"https://openalex.org/W4416587598","doi":"https://doi.org/10.1016/j.patcog.2026.114063","title":"Training-Free Image Inversion for One-Step Diffusion Models","display_name":"Training-Free Image Inversion for One-Step Diffusion Models","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4416587598","doi":"https://doi.org/10.1016/j.patcog.2026.114063"},"language":"en","primary_location":{"id":"doi:10.1016/j.patcog.2026.114063","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.patcog.2026.114063","pdf_url":null,"source":{"id":"https://openalex.org/S414566","display_name":"Pattern Recognition","issn_l":"0031-3203","issn":["0031-3203","1873-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Pattern Recognition","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.1016/j.patcog.2026.114063","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102963038","display_name":"Tao Wu","orcid":"https://orcid.org/0000-0002-8463-7994"},"institutions":[{"id":"https://openalex.org/I4387153096","display_name":"Computer Vision Center","ror":"https://ror.org/00s0nnj93","country_code":null,"type":"other","lineage":["https://openalex.org/I4387153040","https://openalex.org/I4387153096"]}],"countries":[],"is_corresponding":true,"raw_author_name":"Tao Wu","raw_affiliation_strings":["Computer Vision Center"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computer Vision Center","institution_ids":["https://openalex.org/I4387153096"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102008586","display_name":"Senmao Li","orcid":"https://orcid.org/0000-0003-0377-8566"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Senmao Li","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010398295","display_name":"Yaxing Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaxing Wang","raw_affiliation_strings":["Nankai University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Nankai University","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100676328","display_name":"Shiqi Yang","orcid":"https://orcid.org/0009-0009-8529-4522"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shiqi Yang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077265199","display_name":"K. W. Wang","orcid":"https://orcid.org/0000-0002-9605-8279"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kai Wang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101958996","display_name":"Joost van de Weijer","orcid":"https://orcid.org/0000-0002-9656-9706"},"institutions":[{"id":"https://openalex.org/I4387153096","display_name":"Computer Vision Center","ror":"https://ror.org/00s0nnj93","country_code":null,"type":"other","lineage":["https://openalex.org/I4387153040","https://openalex.org/I4387153096"]}],"countries":[],"is_corresponding":false,"raw_author_name":"Joost van de Weijer","raw_affiliation_strings":["Computer Vision Center"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computer Vision Center","institution_ids":["https://openalex.org/I4387153096"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5102963038"],"corresponding_institution_ids":["https://openalex.org/I4387153096"],"apc_list":{"value":2710,"currency":"USD","value_usd":2710},"apc_paid":{"value":2710,"currency":"USD","value_usd":2710},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.32106194,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"180","issue":null,"first_page":"114063","last_page":"114063"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8184000253677368,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.8184000253677368,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12859","display_name":"Cell Image Analysis Techniques","score":0.021199999377131462,"subfield":{"id":"https://openalex.org/subfields/1304","display_name":"Biophysics"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.01209999993443489,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inversion","display_name":"Inversion (geology)","score":0.6902999877929688},{"id":"https://openalex.org/keywords/anisotropic-diffusion","display_name":"Anisotropic diffusion","score":0.5356000065803528},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.48249998688697815},{"id":"https://openalex.org/keywords/gaussian-noise","display_name":"Gaussian noise","score":0.4081000089645386},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.39800000190734863},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3853999972343445},{"id":"https://openalex.org/keywords/iterative-method","display_name":"Iterative method","score":0.3571999967098236},{"id":"https://openalex.org/keywords/synthetic-data","display_name":"Synthetic data","score":0.3513999879360199}],"concepts":[{"id":"https://openalex.org/C1893757","wikidata":"https://www.wikidata.org/wiki/Q3653001","display_name":"Inversion (geology)","level":3,"score":0.6902999877929688},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6600000262260437},{"id":"https://openalex.org/C203504353","wikidata":"https://www.wikidata.org/wiki/Q4765461","display_name":"Anisotropic diffusion","level":3,"score":0.5356000065803528},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5327000021934509},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4869999885559082},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.48249998688697815},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4634000062942505},{"id":"https://openalex.org/C4199805","wikidata":"https://www.wikidata.org/wiki/Q2725903","display_name":"Gaussian noise","level":2,"score":0.4081000089645386},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.39800000190734863},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3853999972343445},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.3571999967098236},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.3513999879360199},{"id":"https://openalex.org/C2779804580","wikidata":"https://www.wikidata.org/wiki/Q102047","display_name":"Suffix","level":2,"score":0.34049999713897705},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.3377000093460083},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33230000734329224},{"id":"https://openalex.org/C2781170535","wikidata":"https://www.wikidata.org/wiki/Q30587856","display_name":"Noisy data","level":2,"score":0.2847000062465668},{"id":"https://openalex.org/C2776639384","wikidata":"https://www.wikidata.org/wiki/Q840396","display_name":"Ideal (ethics)","level":2,"score":0.27730000019073486},{"id":"https://openalex.org/C135252773","wikidata":"https://www.wikidata.org/wiki/Q1567213","display_name":"Inverse problem","level":2,"score":0.2671000063419342},{"id":"https://openalex.org/C35772409","wikidata":"https://www.wikidata.org/wiki/Q1323086","display_name":"Image noise","level":3,"score":0.26339998841285706},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.2606000006198883},{"id":"https://openalex.org/C143606050","wikidata":"https://www.wikidata.org/wiki/Q1377019","display_name":"Inverse transform sampling","level":3,"score":0.2590000033378601},{"id":"https://openalex.org/C29265498","wikidata":"https://www.wikidata.org/wiki/Q7047719","display_name":"Noise measurement","level":3,"score":0.25619998574256897},{"id":"https://openalex.org/C2781204021","wikidata":"https://www.wikidata.org/wiki/Q6497091","display_name":"Lattice (music)","level":2,"score":0.25270000100135803}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1016/j.patcog.2026.114063","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.patcog.2026.114063","pdf_url":null,"source":{"id":"https://openalex.org/S414566","display_name":"Pattern Recognition","issn_l":"0031-3203","issn":["0031-3203","1873-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Pattern Recognition","raw_type":"journal-article"},{"id":"doi:10.2139/ssrn.5800056","is_oa":true,"landing_page_url":"https://doi.org/10.2139/ssrn.5800056","pdf_url":null,"source":{"id":"https://openalex.org/S4210172589","display_name":"SSRN Electronic Journal","issn_l":"1556-5068","issn":["1556-5068"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1318003438","host_organization_name":"RELX Group (Netherlands)","host_organization_lineage":["https://openalex.org/I1318003438"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"posted-content"},{"id":"pmh:oai:arXiv.org:2606.01380","is_oa":true,"landing_page_url":"https://arxiv.org/abs/2606.01380","pdf_url":"https://arxiv.org/pdf/2606.01380","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2606.01380","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2606.01380","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.1016/j.patcog.2026.114063","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.patcog.2026.114063","pdf_url":null,"source":{"id":"https://openalex.org/S414566","display_name":"Pattern Recognition","issn_l":"0031-3203","issn":["0031-3203","1873-5142"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Pattern Recognition","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322300","display_name":"Jilin University","ror":"https://ror.org/00js3aw79"},{"id":"https://openalex.org/F4320322598","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98"},{"id":"https://openalex.org/F4320326826","display_name":"Universitat Aut\u00f2noma de Barcelona","ror":"https://ror.org/052g8jq94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":1,"referenced_works":["https://openalex.org/W4412020477"],"related_works":[],"abstract_inverted_index":{"In":[0],"this":[1],"work,":[2],"we":[3,81,135],"introduce":[4],"a":[5,137],"novel":[6,84],"training-free":[7],"inversion":[8,21,32,71,121],"(TFinv)":[9],"framework":[10],"for":[11,141],"one-step":[12,77,165],"diffusion":[13,78,166],"models,":[14],"addressing":[15],"key":[16],"challenges":[17],"in":[18,164,175],"real":[19],"image":[20,66,132],"and":[22,33,49,54,65,73,102,130],"editing.":[23,133],"We":[24],"first":[25],"identify":[26],"two":[27,83],"critical":[28],"factors":[29,69],"hampering":[30],"real-image":[31],"editing:":[34],"(1)":[35],"Initial":[36],"Latent":[37],"Editability,":[38],"which":[39,58,90,106],"is":[40],"related":[41],"to":[42,95],"the":[43,46,50,60,74,92,98,151],"distance":[44],"between":[45,62],"initial":[47,127],"noise":[48,87,128],"ideal":[51],"Gaussian":[52,100],"distribution,":[53,101],"(2)":[55],"Caption":[56],"Gap,":[57],"means":[59],"alignment":[61,88,110],"text":[63],"captions":[64],"representations.":[67],"Both":[68],"influence":[70],"efficiency":[72],"editability":[75],"of":[76,122],"models.":[79],"Then,":[80],"propose":[82,136],"techniques:":[85],"iterative":[86],"(iterNA),":[89],"minimizes":[91],"distribution":[93],"gap":[94],"align":[96],"with":[97],"normal":[99],"suffix":[103,114],"learning":[104],"(suffL),":[105],"enhances":[107],"text-to-image":[108],"caption":[109],"by":[111],"introducing":[112],"learned":[113],"prompt":[115],"tokens.":[116],"These":[117],"techniques":[118],"enable":[119],"precise":[120],"input":[123],"images":[124],"into":[125],"their":[126],"representations":[129],"facilitate":[131],"Furthermore,":[134],"mask-based":[138],"editing":[139],"technique":[140],"localized":[142],"edits":[143],"while":[144],"preserving":[145],"background":[146],"integrity.":[147],"Comprehensive":[148],"experiments":[149],"on":[150],"PIE-Bench":[152],"dataset":[153],"validate":[154],"that":[155],"our":[156],"method":[157],"TFinv":[158],"not":[159],"only":[160],"achieves":[161],"state-of-the-art":[162],"performance":[163],"editing,":[167],"but":[168],"also":[169],"significantly":[170],"outperforms":[171],"existing":[172],"multistep":[173],"approaches":[174],"efficiency.":[176]},"counts_by_year":[],"updated_date":"2026-06-06T09:05:17.133730","created_date":"2025-11-25T00:00:00"}
