{"id":"https://openalex.org/W4402979841","doi":"https://doi.org/10.1109/icme57554.2024.10687547","title":"IterInv: Iterative Inversion for Pixel-Level T2I Models","display_name":"IterInv: Iterative Inversion for Pixel-Level T2I Models","publication_year":2024,"publication_date":"2024-07-15","ids":{"openalex":"https://openalex.org/W4402979841","doi":"https://doi.org/10.1109/icme57554.2024.10687547"},"language":"en","primary_location":{"id":"doi:10.1109/icme57554.2024.10687547","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme57554.2024.10687547","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004593135","display_name":"Chuanming Tang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I4210128284","display_name":"Institute of Optics and Electronics, Chinese Academy of Sciences","ror":"https://ror.org/02bn68w95","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128284"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chuanming Tang","raw_affiliation_strings":["University of Chinese Academy of Sciences,Institute of Optics and Electronics Computer Vision Center,Beijing,China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,Institute of Optics and Electronics Computer Vision Center,Beijing,China","institution_ids":["https://openalex.org/I4210128284","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100437002","display_name":"Kai Wang","orcid":"https://orcid.org/0000-0002-2937-9339"},"institutions":[{"id":"https://openalex.org/I2799803557","display_name":"Barcelona Supercomputing Center","ror":"https://ror.org/05sd8tv96","country_code":"ES","type":"facility","lineage":["https://openalex.org/I2799803557","https://openalex.org/I9617848"]},{"id":"https://openalex.org/I4387153096","display_name":"Computer Vision Center","ror":"https://ror.org/00s0nnj93","country_code":null,"type":"other","lineage":["https://openalex.org/I4387153040","https://openalex.org/I4387153096"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Kai Wang","raw_affiliation_strings":["Computer Vision Center,Barcelona,Spain"],"affiliations":[{"raw_affiliation_string":"Computer Vision Center,Barcelona,Spain","institution_ids":["https://openalex.org/I2799803557","https://openalex.org/I4387153096"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101958996","display_name":"Joost van de Weijer","orcid":"https://orcid.org/0000-0002-9656-9706"},"institutions":[{"id":"https://openalex.org/I123044942","display_name":"Universitat Aut\u00f2noma de Barcelona","ror":"https://ror.org/052g8jq94","country_code":"ES","type":"education","lineage":["https://openalex.org/I123044942"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Joost van de Weijer","raw_affiliation_strings":["Universitat Autonoma de Barcelona,Computer Vision Center,Barcelona,Spain"],"affiliations":[{"raw_affiliation_string":"Universitat Autonoma de Barcelona,Computer Vision Center,Barcelona,Spain","institution_ids":["https://openalex.org/I123044942"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5004593135"],"corresponding_institution_ids":["https://openalex.org/I4210128284","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":1.7227,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.85069601,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10378","display_name":"Advanced MRI Techniques and Applications","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T10378","display_name":"Advanced MRI Techniques and Applications","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10522","display_name":"Medical Imaging Techniques and Applications","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9876000285148621,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inversion","display_name":"Inversion (geology)","score":0.7292405962944031},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.6718255877494812},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5660532116889954},{"id":"https://openalex.org/keywords/iterative-method","display_name":"Iterative method","score":0.5621992945671082},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4077732264995575},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3156886100769043},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.2315225899219513},{"id":"https://openalex.org/keywords/seismology","display_name":"Seismology","score":0.06747522950172424}],"concepts":[{"id":"https://openalex.org/C1893757","wikidata":"https://www.wikidata.org/wiki/Q3653001","display_name":"Inversion (geology)","level":3,"score":0.7292405962944031},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.6718255877494812},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5660532116889954},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.5621992945671082},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4077732264995575},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3156886100769043},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.2315225899219513},{"id":"https://openalex.org/C165205528","wikidata":"https://www.wikidata.org/wiki/Q83371","display_name":"Seismology","level":1,"score":0.06747522950172424},{"id":"https://openalex.org/C77928131","wikidata":"https://www.wikidata.org/wiki/Q193343","display_name":"Tectonics","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme57554.2024.10687547","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme57554.2024.10687547","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":43,"referenced_works":["https://openalex.org/W1580389772","https://openalex.org/W2962785568","https://openalex.org/W3036167779","https://openalex.org/W3153469116","https://openalex.org/W3191805365","https://openalex.org/W4224035735","https://openalex.org/W4226125322","https://openalex.org/W4281485151","https://openalex.org/W4312740349","https://openalex.org/W4312872987","https://openalex.org/W4312911498","https://openalex.org/W4312933868","https://openalex.org/W4313484371","https://openalex.org/W4361230700","https://openalex.org/W4361865257","https://openalex.org/W4378760015","https://openalex.org/W4385527149","https://openalex.org/W4386057725","https://openalex.org/W4386076215","https://openalex.org/W4386076532","https://openalex.org/W4386113271","https://openalex.org/W4387158652","https://openalex.org/W4390872477","https://openalex.org/W4390873084","https://openalex.org/W4390873195","https://openalex.org/W4390874314","https://openalex.org/W6779823529","https://openalex.org/W6783713337","https://openalex.org/W6790978476","https://openalex.org/W6791353385","https://openalex.org/W6809885388","https://openalex.org/W6810940779","https://openalex.org/W6838639034","https://openalex.org/W6840155194","https://openalex.org/W6840815571","https://openalex.org/W6841366371","https://openalex.org/W6845433216","https://openalex.org/W6848774630","https://openalex.org/W6849367332","https://openalex.org/W6850576684","https://openalex.org/W6851457070","https://openalex.org/W6852963699","https://openalex.org/W6857140470"],"related_works":["https://openalex.org/W2051487156","https://openalex.org/W2073681303","https://openalex.org/W2085033728","https://openalex.org/W4285411112","https://openalex.org/W2171299904","https://openalex.org/W1647606319","https://openalex.org/W2922442631","https://openalex.org/W4390494008","https://openalex.org/W2053596378","https://openalex.org/W2168523118"],"abstract_inverted_index":{"Large-scale":[0],"text-to-image":[1,112],"diffusion":[2,141],"models":[3,62,142,185],"have":[4],"been":[5],"a":[6,48,111,236],"ground-breaking":[7],"development":[8],"in":[9,52],"generating":[10],"convincing":[11],"images":[12,32],"following":[13],"an":[14,79,175],"input":[15],"text":[16,36],"prompt.":[17,37],"The":[18,248,255],"goal":[19],"of":[20,105,166,183,203,246],"image":[21,39,136,159,205,238],"editing":[22,40,239],"research":[23],"is":[24,163,257],"to":[25,73,127,151,220],"give":[26],"users":[27],"control":[28],"over":[29],"the":[30,35,58,65,74,89,98,123,129,134,139,147,157,161,164,190,199,214,222,228,243],"generated":[31],"by":[33,116],"modifying":[34],"Current":[38],"techniques":[41],"predominantly":[42],"hinge":[43],"on":[44,64,88,170],"DDIM":[45,124,148],"inversion":[46,125,177,200,224],"as":[47,93,160,198],"prevalent":[49],"practice":[50],"rooted":[51],"Latent":[53],"Diffusion":[54],"Models":[55],"(LDM).":[56],"However,":[57],"large":[59],"pretrained":[60],"T2I":[61,85,184],"working":[63,87],"latent":[66,215],"space":[67],"suffer":[68],"from":[69],"losing":[70],"details":[71],"due":[72],"first":[75],"compression":[76],"stage":[77,113],"with":[78,110,146,189,235],"autoencoder":[80],"mechanism.":[81],"Instead,":[82],"other":[83],"mainstream":[84],"pipeline":[86],"pixel":[90],"level,":[91],"such":[92],"Imagen":[94],"and":[95,114,132,186,201,210,226],"DeepFloyd-IF,":[96],"circumvents":[97],"above":[99],"problem.":[100,168],"They":[101],"are":[102,143],"commonly":[103],"composed":[104],"multiple":[106],"stages,":[107],"typically":[108],"starting":[109],"followed":[115],"several":[117],"super-resolution":[118,140],"stages.":[119],"In":[120,207],"this":[121,167,171,181],"pipeline,":[122],"fails":[126],"find":[128,221],"initial":[130],"noise":[131],"generate":[133],"original":[135],"given":[137],"that":[138],"not":[144],"compatible":[145],"technique.":[149],"According":[150],"our":[152,233],"experimental":[153],"findings,":[154],"iteratively":[155],"concatenating":[156],"noisy":[158],"condition":[162],"root":[165],"Based":[169],"observation,":[172],"we":[173,212,241],"develop":[174],"iterative":[176],"(IterInv)":[178],"technique":[179],"for":[180],"category":[182],"verify":[187],"IterInv":[188,195],"open-source":[191],"DeepFloyd-IF":[192],"model.":[193],"Specifically,":[194],"employ":[196],"NTI":[197],"reconstruction":[202,229],"low-resolution":[204],"generation.":[206],"stages":[208],"2":[209],"3,":[211],"update":[213],"variance":[216],"at":[217,259],"each":[218],"timestep":[219],"deterministic":[223],"trace":[225],"promote":[227],"process.":[230],"By":[231],"combining":[232],"method":[234],"popular":[237],"method,":[240],"prove":[242],"application":[244],"prospects":[245],"IterInv.":[247],"code":[249,256],"will":[250],"be":[251],"released":[252],"upon":[253],"acceptance.":[254],"available":[258],"https://github.com/Tchuanm/IterInv.git":[260]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
