{"id":"https://openalex.org/W4412605259","doi":"https://doi.org/10.1109/access.2025.3592163","title":"Decoupled Latent Diffusion Model for Enhancing Image Generation","display_name":"Decoupled Latent Diffusion Model for Enhancing Image Generation","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4412605259","doi":"https://doi.org/10.1109/access.2025.3592163"},"language":"en","primary_location":{"id":"doi:10.1109/access.2025.3592163","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3592163","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3592163","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026727740","display_name":"Hyun-Tae Choi","orcid":null},"institutions":[{"id":"https://openalex.org/I67900169","display_name":"Chung-Ang University","ror":"https://ror.org/01r024a98","country_code":"KR","type":"education","lineage":["https://openalex.org/I67900169"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hyun-Tae Choi","raw_affiliation_strings":["Department of Artificial Intelligence, Chung-Ang University, Seoul, South Korea"],"raw_orcid":"https://orcid.org/0000-0001-8268-0705","affiliations":[{"raw_affiliation_string":"Department of Artificial Intelligence, Chung-Ang University, Seoul, South Korea","institution_ids":["https://openalex.org/I67900169"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102774458","display_name":"Kensuke Nakamura","orcid":"https://orcid.org/0000-0002-6858-3551"},"institutions":[{"id":"https://openalex.org/I67900169","display_name":"Chung-Ang University","ror":"https://ror.org/01r024a98","country_code":"KR","type":"education","lineage":["https://openalex.org/I67900169"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Kensuke Nakamura","raw_affiliation_strings":["Department of Artificial Intelligence, Chung-Ang University, Seoul, South Korea"],"raw_orcid":"https://orcid.org/0000-0002-6858-3551","affiliations":[{"raw_affiliation_string":"Department of Artificial Intelligence, Chung-Ang University, Seoul, South Korea","institution_ids":["https://openalex.org/I67900169"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065943331","display_name":"Byung\u2010Woo Hong","orcid":"https://orcid.org/0000-0003-2752-3939"},"institutions":[{"id":"https://openalex.org/I67900169","display_name":"Chung-Ang University","ror":"https://ror.org/01r024a98","country_code":"KR","type":"education","lineage":["https://openalex.org/I67900169"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Byung-Woo Hong","raw_affiliation_strings":["Department of Artificial Intelligence, Chung-Ang University, Seoul, South Korea"],"raw_orcid":"https://orcid.org/0000-0003-2752-3939","affiliations":[{"raw_affiliation_string":"Department of Artificial Intelligence, Chung-Ang University, Seoul, South Korea","institution_ids":["https://openalex.org/I67900169"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13713236,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"13","issue":null,"first_page":"130505","last_page":"130516"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.8421000242233276,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.8421000242233276,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5967041850090027},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.5190408825874329},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4130405783653259},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3195975422859192},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.0950724184513092},{"id":"https://openalex.org/keywords/thermodynamics","display_name":"Thermodynamics","score":0.09230530261993408}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5967041850090027},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.5190408825874329},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4130405783653259},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3195975422859192},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0950724184513092},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.09230530261993408}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2025.3592163","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3592163","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:0754ed6ec3f041b4abd4a58ebccf0d34","is_oa":true,"landing_page_url":"https://doaj.org/article/0754ed6ec3f041b4abd4a58ebccf0d34","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 130505-130516 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3592163","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3592163","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1882192421","display_name":null,"funder_award_id":"IITP-RS-2021-II211341","funder_id":"https://openalex.org/F4320328359","funder_display_name":"Ministry of Science and ICT, South Korea"},{"id":"https://openalex.org/G6053833429","display_name":null,"funder_award_id":"NRF-RS-2023-00251366","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"},{"id":"https://openalex.org/F4320328359","display_name":"Ministry of Science and ICT, South Korea","ror":"https://ror.org/01wpjm123"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W1901129140","https://openalex.org/W2108598243","https://openalex.org/W2752796333","https://openalex.org/W2987820424","https://openalex.org/W3034600949","https://openalex.org/W3159957450","https://openalex.org/W4311415873","https://openalex.org/W4312497550","https://openalex.org/W4312933868","https://openalex.org/W4387230345","https://openalex.org/W4401943167","https://openalex.org/W4406526284","https://openalex.org/W6625168331","https://openalex.org/W6638836233","https://openalex.org/W6679045638","https://openalex.org/W6688384872","https://openalex.org/W6739659843","https://openalex.org/W6745560452","https://openalex.org/W6748582592","https://openalex.org/W6757817989","https://openalex.org/W6760514122","https://openalex.org/W6762931180","https://openalex.org/W6765807149","https://openalex.org/W6766364717","https://openalex.org/W6779823529","https://openalex.org/W6780248173","https://openalex.org/W6780593937","https://openalex.org/W6783713337","https://openalex.org/W6786494455","https://openalex.org/W6788990321","https://openalex.org/W6795288823","https://openalex.org/W6838047808"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Latent":[0,35],"Diffusion":[1,36],"Models":[2],"have":[3],"emerged":[4],"as":[5],"an":[6],"efficient":[7,187],"alternative":[8],"to":[9,67,145],"conventional":[10,192],"diffusion":[11,29,98],"approaches":[12],"by":[13,44,75,162],"compressing":[14],"high-dimensional":[15],"images":[16,168],"into":[17],"a":[18,23,47,95,103,118,130,177],"lower-dimensional":[19],"latent":[20,40,63,86,97,105,115,180,195],"space":[21,64],"using":[22],"Variational":[24],"Autoencoder":[25],"(VAE)":[26],"and":[27,55,93,126,128,165,186],"performing":[28],"in":[30,156,197],"that":[31,79,100,121,176],"space.":[32],"In":[33],"standard":[34,57,114,147],"Model":[37],"(LDM),":[38],"the":[39,53,56,62,71,80,85,113,146,149,191],"code":[41],"is":[42],"formed":[43],"sampling":[45,196],"from":[46],"Gaussian":[48],"distribution":[49],"(i.e.,":[50],"combining":[51],"both":[52,124],"mean":[54,125],"deviation),":[58],"which":[59],"helps":[60],"regularize":[61],"but":[65,155],"appears":[66],"contribute":[68],"little":[69],"beyond":[70],"deterministic":[72,131,179],"component.":[73],"Motivated":[74],"recent":[76],"empirical":[77],"observations":[78],"decoder":[81],"relies":[82],"primarily":[83],"on":[84,102,137,194],"mean,":[87],"our":[88],"work":[89],"reexamines":[90],"this":[91],"paradigm":[92],"proposes":[94],"decoupled":[96],"model":[99],"focuses":[101],"simplified":[104],"representation.":[106,133],"Specifically,":[107],"we":[108],"compare":[109],"three":[110],"configurations:":[111],"(i)":[112],"code,":[116],"(ii)":[117],"concatenated":[119],"representation":[120,181],"explicitly":[122],"preserves":[123],"variance,":[127],"(iii)":[129],"mean-only":[132,150],"Our":[134],"extensive":[135],"experiments":[136],"multiple":[138],"benchmark":[139],"datasets":[140],"demonstrate":[141],"that,":[142],"when":[143],"compared":[144],"approach,":[148],"configuration":[151],"not":[152],"only":[153],"maintains":[154],"many":[157],"cases":[158],"improves":[159],"synthesis":[160],"quality":[161],"producing":[163],"sharper":[164],"more":[166,184],"coherent":[167],"while":[169],"reducing":[170],"unnecessary":[171],"noise.":[172],"These":[173],"findings":[174],"suggest":[175],"simplified,":[178],"can":[182],"yield":[183],"stable":[185],"generative":[188],"models,":[189],"challenging":[190],"reliance":[193],"diffusion-based":[198],"image":[199],"synthesis.":[200]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
