{"id":"https://openalex.org/W7118603523","doi":"https://doi.org/10.48550/arxiv.2601.01045","title":"Coarse-Grained Kullback--Leibler Control of Diffusion-Based Generative AI","display_name":"Coarse-Grained Kullback--Leibler Control of Diffusion-Based Generative AI","publication_year":2026,"publication_date":"2026-01-03","ids":{"openalex":"https://openalex.org/W7118603523","doi":"https://doi.org/10.48550/arxiv.2601.01045"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.01045","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.01045","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.01045","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072214554","display_name":"Tatsuaki Tsuruyama","orcid":"https://orcid.org/0000-0002-3118-2826"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Tsuruyama, Tatsuaki","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5072214554"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.875,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.875,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.026499999687075615,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.007300000172108412,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monotonic-function","display_name":"Monotonic function","score":0.5321000218391418},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.5271999835968018},{"id":"https://openalex.org/keywords/lyapunov-function","display_name":"Lyapunov function","score":0.5073999762535095},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.48260000348091125},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.4528000056743622},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.42879998683929443},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.42480000853538513},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.41110000014305115}],"concepts":[{"id":"https://openalex.org/C72169020","wikidata":"https://www.wikidata.org/wiki/Q194404","display_name":"Monotonic function","level":2,"score":0.5321000218391418},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.5271999835968018},{"id":"https://openalex.org/C60640748","wikidata":"https://www.wikidata.org/wiki/Q2337858","display_name":"Lyapunov function","level":3,"score":0.5073999762535095},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.48260000348091125},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4787999987602234},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4675999879837036},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4553999900817871},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.4528000056743622},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.42879998683929443},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.42480000853538513},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.41110000014305115},{"id":"https://openalex.org/C68710425","wikidata":"https://www.wikidata.org/wiki/Q5275442","display_name":"Diffusion process","level":3,"score":0.40709999203681946},{"id":"https://openalex.org/C207390915","wikidata":"https://www.wikidata.org/wiki/Q1230525","display_name":"Divergence (linguistics)","level":2,"score":0.39489999413490295},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3727000057697296},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.35679998993873596},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.3280999958515167},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3278000056743622},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.3165000081062317},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.31470000743865967},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2969000041484833},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.29019999504089355},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.2827000021934509},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.28130000829696655},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.2517000138759613}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.01045","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.01045","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.01045","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.01045","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Diffusion":[0],"models":[1,5,130],"and":[2,44,91,131,163,169,189,205,217,241],"score-based":[3],"generative":[4,129,228],"provide":[6],"a":[7,67,87,94,99,106,110,133,182,190,231,243],"powerful":[8],"framework":[9,122],"for":[10,62,102,246],"synthesizing":[11],"high-quality":[12],"images":[13,188],"from":[14,86,237],"noise.":[15],"However,":[16],"there":[17],"is":[18,138],"still":[19],"no":[20],"satisfactory":[21],"theory":[22],"that":[23,93,137,197],"describes":[24],"how":[25],"coarse-grained":[26,254],"quantities,":[27],"such":[28],"as":[29,74,109,146,175,230],"blockwise":[30],"intensity":[31],"or":[32],"class":[33],"proportions":[34],"after":[35],"partitioning":[36],"an":[37,57,176,234],"image":[38],"into":[39,71],"spatial":[40],"blocks,":[41,72],"are":[42],"preserved":[43],"evolve":[45],"along":[46],"the":[47,54,75,80,124,141,147,154,170,198,202,206,210,222],"reverse":[48,125,134,150,192,247],"diffusion":[49,126,135,248],"dynamics.":[50,224],"In":[51,116],"previous":[52],"work,":[53],"author":[55],"introduced":[56],"information-theoretic":[58],"Lyapunov":[59,178],"function":[60],"V":[61,157],"non-ergodic":[63],"Markov":[64,161],"processes":[65,249],"on":[66,113],"state":[68],"space":[69],"partitioned":[70],"defined":[73],"minimal":[76],"Kullback-Leibler":[77],"divergence":[78],"to":[79,123,145,158,221,239],"set":[81],"of":[82,156,186,233,253],"stationary":[83],"distributions":[84],"reachable":[85],"given":[88],"initial":[89],"condition,":[90],"showed":[92],"leak-tolerant":[95,207],"potential":[96,142,208,236],"V-delta":[97,143,148,171,173],"with":[98,250],"prescribed":[100,211],"tolerance":[101],"block":[103,114],"masses":[104],"admits":[105],"closed-form":[107],"expression":[108],"scaling-and-clipping":[111],"operation":[112],"masses.":[115],"this":[117,121],"paper,":[118],"I":[119,152,194],"transplant":[120],"process":[127],"in":[128],"propose":[132],"scheme":[136],"projected":[139,149],"by":[140],"(referred":[144],"diffusion).":[151],"extend":[153],"monotonicity":[155],"time-inhomogeneous":[159],"block-preserving":[160],"kernels":[162],"show":[164],"that,":[165],"under":[166],"small":[167],"leakage":[168],"projection,":[172],"acts":[174],"approximate":[177],"function.":[179],"Furthermore,":[180],"using":[181],"toy":[183],"model":[184],"consisting":[185],"block-constant":[187],"simplified":[191],"kernel,":[193],"numerically":[195],"demonstrate":[196],"proposed":[199],"method":[200],"keeps":[201],"block-mass":[203],"error":[204],"within":[209],"tolerance,":[212],"while":[213],"achieving":[214],"pixel-wise":[215],"accuracy":[216],"visual":[218],"quality":[219],"comparable":[220],"non-projected":[223],"This":[225],"study":[226],"reinterprets":[227],"sampling":[229],"decrease":[232],"information":[235],"noise":[238],"data,":[240],"provides":[242],"design":[244],"principle":[245],"explicit":[251],"control":[252],"quantities.":[255]},"counts_by_year":[],"updated_date":"2026-01-08T20:10:11.968330","created_date":"2026-01-08T00:00:00"}
