{"id":"https://openalex.org/W7161724837","doi":"https://doi.org/10.48550/arxiv.2605.17232","title":"Dimension-Free Convergence of Discrete Diffusion Models: Adjoint Equations Induce the Right Space","display_name":"Dimension-Free Convergence of Discrete Diffusion Models: Adjoint Equations Induce the Right Space","publication_year":2026,"publication_date":"2026-05-17","ids":{"openalex":"https://openalex.org/W7161724837","doi":"https://doi.org/10.48550/arxiv.2605.17232"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.17232","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17232","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.17232","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136462379","display_name":"Kelvin Kan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kan, Kelvin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136486257","display_name":"Xingjian Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xingjian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007765084","display_name":"B. Zhang","orcid":"https://orcid.org/0000-0002-4170-5096"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Benjamin J.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057249914","display_name":"Tuhin Sahai","orcid":"https://orcid.org/0000-0003-1896-8768"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sahai, Tuhin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136461239","display_name":"Stanley Osher","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Osher, Stanley","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5045079747","display_name":"Markos A. Katsoulakis","orcid":"https://orcid.org/0000-0003-4354-1766"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Katsoulakis, Markos A.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10730","display_name":"Language Development and Disorders","score":0.2671999931335449,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10730","display_name":"Language Development and Disorders","score":0.2671999931335449,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10465","display_name":"Neurobiology of Language and Bilingualism","score":0.09640000015497208,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.07779999822378159,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.6238999962806702},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5580999851226807},{"id":"https://openalex.org/keywords/observable","display_name":"Observable","score":0.506600022315979},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4731000065803528},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.4453999996185303},{"id":"https://openalex.org/keywords/weak-convergence","display_name":"Weak convergence","score":0.4415000081062317},{"id":"https://openalex.org/keywords/argument","display_name":"Argument (complex analysis)","score":0.41530001163482666},{"id":"https://openalex.org/keywords/probability-measure","display_name":"Probability measure","score":0.3986000120639801},{"id":"https://openalex.org/keywords/coupling","display_name":"Coupling (piping)","score":0.3910999894142151}],"concepts":[{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.6761000156402588},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.6238999962806702},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5580999851226807},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.5476999878883362},{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.506600022315979},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4731000065803528},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.4453999996185303},{"id":"https://openalex.org/C57945734","wikidata":"https://www.wikidata.org/wiki/Q7977941","display_name":"Weak convergence","level":3,"score":0.4415000081062317},{"id":"https://openalex.org/C98184364","wikidata":"https://www.wikidata.org/wiki/Q1780131","display_name":"Argument (complex analysis)","level":2,"score":0.41530001163482666},{"id":"https://openalex.org/C21031990","wikidata":"https://www.wikidata.org/wiki/Q355020","display_name":"Probability measure","level":2,"score":0.3986000120639801},{"id":"https://openalex.org/C131584629","wikidata":"https://www.wikidata.org/wiki/Q4308705","display_name":"Coupling (piping)","level":2,"score":0.3910999894142151},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.37560001015663147},{"id":"https://openalex.org/C2777634741","wikidata":"https://www.wikidata.org/wiki/Q768993","display_name":"Wasserstein metric","level":2,"score":0.3752000033855438},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.3709000051021576},{"id":"https://openalex.org/C55689738","wikidata":"https://www.wikidata.org/wiki/Q15963867","display_name":"Discrete time and continuous time","level":2,"score":0.3400999903678894},{"id":"https://openalex.org/C198043062","wikidata":"https://www.wikidata.org/wiki/Q180953","display_name":"Metric space","level":2,"score":0.3310000002384186},{"id":"https://openalex.org/C2777299769","wikidata":"https://www.wikidata.org/wiki/Q3707858","display_name":"Type (biology)","level":2,"score":0.32670000195503235},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.302700012922287},{"id":"https://openalex.org/C62799726","wikidata":"https://www.wikidata.org/wiki/Q190056","display_name":"Hilbert space","level":2,"score":0.296099990606308},{"id":"https://openalex.org/C153782549","wikidata":"https://www.wikidata.org/wiki/Q175116","display_name":"Discrete space","level":2,"score":0.2906000018119812},{"id":"https://openalex.org/C157709441","wikidata":"https://www.wikidata.org/wiki/Q1411887","display_name":"Uniform convergence","level":3,"score":0.27140000462532043},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.26759999990463257},{"id":"https://openalex.org/C48216909","wikidata":"https://www.wikidata.org/wiki/Q6889156","display_name":"Modes of convergence (annotated index)","level":5,"score":0.2667999863624573},{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.2639000117778778},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.2619999945163727},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.2615000009536743},{"id":"https://openalex.org/C122203268","wikidata":"https://www.wikidata.org/wiki/Q5862903","display_name":"Probability theory","level":2,"score":0.25600001215934753},{"id":"https://openalex.org/C27851653","wikidata":"https://www.wikidata.org/wiki/Q829653","display_name":"Bounded variation","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.2531000077724457}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.17232","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17232","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.17232","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.17232","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.41361555457115173,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Discrete":[0],"diffusion":[1,207],"has":[2],"become":[3,50],"a":[4,66,112,144,153,198],"leading":[5],"framework":[6,69,175,196],"for":[7,52,201],"generative":[8],"modeling":[9],"in":[10,38,75,130],"various":[11],"applications":[12],"including":[13,209],"language,":[14],"vision,":[15],"and":[16,49,98,103,118,162,165,182,188,215],"biology.":[17],"Existing":[18],"convergence":[19,73,193],"theory,":[20],"however,":[21],"exhibits":[22],"fundamental":[23],"limitations.":[24],"KL-based":[25],"analyses":[26,181],"diverge":[27],"under":[28,159,171],"singular":[29],"priors":[30],"such":[31],"as":[32],"the":[33,44,82,90,131,184],"masked":[34,102,172],"distribution,":[35],"while":[36],"bounds":[37,88,149],"total":[39],"variation":[40],"(TV)":[41],"depend":[42],"on":[43,111,150],"state":[45],"space":[46,132],"size":[47],"$S$":[48,97],"vacuous":[51],"modern":[53],"language":[54],"tasks,":[55],"where":[56],"vocabularies":[57],"contain":[58],"hundreds":[59],"of":[60,62,84,96,133,186,205,212],"thousands":[61],"tokens.":[63],"We":[64],"develop":[65],"unified":[67],"adjoint-equation-based":[68],"that":[70,147,156,168],"establishes":[71],"dimension-free":[72,216],"guarantees":[74],"any":[76,151],"integral":[77],"probability":[78,142],"metric":[79],"(IPM).":[80],"To":[81],"best":[83],"our":[85,87,107,127,195],"knowledge,":[86],"are":[89],"first":[91],"to":[92,100,120],"be":[93],"entirely":[94],"free":[95],"applicable":[99],"both":[101],"uniform":[104,160],"priors.":[105,122],"Importantly,":[106],"theory":[108],"relies":[109],"only":[110],"single":[113],"standard":[114],"rate-matrix":[115],"regularity":[116,145],"assumption":[117],"applies":[119],"general":[121],"Five":[123],"novel":[124],"techniques":[125,167],"drive":[126],"improvements:":[128],"working":[129],"observables":[134],"via":[135],"adjoint":[136],"equations":[137],"rather":[138],"than":[139],"directly":[140],"with":[141],"measures,":[143],"analysis":[146],"yields":[148],"IPM,":[152],"coupling":[154],"argument":[155],"removes":[157],"$S$-dependence":[158,170],"transitions,":[161],"score-marginal":[163],"cancellation":[164],"exit-routing":[166],"remove":[169],"transitions.":[173],"Our":[174],"thus":[176],"sharply":[177],"departs":[178],"from":[179],"prior":[180],"avoids":[183],"shortcomings":[185],"pathspace-KL":[187],"existing":[189],"TV-based":[190],"approaches.":[191],"Beyond":[192],"bounds,":[194],"provides":[197],"versatile":[199],"toolkit":[200],"further":[202],"theoretical":[203],"study":[204],"discrete":[206],"models,":[208],"principled":[210],"choices":[211],"loss":[213],"functions":[214],"step":[217],"complexity.":[218]},"counts_by_year":[],"updated_date":"2026-06-19T15:47:20.252518","created_date":"2026-05-20T00:00:00"}
