{"id":"https://openalex.org/W7140171967","doi":"https://doi.org/10.48550/arxiv.2603.20589","title":"Generating from Discrete Distributions Using Diffusions: Insights from Random Constraint Satisfaction Problems","display_name":"Generating from Discrete Distributions Using Diffusions: Insights from Random Constraint Satisfaction Problems","publication_year":2026,"publication_date":"2026-03-21","ids":{"openalex":"https://openalex.org/W7140171967","doi":"https://doi.org/10.48550/arxiv.2603.20589"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.20589","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.20589","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.20589","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Bhatt, Alankrita","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhatt, Alankrita","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Gupta, Mukur","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gupta, Mukur","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Kolossov, Germain","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kolossov, Germain","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Montanari, Andrea","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Montanari, Andrea","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.8432999849319458,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.8432999849319458,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12056","display_name":"Markov Chains and Monte Carlo Methods","score":0.017400000244379044,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11303","display_name":"Bayesian Modeling and Causal Inference","score":0.011099999770522118,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.7095000147819519},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5478000044822693},{"id":"https://openalex.org/keywords/observable","display_name":"Observable","score":0.5195000171661377},{"id":"https://openalex.org/keywords/random-variable","display_name":"Random variable","score":0.5069000124931335},{"id":"https://openalex.org/keywords/probability-distribution","display_name":"Probability distribution","score":0.46880000829696655},{"id":"https://openalex.org/keywords/constraint-satisfaction-problem","display_name":"Constraint satisfaction problem","score":0.4124999940395355},{"id":"https://openalex.org/keywords/joint-probability-distribution","display_name":"Joint probability distribution","score":0.41190001368522644},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.40290001034736633}],"concepts":[{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.7095000147819519},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.5837000012397766},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5478000044822693},{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.5195000171661377},{"id":"https://openalex.org/C122123141","wikidata":"https://www.wikidata.org/wiki/Q176623","display_name":"Random variable","level":2,"score":0.5069000124931335},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.46880000829696655},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.42289999127388},{"id":"https://openalex.org/C199622910","wikidata":"https://www.wikidata.org/wiki/Q1128326","display_name":"Constraint satisfaction problem","level":3,"score":0.4124999940395355},{"id":"https://openalex.org/C18653775","wikidata":"https://www.wikidata.org/wiki/Q1333358","display_name":"Joint probability distribution","level":2,"score":0.41190001368522644},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.40290001034736633},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3693000078201294},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3691999912261963},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.35670000314712524},{"id":"https://openalex.org/C110121322","wikidata":"https://www.wikidata.org/wiki/Q865811","display_name":"Distribution (mathematics)","level":2,"score":0.34599998593330383},{"id":"https://openalex.org/C8272713","wikidata":"https://www.wikidata.org/wiki/Q176737","display_name":"Stochastic process","level":2,"score":0.32089999318122864},{"id":"https://openalex.org/C12426560","wikidata":"https://www.wikidata.org/wiki/Q189569","display_name":"Basis (linear algebra)","level":2,"score":0.2994999885559082},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.2888999879360199},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2743000090122223},{"id":"https://openalex.org/C44616089","wikidata":"https://www.wikidata.org/wiki/Q30158686","display_name":"Constraint satisfaction","level":3,"score":0.27379998564720154},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C122203268","wikidata":"https://www.wikidata.org/wiki/Q5862903","display_name":"Probability theory","level":2,"score":0.26179999113082886},{"id":"https://openalex.org/C197096303","wikidata":"https://www.wikidata.org/wiki/Q869887","display_name":"Probability mass function","level":3,"score":0.26159998774528503},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25839999318122864}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.20589","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.20589","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.20589","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.20589","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Generating":[0],"data":[1],"from":[2,44],"discrete":[3,97],"distributions":[4],"is":[5],"important":[6],"for":[7,32],"a":[8,29,75,80],"number":[9],"of":[10,47,61,73,79,109],"application":[11],"domains":[12],"including":[13],"text,":[14],"tabular":[15],"data,":[16],"and":[17],"genomic":[18],"data.":[19],"Several":[20],"groups":[21],"have":[22,52],"recently":[23],"used":[24],"random":[25,48,77],"$k$-satisfiability":[26],"($k$-SAT)":[27],"as":[28],"synthetic":[30],"benchmark":[31],"new":[33],"generative":[34,62],"techniques.":[35],"In":[36],"this":[37],"paper,":[38],"we":[39,69,90],"show":[40],"that":[41],"fundamental":[42],"insights":[43],"the":[45,59,71,103,110],"theory":[46],"constraint":[49],"satisfaction":[50],"problems":[51],"observable":[53],"implications":[54],"(sometime":[55],"contradicting":[56],"intuition)":[57],"on":[58,64],"behavior":[60],"techniques":[63],"such":[65],"benchmarks.":[66],"More":[67],"precisely,":[68],"study":[70],"problem":[72],"generating":[74],"uniformly":[76],"solution":[78],"given":[81],"(random)":[82],"$k$-SAT":[83],"or":[84],"$k$-XORSAT":[85],"formula.":[86],"Among":[87],"other":[88],"findings,":[89],"observe":[91],"that:":[92],"$(i)$~Continuous":[93],"diffusions":[94,100],"outperform":[95],"masked":[96],"diffusions;":[98],"$(ii)$~Learned":[99],"can":[101,112],"match":[102],"theoretical":[104],"`ideal'":[105],"accuracy;":[106],"$(iii)$~Smart":[107],"ordering":[108],"variables":[111],"significantly":[113],"improve":[114],"accuracy,":[115],"although":[116],"not":[117],"following":[118],"popular":[119],"heuristics.":[120]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-25T00:00:00"}
