{"id":"https://openalex.org/W7148412097","doi":"https://doi.org/10.48550/arxiv.2604.00375","title":"Locally Confident, Globally Stuck: The Quality-Exploration Dilemma in Diffusion Language Models","display_name":"Locally Confident, Globally Stuck: The Quality-Exploration Dilemma in Diffusion Language Models","publication_year":2026,"publication_date":"2026-04-01","ids":{"openalex":"https://openalex.org/W7148412097","doi":"https://doi.org/10.48550/arxiv.2604.00375"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.00375","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00375","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.00375","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132829952","display_name":"Liancheng Fang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Fang, Liancheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132804646","display_name":"Aiwei Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Aiwei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132825235","display_name":"Henry Peng Zou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zou, Henry Peng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125006830","display_name":"Yankai Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Yankai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132753627","display_name":"Enze Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Enze","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132822681","display_name":"Leyi Pan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan, Leyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132808048","display_name":"Chunyu Miao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Miao, Chunyu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132803237","display_name":"Wei-Chieh Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Wei-Chieh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132828780","display_name":"Xue Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132824958","display_name":"Philip S. Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Philip S.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5132829952"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.4717000126838684,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.4717000126838684,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.04960000142455101,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.0414000004529953,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.5723999738693237},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.5562999844551086},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.5523999929428101},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.4715999960899353},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4708000123500824},{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.46230000257492065},{"id":"https://openalex.org/keywords/probability-distribution","display_name":"Probability distribution","score":0.42309999465942383},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.41040000319480896}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.670799970626831},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.5723999738693237},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.5562999844551086},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.5523999929428101},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.4715999960899353},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4708000123500824},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.46230000257492065},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.42309999465942383},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.41040000319480896},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3953000009059906},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.39419999718666077},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.3889000117778778},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3614000082015991},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.3312999904155731},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.32749998569488525},{"id":"https://openalex.org/C2778496695","wikidata":"https://www.wikidata.org/wiki/Q254128","display_name":"Dilemma","level":2,"score":0.31630000472068787},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.314300000667572},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3140000104904175},{"id":"https://openalex.org/C2780148112","wikidata":"https://www.wikidata.org/wiki/Q1432581","display_name":"Proxy (statistics)","level":2,"score":0.2922999858856201},{"id":"https://openalex.org/C9679016","wikidata":"https://www.wikidata.org/wiki/Q1417473","display_name":"Principle of maximum entropy","level":2,"score":0.287200003862381},{"id":"https://openalex.org/C171268870","wikidata":"https://www.wikidata.org/wiki/Q1486676","display_name":"GRASP","level":2,"score":0.2662000060081482},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2605000138282776},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2596000134944916},{"id":"https://openalex.org/C8272713","wikidata":"https://www.wikidata.org/wiki/Q176737","display_name":"Stochastic process","level":2,"score":0.25589999556541443},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.2556000053882599},{"id":"https://openalex.org/C177321328","wikidata":"https://www.wikidata.org/wiki/Q13580479","display_name":"Goldilocks principle","level":2,"score":0.2513999938964844}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.00375","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00375","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.00375","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.00375","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Diffusion":[0],"large":[1],"language":[2],"models":[3],"(dLLMs)":[4],"theoretically":[5],"permit":[6],"token":[7],"decoding":[8,30],"in":[9],"arbitrary":[10],"order,":[11],"a":[12,61,70,82,114,128],"flexibility":[13],"that":[14,78,106,119,140],"could":[15],"enable":[16],"richer":[17],"exploration":[18,53],"of":[19,73,92,130],"reasoning":[20,131],"paths":[21],"than":[22,147],"autoregressive":[23],"(AR)":[24],"LLMs.":[25],"In":[26,65],"practice,":[27],"however,":[28],"random-order":[29],"often":[31],"hurts":[32],"generation":[33],"quality.":[34],"To":[35,97],"mitigate":[36],"this,":[37],"low-confidence":[38,79,151],"remasking":[39,80],"improves":[40,81],"single-sample":[41],"quality":[42,86,109],"(e.g.,":[43,58],"Pass@$1$)":[44],"by":[45],"prioritizing":[46],"confident":[47],"tokens,":[48],"but":[49],"it":[50],"also":[51],"suppresses":[52],"and":[54,110,112,137,150],"limits":[55],"multi-sample":[56],"gains":[57],"Pass@$k$),":[59],"creating":[60],"fundamental":[62],"quality--exploration":[63],"dilemma.":[64,75],"this":[66,74,99,122],"paper,":[67],"we":[68,101],"provide":[69],"unified":[71],"explanation":[72],"We":[76],"show":[77,139],"myopic":[83],"proxy":[84],"for":[85],"while":[87],"provably":[88],"constraining":[89],"the":[90,93,103],"entropy":[91],"induced":[94],"sequence":[95],"distribution.":[96],"overcome":[98],"limitation,":[100],"characterize":[102],"optimal":[104],"distribution":[105,123],"explicitly":[107],"balances":[108],"exploration,":[111],"develop":[113],"simple":[115],"Independent":[116],"Metropolis--Hastings":[117],"sampler":[118],"approximately":[120],"targets":[121],"during":[124],"decoding.":[125],"Experiments":[126],"across":[127],"range":[129],"benchmarks":[132],"including":[133],"MATH500,":[134],"AIME24/25,":[135],"HumanEval,":[136],"MBPP":[138],"our":[141],"approach":[142],"yields":[143],"better":[144],"exploration-quality":[145],"tradeoff":[146],"both":[148],"random":[149],"remasking.":[152]},"counts_by_year":[],"updated_date":"2026-04-03T16:44:17.987007","created_date":"2026-04-03T00:00:00"}
