{"id":"https://openalex.org/W7155214498","doi":"https://doi.org/10.48550/arxiv.2604.18995","title":"$R^2$-dLLM: Accelerating Diffusion Large Language Models via Spatio-Temporal Redundancy Reduction","display_name":"$R^2$-dLLM: Accelerating Diffusion Large Language Models via Spatio-Temporal Redundancy Reduction","publication_year":2026,"publication_date":"2026-04-21","ids":{"openalex":"https://openalex.org/W7155214498","doi":"https://doi.org/10.48550/arxiv.2604.18995"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.18995","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18995","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.18995","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079778367","display_name":"Zhenbang Du","orcid":"https://orcid.org/0000-0002-1386-8381"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Zhenbang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119181802","display_name":"Kejing Xia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xia, Kejing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002304298","display_name":"Xinrui Zhong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhong, Xinrui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061572132","display_name":"Yonggan Fu","orcid":"https://orcid.org/0000-0002-7483-2921"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fu, Yonggan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036931296","display_name":"Nicolai Oswald","orcid":"https://orcid.org/0009-0009-9272-0518"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oswald, Nicolai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134289069","display_name":"Binfei Ji","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ji, Binfei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010156116","display_name":"Brucek Khailany","orcid":"https://orcid.org/0000-0002-7584-3489"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khailany, Brucek","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134237517","display_name":"Pavlo Molchanov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Molchanov, Pavlo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134301971","display_name":"Yingyan Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Yingyan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3603000044822693,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.3603000044822693,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.09040000289678574,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.06109999865293503,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.8698999881744385},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.7515000104904175},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.6398000121116638},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5745999813079834},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.5282999873161316},{"id":"https://openalex.org/keywords/inefficiency","display_name":"Inefficiency","score":0.5095000267028809},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.42399999499320984}],"concepts":[{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.8698999881744385},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.7515000104904175},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7501000165939331},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.6398000121116638},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5745999813079834},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.5282999873161316},{"id":"https://openalex.org/C2778869765","wikidata":"https://www.wikidata.org/wiki/Q6028363","display_name":"Inefficiency","level":2,"score":0.5095000267028809},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4269999861717224},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.42399999499320984},{"id":"https://openalex.org/C193969084","wikidata":"https://www.wikidata.org/wiki/Q7452500","display_name":"Sequential decoding","level":4,"score":0.3887999951839447},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34060001373291016},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.31349998712539673},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.30869999527931213},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.29580000042915344},{"id":"https://openalex.org/C204397858","wikidata":"https://www.wikidata.org/wiki/Q4437907","display_name":"List decoding","level":5,"score":0.29089999198913574},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.259799987077713},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.25450000166893005}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.18995","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18995","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.18995","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.18995","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Diffusion":[0],"Large":[1],"Language":[2],"Models":[3],"(dLLMs)":[4],"have":[5,71],"emerged":[6],"as":[7],"a":[8,38,81,122,179],"promising":[9],"alternative":[10],"to":[11,114,155,158],"autoregressive":[12],"generation":[13,165],"by":[14,56,66,75,153],"enabling":[15],"parallel":[16],"token":[17,107],"prediction.":[18],"However,":[19],"practical":[20,191],"dLLM":[21],"decoding":[22,50,86,100,117,133,151,160,176],"still":[23],"suffers":[24],"from":[25,45,88],"high":[26],"inference":[27,90,95],"latency,":[28],"which":[29],"limits":[30],"deployment.":[31],"In":[32],"this":[33,42],"work,":[34],"we":[35,78,97],"observe":[36],"that":[37,70,102,127,144,175,185],"substantial":[39,190],"part":[40],"of":[41,150],"inefficiency":[43],"comes":[44],"recurring":[46],"redundancy":[47,54,64,87,177],"in":[48,182],"the":[49,129,148],"process,":[51],"including":[52],"spatial":[53],"caused":[55,65],"confidence":[57,105],"clusters":[58],"and":[59,62,91,106,109,135,170,184,196],"positional":[60],"ambiguity,":[61],"temporal":[63],"repeatedly":[67],"remasking":[68],"predictions":[69],"already":[72],"stabilized.":[73],"Motivated":[74],"these":[76],"patterns,":[77],"propose":[79,121],"$R^{2}$-dLLM,":[80],"unified":[82],"framework":[83],"for":[84],"reducing":[85,187],"both":[89],"training":[92],"perspectives.":[93],"At":[94],"time,":[96],"introduce":[98],"training-free":[99],"rules":[101],"aggregate":[103],"local":[104],"predictions,":[108],"finalize":[110],"temporally":[111],"stable":[112],"tokens":[113],"avoid":[115],"redundant":[116],"steps.":[118],"We":[119],"further":[120],"redundancy-aware":[123],"supervised":[124],"fine-tuning":[125],"pipeline":[126],"aligns":[128],"model":[130],"with":[131],"efficient":[132],"trajectories":[134],"reduces":[136,147],"reliance":[137],"on":[138],"manually":[139],"tuned":[140],"thresholds.":[141],"Experiments":[142],"demonstrate":[143],"$R^{2}$-dLLM":[145],"consistently":[146],"number":[149],"steps":[152],"up":[154],"88\\%":[156],"compared":[157],"existing":[159],"strategies,":[161],"while":[162],"maintaining":[163],"competitive":[164],"quality":[166],"across":[167],"different":[168],"models":[169,197],"tasks.":[171],"These":[172],"results":[173],"validate":[174],"is":[178],"central":[180],"bottleneck":[181],"dLLMs,":[183],"explicitly":[186],"it":[188],"yields":[189],"efficiency":[192],"gains.":[193],"Our":[194],"code":[195],"are":[198],"available":[199],"at":[200],"https://github.com/GATECH-EIC/R2-dLLM.":[201]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-04-23T00:00:00"}
