{"id":"https://openalex.org/W4415367652","doi":"https://doi.org/10.1109/isit63088.2025.11195663","title":"Coupling Without Communication and Drafter-Invariant Speculative Decoding","display_name":"Coupling Without Communication and Drafter-Invariant Speculative Decoding","publication_year":2025,"publication_date":"2025-06-22","ids":{"openalex":"https://openalex.org/W4415367652","doi":"https://doi.org/10.1109/isit63088.2025.11195663"},"language":null,"primary_location":{"id":"doi:10.1109/isit63088.2025.11195663","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isit63088.2025.11195663","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Symposium on Information Theory (ISIT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064845272","display_name":"Majid Daliri","orcid":"https://orcid.org/0000-0003-4001-4346"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Majid Daliri","raw_affiliation_strings":["New York University"],"affiliations":[{"raw_affiliation_string":"New York University","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018420180","display_name":"Christopher Musco","orcid":"https://orcid.org/0000-0002-3118-4848"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christopher Musco","raw_affiliation_strings":["New York University"],"affiliations":[{"raw_affiliation_string":"New York University","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103890688","display_name":"Ananda Theertha Suresh","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ananda Theertha Suresh","raw_affiliation_strings":["Google Research,NY"],"affiliations":[{"raw_affiliation_string":"Google Research,NY","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5064845272"],"corresponding_institution_ids":["https://openalex.org/I57206974"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.16440615,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.987500011920929,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.987500011920929,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9147999882698059,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11567","display_name":"semigroups and automata theory","score":0.9054999947547913,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/alice-and-bob","display_name":"Alice and Bob","score":0.7127000093460083},{"id":"https://openalex.org/keywords/gumbel-distribution","display_name":"Gumbel distribution","score":0.6741999983787537},{"id":"https://openalex.org/keywords/alice","display_name":"Alice (programming language)","score":0.6528000235557556},{"id":"https://openalex.org/keywords/coupling","display_name":"Coupling (piping)","score":0.5127999782562256},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.5006999969482422},{"id":"https://openalex.org/keywords/probability-distribution","display_name":"Probability distribution","score":0.492900013923645},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.4812000095844269},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.47290000319480896}],"concepts":[{"id":"https://openalex.org/C127964579","wikidata":"https://www.wikidata.org/wiki/Q649676","display_name":"Alice and Bob","level":3,"score":0.7127000093460083},{"id":"https://openalex.org/C137610916","wikidata":"https://www.wikidata.org/wiki/Q1096862","display_name":"Gumbel distribution","level":3,"score":0.6741999983787537},{"id":"https://openalex.org/C2778222013","wikidata":"https://www.wikidata.org/wiki/Q1136926","display_name":"Alice (programming language)","level":2,"score":0.6528000235557556},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5329999923706055},{"id":"https://openalex.org/C131584629","wikidata":"https://www.wikidata.org/wiki/Q4308705","display_name":"Coupling (piping)","level":2,"score":0.5127999782562256},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.5006999969482422},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.492900013923645},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.4812000095844269},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.47290000319480896},{"id":"https://openalex.org/C52740198","wikidata":"https://www.wikidata.org/wiki/Q1539564","display_name":"Importance sampling","level":3,"score":0.44440001249313354},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.4316999912261963},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.4009000062942505},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.40070000290870667},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4000000059604645},{"id":"https://openalex.org/C110121322","wikidata":"https://www.wikidata.org/wiki/Q865811","display_name":"Distribution (mathematics)","level":2,"score":0.3991999924182892},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.3375999927520752},{"id":"https://openalex.org/C121864883","wikidata":"https://www.wikidata.org/wiki/Q677916","display_name":"Statistical physics","level":1,"score":0.33239999413490295},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.3203999996185303},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.3165999948978424},{"id":"https://openalex.org/C147581598","wikidata":"https://www.wikidata.org/wiki/Q729429","display_name":"Extreme value theory","level":2,"score":0.311599999666214},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.3102000057697296},{"id":"https://openalex.org/C2777317252","wikidata":"https://www.wikidata.org/wiki/Q18393516","display_name":"Rare events","level":2,"score":0.28929999470710754},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2759000062942505},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.27489998936653137},{"id":"https://openalex.org/C77553402","wikidata":"https://www.wikidata.org/wiki/Q13222579","display_name":"Upper and lower bounds","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.2678000032901764},{"id":"https://openalex.org/C137635306","wikidata":"https://www.wikidata.org/wiki/Q182667","display_name":"Pareto principle","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/isit63088.2025.11195663","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isit63088.2025.11195663","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Symposium on Information Theory (ISIT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W1965996575","https://openalex.org/W1982682305","https://openalex.org/W2013809345","https://openalex.org/W2061130579","https://openalex.org/W2126907894","https://openalex.org/W2152912600","https://openalex.org/W2218607027","https://openalex.org/W2962921917","https://openalex.org/W3083028011","https://openalex.org/W3101751096","https://openalex.org/W3203538342","https://openalex.org/W4379135640","https://openalex.org/W4399522748"],"related_works":[],"abstract_inverted_index":{"Suppose":[0],"Alice":[1,16,61,92],"has":[2,10],"a":[3,11,20,29,124,164,200,246,280,321],"distribution":[4,12],"<tex":[5,13,22,31,38,66,72,83,87,114,208,212,224,326,337],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[6,14,23,32,39,67,73,84,88,115,209,213,225,327,338],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathcal{P}$</tex>":[7,85,210],"and":[8,27,62,86,93,149,211],"Bob":[9,28,63,94],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathcal{Q}$</tex>.":[15,89],"wants":[17],"to":[18,107,137,234,243,263,335,343],"draw":[19],"sample":[21,30],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$a":[24],"\\sim":[25,34],"\\mathcal{P}$</tex>":[26],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$b":[33],"\\mathcal{Q}$</tex>":[35],"such":[36],"that":[37,257,274,323],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$a=b$</tex>":[40],"with":[41,105],"as":[42,46],"high":[43],"of":[44,167,185,206,223,240,285,333],"probability":[45,184],"possible.":[47],"It":[48],"is":[49,77,277,288,313],"well-known":[50],"that,":[51,179],"by":[52,143],"sampling":[53,198,216,298],"from":[54,171],"an":[55,191,218,238],"optimal":[56,139,346],"coupling":[57,242,306],"between":[58,82],"the":[59,78,129,141,158,168,181,271,305,309],"distributions,":[60],"can":[64,111,260],"achieve":[65,113,336],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\operatorname{Pr}[a=b]=1-D_{T":[68,339],"V}(\\mathcal{P},":[69,75,119,121,340],"\\mathcal{Q})$</tex>,":[70],"where":[71,311],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$D_{T":[74],"\\mathcal{Q})$</tex>":[76],"total":[79],"variation":[80],"distance":[81],"What":[90],"if":[91],"must":[95],"solve":[96],"this":[97,154,231],"same":[98],"problem":[99,307],"without":[100],"communicating":[101],"at":[102],"all?":[103],"Surprisingly,":[104],"access":[106],"public":[108],"randomness,":[109],"they":[110],"still":[112],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\operatorname{Pr}[a=b]":[116],"\\geq":[117],"\\frac{1-D_{T":[118],"\\mathcal{Q})}{1+D_{T":[120],"\\mathcal{Q})}$</tex>":[122],"using":[123],"simple":[125,193],"protocol":[126,194,322],"based":[127,195],"on":[128,196,294],"Weighted":[130,186,228,300],"MinHash":[131,187],"algorithm.":[132],"This":[133],"bound":[134],"was":[135],"shown":[136],"be":[138,189,261],"in":[140,308],"worst-case":[142,182],"Bavarian,":[144],"Ghazi,":[145],"Haramaty,":[146],"Kamath,":[147],"Rivest,":[148],"Sudan":[150],"[ToC":[151],"2020].":[152,175],"In":[153,292],"work,":[155],"we":[156,177,303],"revisit":[157],"\u201ccommunication-free":[159],"coupling\u201d":[160],"problem.":[161],"We":[162,236,255,319],"provide":[163],"simpler":[165],"proof":[166],"optimality":[169],"result":[170],"[Bavarian":[172],"et":[173],"al.,":[174],"Moreover":[176],"show":[178,256],"while":[180],"success":[183],"cannot":[188],"improved,":[190],"equally":[192],"Gumbel":[197,215,297],"offers":[199],"Pareto":[201],"improvement:":[202],"for":[203,249,290],"every":[204],"pair":[205],"distributions":[207],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathcal{Q}$</tex>,":[214],"achieves":[217],"equal":[219],"or":[220],"higher":[221],"value":[222],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\operatorname{Pr}[a=b]$</tex>":[226],"than":[227,316],"MinHash.":[229,301],"Importantly,":[230],"improvement":[232],"translates":[233],"practice.":[235],"demonstrate":[237],"application":[239],"communicationfree":[241],"speculative":[244],"decoding,":[245],"recent":[247],"method":[248],"accelerating":[250],"autoregressive":[251],"large":[252],"language":[253,295],"models.":[254],"communication-free":[258],"protocols":[259],"used":[262,289],"construct":[264],"DrafterInvariant":[265],"Speculative":[266],"Decoding":[267],"schemes,":[268],"which":[269],"have":[270],"desirable":[272],"property":[273],"their":[275],"output":[276],"fixed":[278,281],"given":[279],"random":[282],"seed,":[283],"regardless":[284],"what":[286],"drafter":[287],"speculation.":[291],"experiments":[293],"generation,":[296],"outperforms":[299],"Finally,":[302],"study":[304],"setting":[310],"communication":[312,334],"bounded,":[314],"rather":[315],"completely":[317],"eliminated.":[318],"describe":[320],"uses":[324],"just":[325],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$O(\\log":[328],"(n":[329],"/":[330],"\\epsilon))$</tex>":[331],"bits":[332],"\\mathcal{Q})-\\epsilon$</tex>,":[341],"i.e.":[342],"essentially":[344],"match":[345],"coupling.":[347]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-21T00:00:00"}
