{"id":"https://openalex.org/W7155071750","doi":"https://doi.org/10.48550/arxiv.2604.17182","title":"Layer-wise MoE Routing Locality under Shared-Prefix Code Generation: Token-Identity Decomposition and Compile-Equivalent Fork Redundancy","display_name":"Layer-wise MoE Routing Locality under Shared-Prefix Code Generation: Token-Identity Decomposition and Compile-Equivalent Fork Redundancy","publication_year":2026,"publication_date":"2026-04-19","ids":{"openalex":"https://openalex.org/W7155071750","doi":"https://doi.org/10.48550/arxiv.2604.17182"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.17182","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.17182","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.17182","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134100327","display_name":"Shun-ichiro Hayashi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hayashi, Shun-ichiro","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035972892","display_name":"Daichi Mukunoki","orcid":"https://orcid.org/0000-0002-0051-6811"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mukunoki, Daichi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134155857","display_name":"Tetsuya Hoshino","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hoshino, Tetsuya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5078063020","display_name":"Takahiro Katagiri","orcid":"https://orcid.org/0000-0001-7193-9304"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Katagiri, Takahiro","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.5178999900817871,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.5178999900817871,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.11159999668598175,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.10999999940395355,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/jaccard-index","display_name":"Jaccard index","score":0.7897999882698059},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.5238000154495239},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5209000110626221},{"id":"https://openalex.org/keywords/routing","display_name":"Routing (electronic design automation)","score":0.513700008392334},{"id":"https://openalex.org/keywords/trie","display_name":"Trie","score":0.4747999906539917},{"id":"https://openalex.org/keywords/prefix","display_name":"Prefix","score":0.4171999990940094},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.41200000047683716},{"id":"https://openalex.org/keywords/barcode","display_name":"Barcode","score":0.3621000051498413},{"id":"https://openalex.org/keywords/decomposition","display_name":"Decomposition","score":0.35850000381469727}],"concepts":[{"id":"https://openalex.org/C203519979","wikidata":"https://www.wikidata.org/wiki/Q865360","display_name":"Jaccard index","level":3,"score":0.7897999882698059},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6442999839782715},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.5238000154495239},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5209000110626221},{"id":"https://openalex.org/C74172769","wikidata":"https://www.wikidata.org/wiki/Q1446839","display_name":"Routing (electronic design automation)","level":2,"score":0.513700008392334},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4767000079154968},{"id":"https://openalex.org/C190290938","wikidata":"https://www.wikidata.org/wiki/Q387015","display_name":"Trie","level":3,"score":0.4747999906539917},{"id":"https://openalex.org/C141603448","wikidata":"https://www.wikidata.org/wiki/Q134830","display_name":"Prefix","level":2,"score":0.4171999990940094},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.41200000047683716},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4016999900341034},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.37689998745918274},{"id":"https://openalex.org/C2776841711","wikidata":"https://www.wikidata.org/wiki/Q856","display_name":"Barcode","level":2,"score":0.3621000051498413},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.35850000381469727},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.35179999470710754},{"id":"https://openalex.org/C184896649","wikidata":"https://www.wikidata.org/wiki/Q290066","display_name":"Routing table","level":4,"score":0.3352000117301941},{"id":"https://openalex.org/C116738811","wikidata":"https://www.wikidata.org/wiki/Q608751","display_name":"Nearest neighbor search","level":2,"score":0.3310000002384186},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.31850001215934753},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3059000074863434},{"id":"https://openalex.org/C94240970","wikidata":"https://www.wikidata.org/wiki/Q733318","display_name":"Pastry","level":2,"score":0.29179999232292175},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2757999897003174},{"id":"https://openalex.org/C47434764","wikidata":"https://www.wikidata.org/wiki/Q1770035","display_name":"Dead code","level":5,"score":0.27250000834465027},{"id":"https://openalex.org/C193319292","wikidata":"https://www.wikidata.org/wiki/Q272172","display_name":"Hamming distance","level":2,"score":0.27059999108314514},{"id":"https://openalex.org/C151578736","wikidata":"https://www.wikidata.org/wiki/Q1251793","display_name":"Redundant code","level":4,"score":0.2685000002384186},{"id":"https://openalex.org/C45340560","wikidata":"https://www.wikidata.org/wiki/Q215382","display_name":"Disjoint sets","level":2,"score":0.2587999999523163},{"id":"https://openalex.org/C20079647","wikidata":"https://www.wikidata.org/wiki/Q1278039","display_name":"Prefix code","level":5,"score":0.251800000667572},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.250900000333786}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.17182","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.17182","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.17182","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.17182","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"In":[0,163],"LLM-based":[1],"code":[2,5,24,165,226],"generation,":[3,166],"multiple":[4],"candidates":[6],"are":[7,97],"often":[8],"generated":[9,105],"in":[10,19,146,155,173,194,224],"parallel":[11],"from":[12,69],"the":[13,37,80,106,147,156,174,207],"same":[14,107],"prompt":[15],"--":[16],"for":[17,92,220],"example,":[18],"best-of-N":[20],"sampling":[21],"or":[22],"multi-candidate":[23],"completion.":[25],"These":[26,204],"requests":[27],"can":[28],"share":[29],"KV":[30],"caches":[31],"through":[32,214],"a":[33,70,83,132,201],"common":[34],"prefix,":[35],"yet":[36],"extent":[38],"to":[39],"which":[40],"their":[41],"Mixture-of-Experts":[42],"(MoE)":[43],"expert":[44],"routing":[45,136],"overlaps,":[46],"and":[47,78,179,187,217],"how":[48],"this":[49],"overlap":[50],"varies":[51],"across":[52,141],"layers,":[53,143],"remains":[54,123],"insufficiently":[55],"understood.":[56],"We":[57,190],"study":[58],"Qwen3.5-35B-A3B-FP8":[59],"(256":[60],"routed":[61],"experts,":[62],"top-8)":[63],"by":[64],"performing":[65],"tree-search-based":[66],"branching":[67],"generation":[68],"shared":[71],"prefix":[72],"(851":[73],"completed":[74],"codes,":[75],"temperature":[76],"0.7)":[77],"analyzing":[79],"results":[81,205],"with":[82,119],"compiler-output-based":[84],"alignment":[85],"(gcc":[86],"-S":[87],"-O0":[88],"assembly)":[89],"that":[90,192],"controls":[91],"token-identity":[93],"confounds.":[94],"Our":[95],"findings":[96],"threefold:":[98],"(1)":[99],"At":[100],"positions":[101,118],"where":[102],"both":[103],"sequences":[104],"token,":[108],"Jaccard":[109],"similarity":[110,137,140,153],"reaches":[111],"0.649":[112],"(40x":[113],"random),":[114],"while":[115,151],"even":[116],"at":[117,159],"different":[120],"tokens":[121],"it":[122],"0.175":[124],"(11x":[125],"random).":[126],"(2)":[127],"A":[128],"layer-wise":[129,215],"decomposition":[130,216],"reveals":[131],"crossing":[133],"pattern:":[134],"same-token":[135],"exceeds":[138],"different-token":[139,152],"all":[142],"but":[144],"dips":[145],"middle":[148,157],"layers":[149,158],"(L14-20),":[150],"peaks":[154],"14x":[160],"random.":[161],"(3)":[162],"tree-search":[164],"67%":[167],"of":[168,181,185,211],"successfully":[169],"compiled":[170],"codes":[171],"concentrate":[172],"top":[175],"three":[176],"assembly-equivalent":[177],"groups,":[178],"99.6%":[180],"within-group":[182],"differences":[183],"consist":[184],"comments":[186],"blank":[188],"lines.":[189],"show":[191],"diversity":[193],"top-P":[195],"search,":[196,199],"including":[197],"beam":[198],"poses":[200],"significant":[202],"challenge.":[203],"refine":[206],"\"context-independent":[208],"routing\"":[209],"claim":[210],"prior":[212],"work":[213],"suggest":[218],"opportunities":[219],"improving":[221],"search":[222],"efficiency":[223],"LLM":[225],"generation.":[227]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-22T00:00:00"}
