{"id":"https://openalex.org/W4415332922","doi":"https://doi.org/10.48550/arxiv.2506.14794","title":"Assembly of Experts: Linear-time construction of the Chimera LLM variants with emergent and adaptable behaviors","display_name":"Assembly of Experts: Linear-time construction of the Chimera LLM variants with emergent and adaptable behaviors","publication_year":2025,"publication_date":"2025-05-31","ids":{"openalex":"https://openalex.org/W4415332922","doi":"https://doi.org/10.48550/arxiv.2506.14794"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2506.14794","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2506.14794","pdf_url":"https://arxiv.org/pdf/2506.14794","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2506.14794","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054415619","display_name":"Henrik Klagges","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Klagges, Henrik","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062334835","display_name":"Robert Dahlke","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dahlke, Robert","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014371566","display_name":"Fabian Klemm","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Klemm, Fabian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083191946","display_name":"Benjamin Merkel","orcid":"https://orcid.org/0000-0002-8637-7655"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Merkel, Benjamin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120056989","display_name":"Daniel Klingmann","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Klingmann, Daniel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060347528","display_name":"David Reiss","orcid":"https://orcid.org/0000-0002-7701-0480"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Reiss, David A.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5035633645","display_name":"Dan Zecha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zecha, Dan","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5054415619"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.9574999809265137,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10551","display_name":"Scheduling and Optimization Algorithms","score":0.9362999796867371,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7113000154495239},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5084999799728394},{"id":"https://openalex.org/keywords/chimera","display_name":"Chimera (genetics)","score":0.38580000400543213},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.2524999976158142}],"concepts":[{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7113000154495239},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6025999784469604},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5084999799728394},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5015000104904175},{"id":"https://openalex.org/C30278631","wikidata":"https://www.wikidata.org/wiki/Q281721","display_name":"Chimera (genetics)","level":3,"score":0.38580000400543213},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3837999999523163},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35269999504089355},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2542000114917755},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.2524999976158142},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.24639999866485596}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2506.14794","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2506.14794","pdf_url":"https://arxiv.org/pdf/2506.14794","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2506.14794","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2506.14794","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2506.14794","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2506.14794","pdf_url":"https://arxiv.org/pdf/2506.14794","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Requiring":[0],"$10^{13}$-$10^{15}$":[1],"FLOPs":[2],"to":[3,38,58,159,176],"calculate":[4],"one":[5],"8":[6],"bit":[7],"weight":[8,52],"in":[9,48],"an":[10],"LLM":[11],"during":[12],"pretraining":[13],"is":[14,102],"extremely":[15],"expensive":[16],"and":[17,104,127],"seems":[18],"inefficient.":[19],"To":[20],"better":[21],"leverage":[22],"the":[23,32,65,68,74,82,109,115,135,148,168],"huge":[24],"investments":[25],"made":[26],"into":[27],"pretrained":[28],"models,":[29,76],"we":[30,77],"develop":[31],"new":[33],"\"Assembly-of-Experts\"":[34],"(AoE)":[35],"construction":[36],"method":[37],"create":[39],"capable":[40],"child":[41,84,132],"variants":[42],"of":[43,64,70,81,139],"existing":[44],"Mixture-of-Experts":[45],"parent":[46,75,178],"models":[47],"linear":[49],"time.":[50],"Model":[51],"tensors":[53,138],"get":[54],"interpolated":[55],"individually,":[56],"allowing":[57],"enhance":[59],"or":[60,166],"suppress":[61],"semantic":[62],"features":[63],"parents.":[66],"Varying":[67],"proportion":[69],"weights":[71],"taken":[72],"from":[73],"observe":[78],"some":[79],"properties":[80],"AoE":[83],"model":[85,101,110,123,129],"changing":[86],"gradually,":[87],"while":[88],"other":[89],"behavioral":[90],"traits":[91],"emerge":[92],"with":[93],"a":[94,119],"sharp":[95],"transition.":[96],"Surprisingly,":[97],"nearly":[98],"every":[99],"generated":[100],"functional":[103],"capable,":[105],"which":[106],"makes":[107],"searching":[108],"space":[111],"straightforward.":[112],"We":[113],"construct":[114],"DeepSeek":[116],"R1T":[117],"\"Chimera\",":[118],"671B":[120],"open-weights":[121],"hybrid":[122],"combining":[124],"DeepSeek's":[125],"V3-0324":[126],"R1":[128],"variants.":[130],"The":[131],"inherits":[133],"only":[134],"routed":[136],"expert":[137],"R1,":[140],"but":[141],"still":[142],"achieves":[143],"about":[144,153],"R1-level":[145],"intelligence.":[146],"At":[147],"same":[149],"time,":[150],"it":[151],"uses":[152],"40\\%":[154],"fewer":[155],"output":[156],"tokens,":[157],"close":[158],"V3":[160],"speed.":[161],"Constructed":[162],"without":[163],"any":[164],"fine-tuning":[165],"distillation,":[167],"Chimera":[169],"exhibits":[170],"surprisingly":[171],"compact,":[172],"orderly":[173],"reasoning":[174],"compared":[175],"its":[177],"models.":[179]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-19T00:00:00"}
