{"id":"https://openalex.org/W7161723433","doi":"https://doi.org/10.48550/arxiv.2605.16686","title":"Scalable Knowledge Editing for Mixture-of-Experts LLMs via Tensor-Structured Updates","display_name":"Scalable Knowledge Editing for Mixture-of-Experts LLMs via Tensor-Structured Updates","publication_year":2026,"publication_date":"2026-05-15","ids":{"openalex":"https://openalex.org/W7161723433","doi":"https://doi.org/10.48550/arxiv.2605.16686"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.16686","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.16686","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.16686","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136466265","display_name":"Roman Maksimov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Maksimov, Roman","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136501822","display_name":"Vladimir Aletov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aletov, Vladimir","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114403023","display_name":"Dmitry Bylinkin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bylinkin, Dmitry","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136465571","display_name":"Daniil Medyakov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Medyakov, Daniil","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5099097234","display_name":"Vladimir Solodkin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Solodkin, Vladimir","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136461994","display_name":"Aleksandr Beznosikov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Beznosikov, Aleksandr","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.32100000977516174,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.32100000977516174,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.1451999992132187,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.05790000036358833,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6435999870300293},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5087000131607056},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.4878999888896942},{"id":"https://openalex.org/keywords/image-editing","display_name":"Image editing","score":0.48030000925064087},{"id":"https://openalex.org/keywords/collaborative-editing","display_name":"Collaborative editing","score":0.4611000120639801},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.4424000084400177},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.383899986743927},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.3269999921321869}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.805400013923645},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6435999870300293},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5087000131607056},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.4878999888896942},{"id":"https://openalex.org/C2776674983","wikidata":"https://www.wikidata.org/wiki/Q545981","display_name":"Image editing","level":3,"score":0.48030000925064087},{"id":"https://openalex.org/C2780967703","wikidata":"https://www.wikidata.org/wiki/Q2571389","display_name":"Collaborative editing","level":2,"score":0.4611000120639801},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.4424000084400177},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.383899986743927},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35030001401901245},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.3269999921321869},{"id":"https://openalex.org/C132943942","wikidata":"https://www.wikidata.org/wiki/Q2562511","display_name":"Footprint","level":2,"score":0.323199987411499},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.32089999318122864},{"id":"https://openalex.org/C58328972","wikidata":"https://www.wikidata.org/wiki/Q184609","display_name":"Expert system","level":2,"score":0.3109999895095825},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.29280000925064087},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.29109999537467957},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.27480000257492065},{"id":"https://openalex.org/C74912251","wikidata":"https://www.wikidata.org/wiki/Q6815727","display_name":"Memory footprint","level":2,"score":0.27070000767707825},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.26669999957084656},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.2621999979019165},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.25690001249313354},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.25200000405311584},{"id":"https://openalex.org/C2778348673","wikidata":"https://www.wikidata.org/wiki/Q739302","display_name":"Production (economics)","level":2,"score":0.2517000138759613}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.16686","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.16686","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.16686","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.16686","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Knowledge":[0],"editing":[1,48,57,73,120,133,174],"(KE)":[2],"provides":[3],"a":[4,40,52,169],"lightweight":[5],"alternative":[6],"to":[7,70,87,103,137,140],"repeated":[8],"fine-tuning":[9],"of":[10,43,67,96,105,122],"LLMs.":[11,60],"However,":[12],"most":[13],"existing":[14],"KE":[15,128,160],"methods":[16],"target":[17],"dense":[18,166],"feed-forward":[19],"layers,":[20,167],"while":[21,130],"modern":[22,176],"LLMs":[23],"increasingly":[24],"adopt":[25],"Mixture-of-Experts":[26],"(MoE)":[27],"architectures":[28],"for":[29,55],"their":[30],"superior":[31],"memory":[32],"footprint":[33],"and":[34,81,109,145],"inference":[35],"efficiency.":[36],"This":[37],"mismatch":[38],"leaves":[39],"growing":[41],"class":[42],"production":[44],"models":[45],"without":[46],"principled":[47],"tools.":[49],"We":[50],"propose":[51],"MEMIT-like":[53],"framework":[54],"knowledge":[56,173],"in":[58,175],"MoE-based":[59],"Our":[61],"method":[62],"exploits":[63],"the":[64,72,77,83,92,119,126,132,141,146,151],"tensor":[65],"structure":[66],"MoE":[68],"layers":[69],"formulate":[71],"objective":[74],"faithfully":[75],"at":[76],"per":[78],"expert":[79,97],"level,":[80],"applies":[82],"Woodbury":[84,152],"matrix":[85,95],"identity":[86],"avoid":[88],"materializing":[89],"or":[90],"inverting":[91],"full":[93],"stacked":[94],"weights.":[98],"The":[99],"resulting":[100],"update":[101],"reduces":[102],"inversions":[104,148],"fixed":[106],"low-rank":[107],"matrices":[108],"requires":[110],"no":[111],"additional":[112],"backward":[113],"passes.":[114],"Empirically,":[115],"our":[116],"approach":[117],"matches":[118],"quality":[121],"strong":[123],"baselines":[124],"on":[125],"main":[127],"metrics":[129],"accelerating":[131],"procedure":[134],"by":[135,150],"up":[136],"6x,":[138],"owing":[139],"batched":[142],"MEMIT-style":[143],"formulation":[144],"low-dimensional":[147],"enabled":[149],"identity.":[153],"These":[154],"results":[155],"show":[156],"that":[157],"closed-form,":[158],"parameter-modifying":[159],"can":[161],"be":[162],"extended":[163],"efficiently":[164],"beyond":[165],"opening":[168],"path":[170],"toward":[171],"scalable":[172],"sparse":[177],"LLM":[178],"architectures.":[179]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-20T00:00:00"}
