{"id":"https://openalex.org/W7117128325","doi":"https://doi.org/10.48550/arxiv.2512.19320","title":"MAGIC: Achieving Superior Model Merging via Magnitude Calibration","display_name":"MAGIC: Achieving Superior Model Merging via Magnitude Calibration","publication_year":2025,"publication_date":"2025-12-22","ids":{"openalex":"https://openalex.org/W7117128325","doi":"https://doi.org/10.48550/arxiv.2512.19320"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2512.19320","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.19320","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2512.19320","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5121223840","display_name":"Yayuan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Yayuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121171240","display_name":"Jian Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Jian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121182548","display_name":"Jintao Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Jintao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101329800","display_name":"Zihan Cheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng, Zihan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121234732","display_name":"Lei Qi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qi, Lei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103058012","display_name":"Yinghuan Shi","orcid":"https://orcid.org/0009-0008-0722-9744"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Yinghuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5121128691","display_name":"Yang Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Yang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5121223840"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.30630001425743103,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.30630001425743103,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.24310000240802765,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.12790000438690186,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/calibration","display_name":"Calibration","score":0.6528000235557556},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5979999899864197},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.5419999957084656},{"id":"https://openalex.org/keywords/merge","display_name":"Merge (version control)","score":0.5023999810218811},{"id":"https://openalex.org/keywords/magnitude","display_name":"Magnitude (astronomy)","score":0.4986000061035156},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.4805000126361847},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.47780001163482666},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.43070000410079956}],"concepts":[{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.6528000235557556},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6266999840736389},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5979999899864197},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.5419999957084656},{"id":"https://openalex.org/C197129107","wikidata":"https://www.wikidata.org/wiki/Q1921621","display_name":"Merge (version control)","level":2,"score":0.5023999810218811},{"id":"https://openalex.org/C126691448","wikidata":"https://www.wikidata.org/wiki/Q2028919","display_name":"Magnitude (astronomy)","level":2,"score":0.4986000061035156},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49380001425743103},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.4805000126361847},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.47909998893737793},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.47780001163482666},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.43070000410079956},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4187000095844269},{"id":"https://openalex.org/C73586568","wikidata":"https://www.wikidata.org/wiki/Q2600211","display_name":"Parameter space","level":2,"score":0.3734999895095825},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.3294999897480011},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.29919999837875366},{"id":"https://openalex.org/C2777704519","wikidata":"https://www.wikidata.org/wiki/Q45732","display_name":"MAGIC (telescope)","level":2,"score":0.2978000044822693},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.2935999929904938},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.2897999882698059},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.25940001010894775}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2512.19320","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.19320","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2512.19320","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.19320","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"proliferation":[1],"of":[2,12,24,42,55,69,87,168],"pre-trained":[3],"models":[4,27],"has":[5,78],"given":[6],"rise":[7],"to":[8,19,46,96,110,114,179],"a":[9,29,138,165],"wide":[10],"array":[11],"specialised,":[13],"fine-tuned":[14],"models.":[15],"Model":[16],"merging":[17,44,101],"aims":[18],"merge":[20],"the":[21,48,52,56,85,118,122,160,180],"distinct":[22],"capabilities":[23],"these":[25,188],"specialised":[26,57,123],"into":[28],"unified":[30],"model,":[31],"requiring":[32,184],"minimal":[33],"or":[34],"even":[35],"no":[36],"additional":[37,185,218],"training.":[38,219],"A":[39],"core":[40],"objective":[41],"model":[43,50,120],"is":[45,222],"ensure":[47],"merged":[49,119,161],"retains":[51],"behavioural":[53],"characteristics":[54],"models,":[58,124],"typically":[59],"achieved":[60],"through":[61],"feature":[62,115,146],"alignment.":[63],"We":[64],"identify":[65],"that":[66,141,197],"features":[67,163],"consist":[68],"two":[70],"critical":[71],"components:":[72],"direction":[73],"and":[74,106,147,211],"magnitude.":[75],"Prior":[76],"research":[77],"predominantly":[79],"focused":[80],"on":[81,208,215],"directional":[82],"alignment,":[83],"while":[84,171],"influence":[86],"magnitude":[88,111],"remains":[89],"largely":[90],"neglected,":[91],"despite":[92],"its":[93],"pronounced":[94],"vulnerability":[95],"perturbations":[97,109],"introduced":[98],"by":[99],"common":[100],"operations":[102],"(e.g.,":[103],"parameter":[104],"fusion":[105],"sparsification).":[107],"Such":[108],"inevitably":[112],"lead":[113],"deviations":[116],"in":[117,126,145],"from":[121],"resulting":[125],"subsequent":[127],"performance":[128,201],"degradation.":[129],"To":[130],"address":[131],"this,":[132],"we":[133],"propose":[134],"MAGnItude":[135],"Calibration":[136,157,174,192],"(MAGIC),":[137],"plug-and-play":[139],"framework":[140],"rectifies":[142],"layer-wise":[143],"magnitudes":[144],"weight":[148,181],"spaces,":[149],"with":[150],"three":[151],"variants.":[152],"Specifically,":[153],"our":[154],"Feature":[155],"Space":[156,173,191],"(FSC)":[158],"realigns":[159],"model's":[162],"using":[164],"small":[166],"set":[167],"unlabelled":[169],"data,":[170],"Weight":[172],"(WSC)":[175],"extends":[176],"this":[177],"calibration":[178],"space":[182],"without":[183,217],"data.":[186],"Combining":[187],"yields":[189],"Dual":[190],"(DSC).":[193],"Comprehensive":[194],"experiments":[195],"demonstrate":[196],"MAGIC":[198],"consistently":[199],"boosts":[200],"across":[202],"diverse":[203],"Computer":[204],"Vision":[205],"tasks":[206,213],"(+4.3%":[207],"eight":[209],"datasets)":[210],"NLP":[212],"(+8.0%":[214],"Llama)":[216],"Our":[220],"code":[221],"available":[223],"at:":[224],"https://github.com/lyymuwu/MAGIC":[225]},"counts_by_year":[],"updated_date":"2025-12-24T23:14:05.333182","created_date":"2025-12-24T00:00:00"}
