{"id":"https://openalex.org/W7125212438","doi":"https://doi.org/10.48550/arxiv.2601.13580","title":"Neural Organ Transplantation (NOT): Checkpoint-Based Modular Adaptation for Transformer Models","display_name":"Neural Organ Transplantation (NOT): Checkpoint-Based Modular Adaptation for Transformer Models","publication_year":2026,"publication_date":"2026-01-20","ids":{"openalex":"https://openalex.org/W7125212438","doi":"https://doi.org/10.48550/arxiv.2601.13580"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.13580","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.13580","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.13580","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123485125","display_name":"Ahmad Al-Zuraiqi","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Al-Zuraiqi, Ahmad","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5123485125"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.20059999823570251,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.20059999823570251,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.13420000672340393,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.05999999865889549,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.767300009727478},{"id":"https://openalex.org/keywords/modular-design","display_name":"Modular design","score":0.767300009727478},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6298999786376953},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6298999786376953},{"id":"https://openalex.org/keywords/transplantation","display_name":"Transplantation","score":0.48249998688697815},{"id":"https://openalex.org/keywords/transplantation","display_name":"Transplantation","score":0.48249998688697815},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.43869999051094055},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.43869999051094055}],"concepts":[{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.767300009727478},{"id":"https://openalex.org/C101468663","wikidata":"https://www.wikidata.org/wiki/Q1620158","display_name":"Modular design","level":2,"score":0.767300009727478},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6444000005722046},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6444000005722046},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6298999786376953},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6298999786376953},{"id":"https://openalex.org/C2911091166","wikidata":"https://www.wikidata.org/wiki/Q106419912","display_name":"Transplantation","level":2,"score":0.48249998688697815},{"id":"https://openalex.org/C2911091166","wikidata":"https://www.wikidata.org/wiki/Q106419912","display_name":"Transplantation","level":2,"score":0.48249998688697815},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45080000162124634},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45080000162124634},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.43869999051094055},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.43869999051094055},{"id":"https://openalex.org/C100279451","wikidata":"https://www.wikidata.org/wiki/Q372193","display_name":"Perplexity","level":3,"score":0.3783999979496002},{"id":"https://openalex.org/C100279451","wikidata":"https://www.wikidata.org/wiki/Q372193","display_name":"Perplexity","level":3,"score":0.3783999979496002},{"id":"https://openalex.org/C2781121602","wikidata":"https://www.wikidata.org/wiki/Q3504403","display_name":"Modular neural network","level":4,"score":0.3393999934196472},{"id":"https://openalex.org/C2781121602","wikidata":"https://www.wikidata.org/wiki/Q3504403","display_name":"Modular neural network","level":4,"score":0.3393999934196472},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.3199999928474426},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.3199999928474426},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.2930999994277954},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.2930999994277954},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.28999999165534973},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.28999999165534973},{"id":"https://openalex.org/C190839683","wikidata":"https://www.wikidata.org/wiki/Q2448197","display_name":"Train","level":2,"score":0.27410000562667847},{"id":"https://openalex.org/C190839683","wikidata":"https://www.wikidata.org/wiki/Q2448197","display_name":"Train","level":2,"score":0.27410000562667847},{"id":"https://openalex.org/C3019816032","wikidata":"https://www.wikidata.org/wiki/Q2575340","display_name":"Cancer treatment","level":3,"score":0.26820001006126404},{"id":"https://openalex.org/C3019816032","wikidata":"https://www.wikidata.org/wiki/Q2575340","display_name":"Cancer treatment","level":3,"score":0.26820001006126404},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.25679999589920044},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.25679999589920044}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.13580","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.13580","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.13580","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.13580","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,159],"introduce":[1],"Neural":[2],"Organ":[3],"Transplantation":[4],"(NOT),":[5],"a":[6],"modular":[7,147],"adaptation":[8,102],"framework":[9],"that":[10,28,63,96,140,161],"enables":[11],"trained":[12,31],"transformer":[13,83,141],"layers":[14,143],"to":[15,33,73,87,167],"function":[16],"as":[17,59],"reusable":[18],"transferable":[19],"checkpoints":[20],"for":[21,149],"domain":[22],"adaptation.":[23],"Unlike":[24],"conventional":[25],"fine-tuning":[26],"approaches":[27],"tightly":[29],"couple":[30],"parameters":[32,89],"specific":[34],"model":[35],"instances":[36],"and":[37,56,92],"training":[38,76,113],"data,":[39,55],"NOT":[40],"extracts":[41],"contiguous":[42],"layer":[43],"subsets":[44],"(\"donor":[45],"organs\")":[46],"from":[47],"pre-trained":[48],"models,":[49],"trains":[50],"them":[51,58],"independently":[52],"on":[53,80,172],"domain-specific":[54],"saves":[57],"standalone":[60],"checkpoint":[61,157],"files":[62],"can":[64,144],"be":[65],"transplanted":[66],"into":[67],"compatible":[68],"recipient":[69],"models":[70],"without":[71],"access":[72],"the":[74],"original":[75],"data.":[77],"Through":[78],"experiments":[79,171],"three":[81],"decoder-only":[82,150,168],"architectures":[84,174],"spanning":[85],"124M":[86],"20B":[88],"(GPT-2,":[90],"TinyLlama,":[91],"GPT-OSS),":[93],"we":[94],"demonstrate":[95,139],"donor":[97],"transplantation":[98],"substantially":[99],"outperforms":[100],"existing":[101],"methods,":[103],"achieving":[104],"an":[105],"order-of-magnitude":[106],"improvement":[107],"in":[108],"perplexity":[109],"over":[110],"LoRA":[111],"while":[112],"significantly":[114],"faster.":[115],"The":[116],"method":[117],"exhibits":[118],"position":[119],"dependence,":[120],"with":[121],"early":[122],"insertion":[123],"positions":[124],"yielding":[125],"optimal":[126],"results.":[127],"Cross-domain":[128],"transfer":[129,148],"at":[130],"billion-parameter":[131],"scale":[132],"reveals":[133],"unexpected":[134],"regularization":[135],"benefits.":[136],"These":[137],"findings":[138],"middle":[142],"support":[145],"efficient":[146],"architectures,":[151],"enabling":[152],"privacy-preserving":[153],"expertise":[154],"sharing":[155],"through":[156],"distribution.":[158],"note":[160],"this":[162],"approach":[163],"is":[164],"currently":[165],"limited":[166],"models;":[169],"preliminary":[170],"encoder-based":[173],"show":[175],"reduced":[176],"effectiveness.":[177]},"counts_by_year":[],"updated_date":"2026-01-22T23:33:04.759266","created_date":"2026-01-22T00:00:00"}
