{"id":"https://openalex.org/W7127928381","doi":"https://doi.org/10.48550/arxiv.2602.05988","title":"Layer-wise LoRA fine-tuning: a similarity metric approach","display_name":"Layer-wise LoRA fine-tuning: a similarity metric approach","publication_year":2026,"publication_date":"2026-02-05","ids":{"openalex":"https://openalex.org/W7127928381","doi":"https://doi.org/10.48550/arxiv.2602.05988"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.05988","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125237717","display_name":"Keith Ando Ogawa","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ogawa, Keith Ando","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070659570","display_name":"Bruno Lopes Yamamoto","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yamamoto, Bruno Lopes","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125219918","display_name":"Lucas Lauton de Alcantara","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"de Alcantara, Lucas Lauton","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125242107","display_name":"Lucas Pellicer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pellicer, Lucas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125212138","display_name":"Rosimeire Pereira Costa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Costa, Rosimeire Pereira","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085487887","display_name":"Edson Bollis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bollis, Edson","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069264027","display_name":"Anna Helena Reali Costa","orcid":"https://orcid.org/0000-0001-7309-4528"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Costa, Anna Helena Reali","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5112859940","display_name":"Artur Jord\u00e3o","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jordao, Artur","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5125237717"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2442999929189682,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2442999929189682,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.10100000351667404,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.07479999959468842,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.5666999816894531},{"id":"https://openalex.org/keywords/performance-metric","display_name":"Performance metric","score":0.524399995803833},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5238000154495239},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.510200023651123},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.47110000252723694},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.45489999651908875},{"id":"https://openalex.org/keywords/performance-prediction","display_name":"Performance prediction","score":0.41200000047683716},{"id":"https://openalex.org/keywords/predictive-modelling","display_name":"Predictive modelling","score":0.40209999680519104},{"id":"https://openalex.org/keywords/performance-improvement","display_name":"Performance improvement","score":0.36730000376701355}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7303000092506409},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.5666999816894531},{"id":"https://openalex.org/C2780898871","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Performance metric","level":2,"score":0.524399995803833},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5238000154495239},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.510200023651123},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.47110000252723694},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.45489999651908875},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4268999993801117},{"id":"https://openalex.org/C2777115002","wikidata":"https://www.wikidata.org/wiki/Q7168246","display_name":"Performance prediction","level":2,"score":0.41200000047683716},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4099999964237213},{"id":"https://openalex.org/C45804977","wikidata":"https://www.wikidata.org/wiki/Q7239673","display_name":"Predictive modelling","level":2,"score":0.40209999680519104},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.36730000376701355},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.35519999265670776},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3497999906539917},{"id":"https://openalex.org/C2779714256","wikidata":"https://www.wikidata.org/wiki/Q25305062","display_name":"Multiple Models","level":2,"score":0.33059999346733093},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.32589998841285706},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3142000138759613},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3025999963283539},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.29750001430511475},{"id":"https://openalex.org/C2779937294","wikidata":"https://www.wikidata.org/wiki/Q5513666","display_name":"GLUE","level":2,"score":0.29589998722076416},{"id":"https://openalex.org/C2781345722","wikidata":"https://www.wikidata.org/wiki/Q5308388","display_name":"Drop (telecommunication)","level":2,"score":0.29269999265670776},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.2903999984264374},{"id":"https://openalex.org/C2778061373","wikidata":"https://www.wikidata.org/wiki/Q1315146","display_name":"Predictive coding","level":3,"score":0.26190000772476196},{"id":"https://openalex.org/C2780091087","wikidata":"https://www.wikidata.org/wiki/Q3092131","display_name":"Dimensional reduction","level":2,"score":0.2612999975681305},{"id":"https://openalex.org/C76969082","wikidata":"https://www.wikidata.org/wiki/Q486902","display_name":"Mathematical model","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C56858530","wikidata":"https://www.wikidata.org/wiki/Q15947151","display_name":"Reduction strategy","level":2,"score":0.25119999051094055},{"id":"https://openalex.org/C174998907","wikidata":"https://www.wikidata.org/wiki/Q357662","display_name":"Work in process","level":2,"score":0.25060001015663147}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.05988","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.05988","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.05988","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.05988","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.4395022988319397,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Pre-training":[0],"Large":[1],"Language":[2],"Models":[3],"(LLMs)":[4],"on":[5,20,75,181,196,215],"web-scale":[6],"datasets":[7],"becomes":[8],"fundamental":[9],"for":[10,229],"advancing":[11],"general-purpose":[12],"AI.":[13],"In":[14,59,92],"contrast,":[15],"enhancing":[16],"their":[17,26,138],"predictive":[18,173,193,213],"performance":[19,174,194,214],"downstream":[21],"tasks":[22],"typically":[23],"involves":[24],"adapting":[25],"knowledge":[27],"through":[28],"fine-tuning.":[29],"Parameter-efficient":[30],"fine-tuning":[31,238],"techniques,":[32],"such":[33,79],"as":[34,85],"Low-Rank":[35],"Adaptation":[36],"(LoRA),":[37],"aim":[38],"to":[39,61,88,107,122,134,140,149,168,190,226,237],"reduce":[40,159],"the":[41,49,76,97,123,130,160,172,197,212],"computational":[42],"cost":[43],"of":[44,57],"this":[45,93,184,223],"process":[46],"by":[47,100,136,166],"freezing":[48],"pre-trained":[50],"model":[51,124],"and":[52,150,178,219],"updating":[53],"a":[54,80,104,191,205],"smaller":[55],"number":[56],"parameters.":[58],"comparison":[60],"full":[62],"fine-tuning,":[63],"these":[64],"methods":[65],"achieve":[66,204],"over":[67],"99\\%":[68],"reduction":[69,81,185],"in":[70,90,142,163,186,211,242],"trainable":[71,161,187],"parameter":[72],"count,":[73],"depending":[74],"configuration.":[77],"Unfortunately,":[78],"may":[82],"prove":[83],"insufficient":[84],"LLMs":[86],"continue":[87],"grow":[89],"scale.":[91],"work,":[94],"we":[95,128,203,231],"address":[96],"previous":[98],"problem":[99],"systematically":[101],"selecting":[102],"only":[103],"few":[105],"layers":[106,119,133],"fine-tune":[108,135],"using":[109],"LoRA":[110,240],"or":[111,208],"its":[112],"variants.":[113],"We":[114,158],"argue":[115],"that":[116],"not":[117],"all":[118,243],"contribute":[120],"equally":[121],"adaptation.":[125],"Leveraging":[126],"this,":[127],"identify":[129],"most":[131],"relevant":[132],"measuring":[137],"contribution":[139],"changes":[141],"internal":[143],"representations.":[144],"Our":[145],"method":[146],"is":[147,246],"orthogonal":[148],"readily":[151],"compatible":[152],"with":[153,239],"existing":[154],"low-rank":[155],"adaptation":[156],"techniques.":[157],"parameters":[162,188],"LoRA-based":[164],"techniques":[165],"up":[167],"50\\%,":[169],"while":[170],"maintaining":[171],"across":[175],"different":[176],"models":[177],"tasks.":[179,221],"Specifically,":[180],"encoder-only":[182],"architectures,":[183,202],"leads":[189],"negligible":[192],"drop":[195,207],"GLUE":[198],"benchmark.":[199],"On":[200],"decoder-only":[201],"small":[206],"even":[209],"improvements":[210],"mathematical":[216],"problem-solving":[217],"capabilities":[218],"coding":[220],"Finally,":[222],"effectiveness":[224],"extends":[225],"multimodal":[227],"models,":[228],"which":[230],"also":[232],"observe":[233],"competitive":[234],"results":[235],"relative":[236],"modules":[241],"layers.":[244],"Code":[245],"available":[247],"at:":[248],"https://github.com/c2d-usp/Layer-wise-LoRA-with-CKA":[249]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-07T00:00:00"}
