{"id":"https://openalex.org/W7131064314","doi":"https://doi.org/10.48550/arxiv.2602.17809","title":"Calibrated Adaptation: Bayesian Stiefel Manifold Priors for Reliable Parameter-Efficient Fine-Tuning","display_name":"Calibrated Adaptation: Bayesian Stiefel Manifold Priors for Reliable Parameter-Efficient Fine-Tuning","publication_year":2026,"publication_date":"2026-02-19","ids":{"openalex":"https://openalex.org/W7131064314","doi":"https://doi.org/10.48550/arxiv.2602.17809"},"language":"en","primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.17809","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126617170","display_name":"Ibne Farabi Shihab","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Shihab, Ibne Farabi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119832027","display_name":"Sanjeda Akter","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Akter, Sanjeda","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126599946","display_name":"Anuj Sharma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sharma, Anuj","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5126617170"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.4350999891757965,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.4350999891757965,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2379000037908554,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.06599999964237213,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.7279999852180481},{"id":"https://openalex.org/keywords/stiefel-manifold","display_name":"Stiefel manifold","score":0.6868000030517578},{"id":"https://openalex.org/keywords/manifold","display_name":"Manifold (fluid mechanics)","score":0.5138000249862671},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.44449999928474426},{"id":"https://openalex.org/keywords/tangent-space","display_name":"Tangent space","score":0.4334000051021576},{"id":"https://openalex.org/keywords/orthogonality","display_name":"Orthogonality","score":0.4198000133037567},{"id":"https://openalex.org/keywords/bayesian-inference","display_name":"Bayesian inference","score":0.4036000072956085},{"id":"https://openalex.org/keywords/orthonormal-basis","display_name":"Orthonormal basis","score":0.39070001244544983},{"id":"https://openalex.org/keywords/geodesic","display_name":"Geodesic","score":0.385699987411499},{"id":"https://openalex.org/keywords/linear-subspace","display_name":"Linear subspace","score":0.37880000472068787}],"concepts":[{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.7279999852180481},{"id":"https://openalex.org/C612670","wikidata":"https://www.wikidata.org/wiki/Q7616373","display_name":"Stiefel manifold","level":2,"score":0.6868000030517578},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.5166000127792358},{"id":"https://openalex.org/C529865628","wikidata":"https://www.wikidata.org/wiki/Q1790740","display_name":"Manifold (fluid mechanics)","level":2,"score":0.5138000249862671},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5055000185966492},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.44449999928474426},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4406000077724457},{"id":"https://openalex.org/C157157409","wikidata":"https://www.wikidata.org/wiki/Q909601","display_name":"Tangent space","level":2,"score":0.4334000051021576},{"id":"https://openalex.org/C17137986","wikidata":"https://www.wikidata.org/wiki/Q215067","display_name":"Orthogonality","level":2,"score":0.4198000133037567},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.4036000072956085},{"id":"https://openalex.org/C5806529","wikidata":"https://www.wikidata.org/wiki/Q2365325","display_name":"Orthonormal basis","level":2,"score":0.39070001244544983},{"id":"https://openalex.org/C165818556","wikidata":"https://www.wikidata.org/wiki/Q213488","display_name":"Geodesic","level":2,"score":0.385699987411499},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3831999897956848},{"id":"https://openalex.org/C12362212","wikidata":"https://www.wikidata.org/wiki/Q728435","display_name":"Linear subspace","level":2,"score":0.37880000472068787},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.3686999976634979},{"id":"https://openalex.org/C32230216","wikidata":"https://www.wikidata.org/wiki/Q7882499","display_name":"Uncertainty quantification","level":2,"score":0.36730000376701355},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.3456000089645386},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.34360000491142273},{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.3402000069618225},{"id":"https://openalex.org/C153120616","wikidata":"https://www.wikidata.org/wiki/Q17068315","display_name":"Manifold alignment","level":4,"score":0.33730000257492065},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.3255999982357025},{"id":"https://openalex.org/C12773090","wikidata":"https://www.wikidata.org/wiki/Q3888851","display_name":"Ambient space","level":2,"score":0.3068000078201294},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.30320000648498535},{"id":"https://openalex.org/C2777634741","wikidata":"https://www.wikidata.org/wiki/Q768993","display_name":"Wasserstein metric","level":2,"score":0.296099990606308},{"id":"https://openalex.org/C149629883","wikidata":"https://www.wikidata.org/wiki/Q660926","display_name":"Fraction (chemistry)","level":2,"score":0.2727999985218048},{"id":"https://openalex.org/C92757383","wikidata":"https://www.wikidata.org/wiki/Q382497","display_name":"Affine transformation","level":2,"score":0.2660999894142151},{"id":"https://openalex.org/C57830394","wikidata":"https://www.wikidata.org/wiki/Q278079","display_name":"Posterior probability","level":3,"score":0.2648000121116638},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.259799987077713},{"id":"https://openalex.org/C207201462","wikidata":"https://www.wikidata.org/wiki/Q182505","display_name":"Bayes' theorem","level":3,"score":0.2597000002861023},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.2590999901294708},{"id":"https://openalex.org/C2777472644","wikidata":"https://www.wikidata.org/wiki/Q16968992","display_name":"Approximate inference","level":3,"score":0.2554999887943268},{"id":"https://openalex.org/C184720557","wikidata":"https://www.wikidata.org/wiki/Q7825049","display_name":"Topology (electrical circuits)","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.25110000371932983},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.250900000333786},{"id":"https://openalex.org/C151876577","wikidata":"https://www.wikidata.org/wiki/Q7049464","display_name":"Nonlinear dimensionality reduction","level":3,"score":0.2500999867916107}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.17809","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"pmh:oai:dr.lib.iastate.edu:20.500.12876/NveoOeOz","is_oa":false,"landing_page_url":"https://dr.lib.iastate.edu/handle/20.500.12876/NveoOeOz","pdf_url":null,"source":{"id":"https://openalex.org/S4377196104","display_name":"Iowa State University Digital Repository (Iowa State University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I173911158","host_organization_name":"Iowa State University","host_organization_lineage":["https://openalex.org/I173911158"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://doi.org/10.48550/arXiv.2602.17809","raw_type":"Preprint"},{"id":"doi:10.48550/arxiv.2602.17809","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.17809","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.17809","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Parameter-efficient":[0],"fine-tuning":[1],"methods":[2],"such":[3],"as":[4],"LoRA":[5,163,195],"enable":[6],"practical":[7],"adaptation":[8],"of":[9,193,203],"large":[10],"language":[11],"models":[12,196],"but":[13],"provide":[14],"no":[15],"principled":[16],"uncertainty":[17,102],"estimates,":[18],"leading":[19],"to":[20,162,173,184,228],"poorly":[21],"calibrated":[22,100],"predictions":[23],"and":[24,54,94,136,144,152,164,189],"unreliable":[25],"behavior":[26],"under":[27,186],"domain":[28,146,187],"shift.":[29],"We":[30,105],"introduce":[31],"Stiefel-Bayes":[32],"Adapters":[33],"(SBA),":[34],"a":[35,41,126,201],"Bayesian":[36,226],"PEFT":[37],"framework":[38],"that":[39,87,108,210],"places":[40],"Matrix":[42],"Langevin":[43],"prior":[44,78],"over":[45,175],"orthonormal":[46],"adapter":[47,88],"factors":[48],"on":[49,79,139,197,215],"the":[50,80,84,97,109,115,204,216],"Stiefel":[51],"manifold":[52,81,132],"$\\St$":[53],"performs":[55],"approximate":[56],"posterior":[57,98],"inference":[58],"via":[59],"tangent":[60,110],"space":[61,72,111],"Laplace":[62],"approximation":[63,112],"with":[64],"geodesic":[65],"retraction.":[66],"Unlike":[67],"Gaussian":[68],"priors":[69],"in":[70,120],"flat":[71],"projected":[73],"onto":[74],"orthogonality":[75],"constraints,":[76],"our":[77],"naturally":[82],"encodes":[83],"inductive":[85],"bias":[86],"subspaces":[89],"should":[90],"be":[91],"well":[92],"conditioned":[93],"orthogonal,":[95],"while":[96,166],"provides":[99],"predictive":[101],"without":[103],"recalibration.":[104],"prove":[106],"formally":[107],"strictly":[113],"avoids":[114],"structural":[116],"variance":[117],"inflation":[118],"inherent":[119],"projecting":[121],"from":[122],"ambient":[123],"space,":[124],"establishing":[125],"rigorous":[127],"theoretical":[128],"advantage":[129],"for":[130],"intrinsic":[131],"inference.":[133],"Across":[134],"GLUE":[135],"SuperGLUE":[137],"benchmarks":[138],"RoBERTa-large,":[140],"LLaMA-2-7B,":[141],"LLaMA-2-13B,":[142],"Mistral-7B,":[143],"Qwen2.5-7B,":[145],"shift":[147],"evaluations,":[148],"selective":[149,179],"prediction":[150,180],"protocols,":[151],"an":[153],"abstractive":[154],"summarization":[155],"task,":[156],"SBA":[157],"achieves":[158],"task":[159],"performance":[160],"comparable":[161],"DoRA":[165],"reducing":[167],"Expected":[168],"Calibration":[169],"Error":[170],"by":[171,182],"18":[172],"34\\%":[174],"deterministic":[176],"baselines,":[177],"improving":[178],"AUROC":[181],"12":[183],"25\\%":[185],"shift,":[188],"outperforming":[190],"deep":[191],"ensembles":[192],"five":[194],"OOD":[198],"detection":[199],"at":[200],"fraction":[202],"parameter":[205],"cost.":[206],"Our":[207],"results":[208],"demonstrate":[209],"where":[211],"you":[212],"place":[213],"uncertainty,":[214],"right":[217],"geometric":[218],"structure,":[219],"matters":[220],"more":[221],"than":[222],"simply":[223],"adding":[224],"any":[225],"treatment":[227],"adapters.":[229]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-24T00:00:00"}
