{"id":"https://openalex.org/W7128769685","doi":"https://doi.org/10.48550/arxiv.2602.11171","title":"Efficient Hyper-Parameter Search for LoRA via Language-aided Bayesian Optimization","display_name":"Efficient Hyper-Parameter Search for LoRA via Language-aided Bayesian Optimization","publication_year":2026,"publication_date":"2026-01-19","ids":{"openalex":"https://openalex.org/W7128769685","doi":"https://doi.org/10.48550/arxiv.2602.11171"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.11171","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007364455","display_name":"Baek Seong-Eun","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Seong-Eun, Baek","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120058664","display_name":"Lee Jung-Mok","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jung-Mok, Lee","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125906716","display_name":"Kim Sung-Bin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sung-Bin, Kim","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125931784","display_name":"Tae-Hyun Oh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oh, Tae-Hyun","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5007364455"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.42719998955726624,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.42719998955726624,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.051600001752376556,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.0494999997317791,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hyperparameter","display_name":"Hyperparameter","score":0.9180999994277954},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7178999781608582},{"id":"https://openalex.org/keywords/domain-knowledge","display_name":"Domain knowledge","score":0.53329998254776},{"id":"https://openalex.org/keywords/personalization","display_name":"Personalization","score":0.4659000039100647},{"id":"https://openalex.org/keywords/hyperparameter-optimization","display_name":"Hyperparameter optimization","score":0.4586000144481659},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4546000063419342},{"id":"https://openalex.org/keywords/bayesian-optimization","display_name":"Bayesian optimization","score":0.45260000228881836},{"id":"https://openalex.org/keywords/proxy","display_name":"Proxy (statistics)","score":0.4519999921321869}],"concepts":[{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.9180999994277954},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7580999732017517},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7178999781608582},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6353999972343445},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.53329998254776},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5105999708175659},{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.4659000039100647},{"id":"https://openalex.org/C10485038","wikidata":"https://www.wikidata.org/wiki/Q48996162","display_name":"Hyperparameter optimization","level":3,"score":0.4586000144481659},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4546000063419342},{"id":"https://openalex.org/C2778049539","wikidata":"https://www.wikidata.org/wiki/Q17002908","display_name":"Bayesian optimization","level":2,"score":0.45260000228881836},{"id":"https://openalex.org/C2780148112","wikidata":"https://www.wikidata.org/wiki/Q1432581","display_name":"Proxy (statistics)","level":2,"score":0.4519999921321869},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.43689998984336853},{"id":"https://openalex.org/C2780615836","wikidata":"https://www.wikidata.org/wiki/Q2471869","display_name":"USable","level":2,"score":0.39010000228881836},{"id":"https://openalex.org/C2776434776","wikidata":"https://www.wikidata.org/wiki/Q19246213","display_name":"Domain adaptation","level":3,"score":0.3804999887943268},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.3741999864578247},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.34360000491142273},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.34040001034736633},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33340001106262207},{"id":"https://openalex.org/C33724603","wikidata":"https://www.wikidata.org/wiki/Q812540","display_name":"Bayesian network","level":2,"score":0.33079999685287476},{"id":"https://openalex.org/C37381756","wikidata":"https://www.wikidata.org/wiki/Q20203288","display_name":"Representativeness heuristic","level":2,"score":0.32179999351501465},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.3156000077724457},{"id":"https://openalex.org/C202269582","wikidata":"https://www.wikidata.org/wiki/Q2644277","display_name":"Complementarity (molecular biology)","level":2,"score":0.30790001153945923},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.2994000017642975},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.28780001401901245}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.11171","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.11171","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.11171","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.11171","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","score":0.44266369938850403,"display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Fine-tuning":[0],"Large":[1],"Language":[2],"Models":[3],"(LLMs)":[4],"with":[5,95,158,202,220],"Low-Rank":[6],"Adaptation":[7],"(LoRA)":[8],"enables":[9],"resource-efficient":[10],"personalization":[11],"or":[12],"specialization,":[13],"but":[14],"it":[15,29],"comes":[16],"at":[17],"the":[18,34,57,75,89,108,121,138,146,156,175,178,182,209],"expense":[19],"of":[20,36,60,78,177,211],"additional":[21,160],"hyperparameter":[22,40,218],"tuning.":[23],"Although":[24],"LoRA":[25,71,136,193],"makes":[26],"fine-tuning":[27],"efficient,":[28],"is":[30,42,102,150],"highly":[31],"sensitive":[32],"to":[33,67,87,152,166],"choice":[35],"hyperparameters,":[37],"and":[38,91,106,125,188,200],"exhaustive":[39],"search":[41,69],"still":[43],"computationally":[44],"very":[45],"demanding.":[46],"To":[47,73],"address":[48],"these":[49],"challenges,":[50],"we":[51,80,114,130,144,196],"propose":[52],"a":[53,84,96,116,203],"framework":[54],"that":[55,149,216],"integrates":[56],"domain":[58,93,133],"knowledge":[59,77,94,134],"pre-trained":[61],"LLMs":[62,82],"into":[63,137],"Bayesian":[64],"Optimization":[65],"(BO)":[66],"efficiently":[68],"for":[70],"hyperparameters.":[72,170],"leverage":[74],"informed":[76],"LLMs,":[79],"repurpose":[81],"as":[83],"discrete-to-continuous":[85],"mapping":[86,109],"link":[88],"hyperparameters":[90,124,233],"their":[92,126],"continuous":[97],"vector":[98],"space,":[99],"where":[100,113],"BO":[101,165],"conducted.":[103],"We":[104,214],"design":[105],"control":[107],"by":[110,173],"language":[111],"prompting,":[112],"provide":[115],"domain-aware":[117],"textual":[118],"prompt":[119,157],"describing":[120],"relationships":[122],"among":[123],"respective":[127,183],"roles;":[128],"thereby,":[129],"explicitly":[131],"inject":[132],"about":[135,222,236],"LLM":[139],"in":[140,155,192],"natural":[141],"language.":[142],"Also,":[143],"model":[145],"residual":[147],"information":[148],"hard":[151],"linguistically":[153],"describe":[154],"an":[159],"learnable":[161],"token.":[162],"This":[163,206],"aids":[164],"sample":[167],"more":[168,226],"high-performing":[169],"In":[171],"addition,":[172],"leveraging":[174],"observation":[176],"strong":[179],"correlation":[180],"between":[181],"performance":[184,229],"obtained":[185],"from":[186,235],"full":[187],"subset":[189],"training":[190,194,199],"datasets":[191],"regimes,":[195],"introduce":[197],"proxy":[198],"evaluation":[201],"data":[204],"subset.":[205],"further":[207],"increases":[208],"efficiency":[210],"our":[212,217],"method.":[213],"demonstrate":[215],"found":[219,234],"only":[221],"30":[223],"iterations":[224],"achieves":[225],"than":[227],"20%":[228],"improvement":[230],"over":[231],"standard":[232],"45,000":[237],"combinations.":[238]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-14T00:00:00"}
