{"id":"https://openalex.org/W7125367450","doi":"https://doi.org/10.48550/arxiv.2601.14532","title":"Search over Self-Edit Strategies for LLM Adaptation","display_name":"Search over Self-Edit Strategies for LLM Adaptation","publication_year":2026,"publication_date":"2026-01-20","ids":{"openalex":"https://openalex.org/W7125367450","doi":"https://doi.org/10.48550/arxiv.2601.14532"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.14532","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.14532","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.14532","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048864148","display_name":"Alistair Cheong","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Cheong, Alistair","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123616644","display_name":"Haolin Cong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cong, Haolin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123595759","display_name":"Tyler Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Tyler","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5113048692","display_name":"Dustin Miao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Miao, Dustin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5048864148"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.12610000371932983,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.12610000371932983,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.09279999881982803,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.08789999783039093,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6725000143051147},{"id":"https://openalex.org/keywords/novelty","display_name":"Novelty","score":0.5896000266075134},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.49810001254081726},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.46389999985694885},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.444599986076355},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.3495999872684479},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.3395000100135803}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7307000160217285},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6725000143051147},{"id":"https://openalex.org/C2778738651","wikidata":"https://www.wikidata.org/wiki/Q16546687","display_name":"Novelty","level":2,"score":0.5896000266075134},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5491999983787537},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5472000241279602},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.49810001254081726},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.46389999985694885},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.444599986076355},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.3495999872684479},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.3395000100135803},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.32989999651908875},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3224000036716461},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.30660000443458557},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.30640000104904175},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.28029999136924744},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.26030001044273376},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.25099998712539673},{"id":"https://openalex.org/C17020691","wikidata":"https://www.wikidata.org/wiki/Q139677","display_name":"Operator (biology)","level":5,"score":0.25060001015663147}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.14532","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.14532","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.14532","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.14532","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.7101063132286072}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Many":[0],"LLM-based":[1],"open-ended":[2],"search":[3],"systems":[4],"freeze":[5],"the":[6,25,33,64,77,87,100,119,167,173,178,185,198],"foundation":[7],"model":[8,27,88,120],"that":[9,202,217],"proposes":[10],"improvements":[11],"to":[12,51,80,121,172,224],"existing":[13],"solutions,":[14],"which":[15],"may":[16,221],"bottleneck":[17],"long-run":[18],"progress.":[19],"Recent":[20],"work":[21],"has":[22],"explored":[23],"updating":[24],"proposal":[26],"at":[28,236],"test":[29],"time":[30],"[arXiv:2511.23473],":[31],"but":[32,211],"update":[34,56,78],"strategy":[35],"is":[36,69,234],"still":[37],"typically":[38],"hand-specified.":[39],"Therefore,":[40],"this":[41],"study":[42],"investigated":[43],"whether":[44,144],"an":[45],"LLM":[46],"can":[47,206,212],"use":[48],"task":[49],"feedback":[50],"decide":[52],"how":[53],"it":[54,129],"should":[55],"its":[57,92,112,123,133],"weights.":[58],"For":[59],"tractability,":[60],"we":[61,110],"focused":[62],"on":[63,149,164],"simpler":[65],"case":[66],"where":[67],"there":[68],"only":[70],"one":[71],"round":[72],"of":[73,153,195],"self-improvement,":[74],"and":[75,95,117,136,183],"restricted":[76],"operator":[79],"self-supervised":[81],"next":[82],"token":[83],"prediction":[84],"(NTP),":[85],"leaving":[86],"freedom":[89],"in":[90,143,197],"choosing":[91],"training":[93,134],"data":[94,135],"key":[96],"NTP":[97],"hyperparameters.":[98,137],"Using":[99],"Self-Adapting":[101],"Language":[102],"Models":[103],"(SEAL)":[104],"[arXiv:2506.10943]":[105],"framework":[106],"as":[107],"a":[108,150,203],"testbed,":[109],"relaxed":[111],"fixed":[113],"human":[114,230],"template":[115,145],"constraint":[116],"allowed":[118],"generate":[122],"own":[124],"self-edit":[125],"templates,":[126],"thereby":[127],"giving":[128],"more":[130],"control":[131],"over":[132],"Two":[138],"variants":[139],"were":[140],"studied,":[141],"differing":[142],"generation":[146],"was":[147],"conditioned":[148],"lightweight":[151],"archive":[152,179,205],"past":[154],"templates.":[155],"In":[156],"SEAL's":[157],"Single-Passage":[158],"Knowledge":[159],"Incorporation":[160],"setting":[161],"with":[162],"Qwen3-8B":[163],"SQuAD":[165],"[arXiv:1606.05250],":[166],"no-archive":[168],"variant":[169,180],"performed":[170],"comparably":[171],"weaker":[174],"\"Implications\"":[175,182],"baseline,":[176],"while":[177],"outperformed":[181],"approached":[184],"strongest":[186],"human-designed":[187],"\"Rewrite\"":[188],"baseline":[189],"without":[190],"surpassing":[191],"it.":[192],"Further":[193],"analysis":[194],"collapse":[196],"model's":[199],"exploration":[200],"revealed":[201],"naive":[204],"confer":[207],"some":[208],"short-term":[209],"robustness":[210],"also":[213],"accelerate":[214],"homogenization,":[215],"suggesting":[216],"explicit":[218],"novelty":[219],"pressure":[220],"be":[222],"required":[223],"consistently":[225],"advance":[226],"beyond":[227],"carefully":[228],"optimized":[229],"strategies.":[231],"Our":[232],"code":[233],"available":[235],"https://github.com/cheongalc/search-self-edit-strategies":[237],".":[238]},"counts_by_year":[],"updated_date":"2026-01-23T23:24:52.574035","created_date":"2026-01-23T00:00:00"}
