{"id":"https://openalex.org/W7162556122","doi":"https://doi.org/10.48550/arxiv.2605.27276","title":"SIA: Self Improving AI with Harness &amp; Weight Updates","display_name":"SIA: Self Improving AI with Harness &amp; Weight Updates","publication_year":2026,"publication_date":"2026-05-26","ids":{"openalex":"https://openalex.org/W7162556122","doi":"https://doi.org/10.48550/arxiv.2605.27276"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.27276","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27276","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.27276","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120420815","display_name":"Prannay Hebbar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hebbar, Prannay","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137148666","display_name":"Yogendra Manawat","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Manawat, Yogendra","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119238073","display_name":"Samuel Verboomen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Verboomen, Samuel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022459043","display_name":"A. V. Ivanova","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ivanova, Alesia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047411992","display_name":"Selvam Palanimalai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Palanimalai, Selvam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137184481","display_name":"Kunal Bhatia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhatia, Kunal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137109895","display_name":"Vignesh Baskaran","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baskaran, Vignesh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.4162999987602234,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.4162999987602234,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.07479999959468842,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.05009999871253967,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.6876000165939331},{"id":"https://openalex.org/keywords/intuition","display_name":"Intuition","score":0.5077000260353088},{"id":"https://openalex.org/keywords/disjoint-sets","display_name":"Disjoint sets","score":0.4564000070095062},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4487000107765198},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4077000021934509},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.4043999910354614}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7384999990463257},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.6876000165939331},{"id":"https://openalex.org/C132010649","wikidata":"https://www.wikidata.org/wiki/Q189222","display_name":"Intuition","level":2,"score":0.5077000260353088},{"id":"https://openalex.org/C45340560","wikidata":"https://www.wikidata.org/wiki/Q215382","display_name":"Disjoint sets","level":2,"score":0.4564000070095062},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4487000107765198},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42089998722076416},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4077000021934509},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.4043999910354614},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.3732999861240387},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3684999942779541},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.28780001401901245},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2867000102996826},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.2768999934196472},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.26089999079704285},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.2587999999523163},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.2549000084400177},{"id":"https://openalex.org/C89429830","wikidata":"https://www.wikidata.org/wiki/Q735710","display_name":"Scaffold","level":2,"score":0.25270000100135803}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.27276","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27276","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.27276","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.27276","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.6037752628326416}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Humans":[0],"are":[1,18,74],"the":[2,10,13,56,71,87,95,121,124,188,201],"bottleneck":[3],"in":[4,104,112],"building":[5],"and":[6,12,21,67,123,144,178,195],"improving":[7],"AI.":[8],"Both":[9],"models":[11],"agents":[14],"that":[15,31,204],"wrap":[16],"them":[17],"written,":[19],"tuned,":[20],"corrected":[22],"by":[23],"people.":[24],"The":[25,49,77],"long-horizon":[26],"goal":[27],"of":[28,58,126],"an":[29],"AI":[30],"can":[32,209],"figure":[33],"out":[34],"how":[35,192],"to":[36,85],"improve":[37],"itself":[38],"remains":[39],"open.":[40],"Two":[41],"largely":[42],"disjoint":[43],"research":[44],"lines":[45],"attack":[46],"this":[47],"bottleneck.":[48],"harness-update":[50],"school":[51,80],"has":[52],"a":[53,59,109,114,127],"meta-agent":[54],"rewrite":[55],"scaffold":[57,152,208],"task-specific":[60,128],"agent":[61,116],"(its":[62],"tools,":[63],"prompts,":[64],"retry":[65],"logic,":[66],"search":[68],"procedure)":[69],"while":[70,94,197],"model":[72,189],"weights":[73,90,125],"held":[75,98],"fixed.":[76,99],"test-time":[78],"training":[79],"uses":[81],"hand-written":[82],"RL":[83],"pipelines":[84],"update":[86],"model's":[88],"own":[89],"on":[91,155,165,183],"task":[92],"feedback":[93],"harness":[96,122],"is":[97],"These":[100],"two":[101],"silos":[102],"operate":[103],"isolation.":[105],"We":[106,130],"propose":[107],"SIA,":[108],"self-improving":[110],"loop":[111],"which":[113],"language-model":[115],"(the":[117],"Feedback-Agent)":[118],"updates":[119,186,199],"both":[120,149],"agent.":[129],"evaluate":[131],"across":[132],"three":[133,157],"contrasting":[134],"domains:":[135],"Chinese":[136],"legal":[137],"charge":[138],"classification,":[139],"low-level":[140],"GPU":[141,169],"kernel":[142],"optimisation,":[143],"single-cell":[145],"RNA":[146],"denoising.":[147,184],"Combining":[148],"levers":[150],"outperforms":[151],"iteration":[153],"alone":[154],"all":[156],"benchmarks.":[158],"SIA-W+H":[159],"achieves":[160],"25.1%":[161],"over":[162,180],"prior":[163,172,181],"SOTA":[164,173,182],"LawBench,":[166],"12.4%":[167],"faster":[168],"kernels":[170],"than":[171],"(1,017":[174],"vs":[175],"1,161":[176],"\u03bcs),":[177],"20.4%":[179],"Harness":[185],"make":[187],"agentic,":[190],"shaping":[191],"it":[193],"searches":[194],"acts,":[196],"weight":[198],"build":[200],"domain":[202],"intuition":[203],"no":[205],"prompt":[206],"or":[207],"instil.":[210]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-28T00:00:00"}
