{"id":"https://openalex.org/W7161550390","doi":"https://doi.org/10.48550/arxiv.2605.15221","title":"Effective Harness Engineering for Algorithm Discovery with Coding Agents","display_name":"Effective Harness Engineering for Algorithm Discovery with Coding Agents","publication_year":2026,"publication_date":"2026-05-13","ids":{"openalex":"https://openalex.org/W7161550390","doi":"https://doi.org/10.48550/arxiv.2605.15221"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.15221","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.15221","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.15221","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136427749","display_name":"Yoichi Ishibashi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ishibashi, Yoichi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112284263","display_name":"Taro Yano","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yano, Taro","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5044722101","display_name":"Masafumi Oyamada","orcid":"https://orcid.org/0000-0002-4045-7350"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oyamada, Masafumi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.21850000321865082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.21850000321865082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.09009999781847,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.06679999828338623,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.7882999777793884},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.5753999948501587},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.5680000185966492},{"id":"https://openalex.org/keywords/evolutionary-algorithm","display_name":"Evolutionary algorithm","score":0.4740999937057495},{"id":"https://openalex.org/keywords/algorithm-design","display_name":"Algorithm design","score":0.43619999289512634},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.35600000619888306},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.35199999809265137}],"concepts":[{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.7882999777793884},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7584999799728394},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.5753999948501587},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.5680000185966492},{"id":"https://openalex.org/C159149176","wikidata":"https://www.wikidata.org/wiki/Q14489129","display_name":"Evolutionary algorithm","level":2,"score":0.4740999937057495},{"id":"https://openalex.org/C106516650","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm design","level":2,"score":0.43619999289512634},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.39259999990463257},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.35600000619888306},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.35199999809265137},{"id":"https://openalex.org/C125583679","wikidata":"https://www.wikidata.org/wiki/Q755673","display_name":"Search algorithm","level":2,"score":0.33059999346733093},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.325300008058548},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.32280001044273376},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.31850001215934753},{"id":"https://openalex.org/C105902424","wikidata":"https://www.wikidata.org/wiki/Q1197129","display_name":"Evolutionary computation","level":2,"score":0.3127000033855438},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.29179999232292175},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.29170000553131104},{"id":"https://openalex.org/C2989134064","wikidata":"https://www.wikidata.org/wiki/Q288510","display_name":"Execution time","level":2,"score":0.27639999985694885},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.26420000195503235},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.26190000772476196},{"id":"https://openalex.org/C116709606","wikidata":"https://www.wikidata.org/wiki/Q1296251","display_name":"Algorithmic efficiency","level":3,"score":0.25850000977516174},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.25459998846054077}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.15221","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.15221","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.15221","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.15221","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","score":0.6474660634994507,"id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"AlphaEvolve":[0],"and":[1],"FunSearch":[2],"have":[3],"demonstrated":[4],"the":[5,34,37,41,75,84,119,140,150],"potential":[6],"of":[7,36,142,152],"combining":[8],"large":[9],"language":[10],"models":[11,158,171],"(LLMs)":[12],"with":[13,64,70],"evolutionary":[14,153],"search":[15],"for":[16],"automated":[17],"algorithm":[18,103],"discovery.":[19],"However,":[20],"discovery":[21,104],"success":[22],"is":[23,57,145],"shaped":[24],"not":[25],"only":[26],"by":[27,33],"model":[28],"capability":[29],"but":[30],"also":[31],"significantly":[32],"design":[35,48],"execution":[38],"infrastructure,":[39],"i.e.,":[40],"harness.":[42],"This":[43],"paper":[44],"investigates":[45],"effective":[46],"harness":[47,76,108],"through":[49],"three":[50],"questions:":[51],"under":[52,118],"a":[53],"fixed":[54],"token":[55,121],"budget,":[56],"it":[58],"better":[59],"to":[60],"produce":[61],"many":[62],"algorithms":[63,69,126],"brief":[65],"thought":[66],"or":[67],"fewer":[68,125],"deeper":[71],"thought?":[72],"How":[73],"should":[74],"handle":[77],"evaluation":[78,160],"hacks,":[79],"where":[80],"generated":[81],"programs":[82],"exploit":[83],"scoring":[85],"function?":[86],"And":[87],"how":[88],"can":[89],"agents":[90],"that":[91,106],"require":[92],"full":[93],"filesystem":[94],"access":[95],"execute":[96],"safely":[97],"in":[98],"parallel?":[99],"Using":[100],"Vesper,":[101],"an":[102],"framework":[105],"incorporates":[107],"improvements":[109],"addressing":[110],"these":[111],"questions,":[112],"we":[113],"evaluate":[114],"on":[115],"Circle":[116],"Packing":[117],"same":[120],"budget.":[122],"Interestingly,":[123],"generating":[124],"while":[127],"thinking":[128],"more":[129,146,156],"deeply":[130],"about":[131],"each":[132,143],"one":[133],"achieved":[134],"higher":[135,163],"scores.":[136],"That":[137],"is,":[138],"scaling":[139,149],"quality":[141],"individual":[144],"budget-efficient":[147],"than":[148],"number":[151],"generations.":[154],"Surprisingly,":[155],"capable":[157],"produced":[159],"hacks":[161],"at":[162],"rates,":[164],"making":[165],"hack":[166],"detection":[167],"increasingly":[168],"necessary":[169],"as":[170],"scale.":[172]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-05-19T00:00:00"}
