{"id":"https://openalex.org/W7161138927","doi":"https://doi.org/10.48550/arxiv.2605.13139","title":"SWE-Cycle: Benchmarking Code Agents across the Complete Issue Resolution Cycle","display_name":"SWE-Cycle: Benchmarking Code Agents across the Complete Issue Resolution Cycle","publication_year":2026,"publication_date":"2026-05-13","ids":{"openalex":"https://openalex.org/W7161138927","doi":"https://doi.org/10.48550/arxiv.2605.13139"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.13139","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.13139","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.13139","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136165523","display_name":"Hao Guan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guan, Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046118256","display_name":"Lingyue Fu","orcid":"https://orcid.org/0000-0002-7827-244X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fu, Lingyue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136119800","display_name":"Shao Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Shao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041011296","display_name":"Yaoming Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Yaoming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136140389","display_name":"Kangning Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Kangning","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136126014","display_name":"Lin Qiu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qiu, Lin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136160971","display_name":"Xunliang Cai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cai, Xunliang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136092148","display_name":"Xuezhi Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Xuezhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136125682","display_name":"Weiwen Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Weiwen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136124557","display_name":"Weinan Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Weinan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136111937","display_name":"Yong Yu","orcid":"https://orcid.org/0000-0002-9398-9000"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Yong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.5047000050544739,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.5047000050544739,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.2849000096321106,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10639","display_name":"Advanced Software Engineering Methodologies","score":0.06549999862909317,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.620199978351593},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.6061000227928162},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.5501999855041504},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5497999787330627},{"id":"https://openalex.org/keywords/static-program-analysis","display_name":"Static program analysis","score":0.5148000121116638},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4878999888896942},{"id":"https://openalex.org/keywords/static-analysis","display_name":"Static analysis","score":0.4848000109195709},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.462799996137619},{"id":"https://openalex.org/keywords/code-refactoring","display_name":"Code refactoring","score":0.3977000117301941}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7573000192642212},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.620199978351593},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.6061000227928162},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.5501999855041504},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5497999787330627},{"id":"https://openalex.org/C137287247","wikidata":"https://www.wikidata.org/wiki/Q1329550","display_name":"Static program analysis","level":4,"score":0.5148000121116638},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4878999888896942},{"id":"https://openalex.org/C97686452","wikidata":"https://www.wikidata.org/wiki/Q7604153","display_name":"Static analysis","level":2,"score":0.4848000109195709},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.462799996137619},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.427700012922287},{"id":"https://openalex.org/C152752567","wikidata":"https://www.wikidata.org/wiki/Q116877","display_name":"Code refactoring","level":3,"score":0.3977000117301941},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.391400009393692},{"id":"https://openalex.org/C63406617","wikidata":"https://www.wikidata.org/wiki/Q5266714","display_name":"Development testing","level":5,"score":0.33730000257492065},{"id":"https://openalex.org/C48002344","wikidata":"https://www.wikidata.org/wiki/Q2919644","display_name":"Verification and validation","level":2,"score":0.32499998807907104},{"id":"https://openalex.org/C63000827","wikidata":"https://www.wikidata.org/wiki/Q3080428","display_name":"Software portability","level":2,"score":0.32339999079704285},{"id":"https://openalex.org/C13687954","wikidata":"https://www.wikidata.org/wiki/Q4826847","display_name":"Autonomous agent","level":2,"score":0.31459999084472656},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.313400000333786},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.31220000982284546},{"id":"https://openalex.org/C2777561058","wikidata":"https://www.wikidata.org/wiki/Q2652119","display_name":"Program comprehension","level":4,"score":0.30660000443458557},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.30250000953674316},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.2863999903202057},{"id":"https://openalex.org/C76518257","wikidata":"https://www.wikidata.org/wiki/Q271680","display_name":"Software framework","level":5,"score":0.2800000011920929},{"id":"https://openalex.org/C1009929","wikidata":"https://www.wikidata.org/wiki/Q179550","display_name":"Software bug","level":3,"score":0.273499995470047},{"id":"https://openalex.org/C10272871","wikidata":"https://www.wikidata.org/wiki/Q929972","display_name":"Software inspection","level":5,"score":0.2718999981880188},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.26759999990463257},{"id":"https://openalex.org/C117447612","wikidata":"https://www.wikidata.org/wiki/Q1412670","display_name":"Software quality","level":4,"score":0.2644999921321869},{"id":"https://openalex.org/C33054407","wikidata":"https://www.wikidata.org/wiki/Q6504747","display_name":"Software verification","level":5,"score":0.26420000195503235},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.26420000195503235},{"id":"https://openalex.org/C149091818","wikidata":"https://www.wikidata.org/wiki/Q2429814","display_name":"Software system","level":3,"score":0.2628999948501587},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.26269999146461487},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.25780001282691956}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.13139","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.13139","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.13139","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.13139","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"As":[0],"autonomous":[1,35,184],"code":[2,60,105,130,167],"agents":[3,21,52,81,131],"move":[4],"toward":[5],"end-to-end":[6,70,181],"software":[7,185],"development,":[8],"evaluating":[9],"their":[10,26],"practical":[11],"autonomy":[12],"becomes":[13],"critical.":[14],"Current":[15],"benchmarks":[16],"hide":[17],"friction":[18],"by":[19,133],"testing":[20],"in":[22,85,147,161],"pre-configured":[23],"environments,":[24],"and":[25,62,118,165,171],"static":[27,104,126],"evaluation":[28,112],"pipelines":[29],"frequently":[30],"fail":[31],"when":[32,150],"parsing":[33],"fully":[34],"trajectories.":[36],"We":[37,128],"address":[38],"these":[39,95,138],"limitations":[40],"with":[41,107],"SWE-Cycle,":[42],"a":[43,86,144,174],"benchmark":[44],"of":[45,124,183],"489":[46],"rigorously":[47],"filtered":[48],"instances.":[49],"SWE-Cycle":[50,170],"evaluates":[51],"across":[53,137],"three":[54],"isolated":[55,153],"tasks,":[56],"including":[57],"environment":[58],"reconstruction,":[59],"implementation,":[61],"verification":[63],"test":[64],"generation,":[65],"as":[66,68],"well":[67],"an":[69],"FullCycle":[71,78,156],"task":[72,79],"that":[73],"integrates":[74],"all":[75],"three.":[76],"The":[77,141],"requires":[80],"to":[82,155],"work":[83],"autonomously":[84],"bare":[87],"repository":[88],"without":[89],"human":[90],"scaffolding.":[91],"To":[92],"reliably":[93],"assess":[94],"complex":[96],"execution":[97],"paths,":[98],"we":[99],"developed":[100],"SWE-Judge.":[101],"By":[102],"combining":[103],"review":[106],"dynamic":[108],"testing,":[109],"this":[110],"execution-capable":[111],"agent":[113],"accurately":[114,178],"verifies":[115],"functional":[116],"correctness":[117],"eliminates":[119],"the":[120,180],"systematic":[121],"measurement":[122],"errors":[123],"traditional":[125],"parsers.":[127],"evaluate":[129],"powered":[132],"six":[134],"state-of-the-art":[135],"LLMs":[136],"four":[139],"tasks.":[140],"results":[142],"reveal":[143],"sharp":[145],"drop":[146],"solve":[148],"rates":[149],"transitioning":[151],"from":[152],"tasks":[154],"execution,":[157],"exposing":[158],"critical":[159],"bottlenecks":[160],"handling":[162],"cross-phase":[163],"dependencies":[164],"maintaining":[166],"quality.":[168],"Together,":[169],"SWE-Judge":[172],"provide":[173],"comprehensive":[175],"framework":[176],"for":[177],"measuring":[179],"capabilities":[182],"agents.":[186]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-15T00:00:00"}
