{"id":"https://openalex.org/W7131884775","doi":"https://doi.org/10.48550/arxiv.2602.22518","title":"RepoMod-Bench: A Benchmark for Code Repository Modernization via Implementation-Agnostic Testing","display_name":"RepoMod-Bench: A Benchmark for Code Repository Modernization via Implementation-Agnostic Testing","publication_year":2026,"publication_date":"2026-02-26","ids":{"openalex":"https://openalex.org/W7131884775","doi":"https://doi.org/10.48550/arxiv.2602.22518"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.22518","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5127169438","display_name":"Xuefeng Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Li, Xuefeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056689829","display_name":"N. I. Ben-Israel","orcid":"https://orcid.org/0000-0002-9105-9395"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ben-Israel, Nir","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127183721","display_name":"Yotam Raz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Raz, Yotam","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127252842","display_name":"Belal Ahmed","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ahmed, Belal","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018307536","display_name":"Doron Serebro","orcid":"https://orcid.org/0009-0000-3941-5017"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Serebro, Doron","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5045093641","display_name":"Antoine Raux","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Raux, Antoine","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5127169438"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.3603000044822693,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.3603000044822693,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.17880000174045563,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.07999999821186066,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6790000200271606},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.6455000042915344},{"id":"https://openalex.org/keywords/test-suite","display_name":"Test suite","score":0.5336999893188477},{"id":"https://openalex.org/keywords/source-lines-of-code","display_name":"Source lines of code","score":0.4918000102043152},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.4505000114440918},{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.43459999561309814},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.43220001459121704},{"id":"https://openalex.org/keywords/ranging","display_name":"Ranging","score":0.3659999966621399},{"id":"https://openalex.org/keywords/equivalence","display_name":"Equivalence (formal languages)","score":0.36500000953674316}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.703499972820282},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6790000200271606},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.6455000042915344},{"id":"https://openalex.org/C151552104","wikidata":"https://www.wikidata.org/wiki/Q7705809","display_name":"Test suite","level":4,"score":0.5336999893188477},{"id":"https://openalex.org/C199519371","wikidata":"https://www.wikidata.org/wiki/Q942695","display_name":"Source lines of code","level":3,"score":0.4918000102043152},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.4505000114440918},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.44530001282691956},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.43459999561309814},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.43220001459121704},{"id":"https://openalex.org/C115051666","wikidata":"https://www.wikidata.org/wiki/Q6522493","display_name":"Ranging","level":2,"score":0.3659999966621399},{"id":"https://openalex.org/C2780069185","wikidata":"https://www.wikidata.org/wiki/Q7977945","display_name":"Equivalence (formal languages)","level":2,"score":0.36500000953674316},{"id":"https://openalex.org/C519991488","wikidata":"https://www.wikidata.org/wiki/Q28865","display_name":"Python (programming language)","level":2,"score":0.36250001192092896},{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.3522000014781952},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.35109999775886536},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.3443000018596649},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.3409000039100647},{"id":"https://openalex.org/C2781020372","wikidata":"https://www.wikidata.org/wiki/Q533093","display_name":"On the fly","level":2,"score":0.3237000107765198},{"id":"https://openalex.org/C53942775","wikidata":"https://www.wikidata.org/wiki/Q1211721","display_name":"Code coverage","level":3,"score":0.3222000002861023},{"id":"https://openalex.org/C148027188","wikidata":"https://www.wikidata.org/wiki/Q907375","display_name":"Unit testing","level":3,"score":0.32100000977516174},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.31690001487731934},{"id":"https://openalex.org/C128942645","wikidata":"https://www.wikidata.org/wiki/Q1568346","display_name":"Test case","level":3,"score":0.29750001430511475},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.296099990606308},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.29510000348091125},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.2858000099658966},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.28540000319480896},{"id":"https://openalex.org/C2777822670","wikidata":"https://www.wikidata.org/wiki/Q1120538","display_name":"Snippet","level":2,"score":0.27469998598098755},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.27309998869895935},{"id":"https://openalex.org/C2775941552","wikidata":"https://www.wikidata.org/wiki/Q25212305","display_name":"Isolation (microbiology)","level":2,"score":0.2632000148296356},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2572999894618988},{"id":"https://openalex.org/C106251023","wikidata":"https://www.wikidata.org/wiki/Q851989","display_name":"Porting","level":3,"score":0.2551000118255615},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.2540000081062317},{"id":"https://openalex.org/C3018397939","wikidata":"https://www.wikidata.org/wiki/Q3644502","display_name":"Open source","level":3,"score":0.2531999945640564}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.22518","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.22518","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.22518","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.22518","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0,119],"evolution":[1],"of":[2,32,108,124],"AI":[3],"coding":[4],"agents":[5,21,177],"has":[6],"shifted":[7],"the":[8,30,57,76],"frontier":[9],"from":[10,134,176,196],"simple":[11],"snippet":[12],"completion":[13],"to":[14,37,65,75,136,151,178,203],"autonomous":[15,214],"repository-level":[16,91],"engineering.":[17],"However,":[18],"evaluating":[19],"these":[20,83],"remains":[22,165,218],"ill-posed":[23],"in":[24],"general":[25],"code":[26,92,125,226],"repository":[27,131],"generation,":[28],"where":[29],"lack":[31],"deterministic":[33],"ground":[34,54],"truth":[35,55],"leads":[36],"ambiguous":[38],"metrics.":[39],"Code":[40],"modernization":[41,93,215],"via":[42],"automated":[43],"translation":[44],"offers":[45],"a":[46,52,87,106,188,219],"more":[47],"rigorous":[48],"alternative":[49],"by":[50,85],"providing":[51],"fixed":[53],"--":[56],"source":[58,156],"repository;":[59],"yet":[60],"existing":[61],"benchmarks":[62],"are":[63,227],"limited":[64],"small-scale":[66],"repositories":[67,111,141],"and":[68,127,157,169,225],"rely":[69],"on":[70,95,198,205],"language-specific":[71],"unit":[72],"tests":[73],"visible":[74],"agent,":[77],"allowing":[78],"test-driven":[79,180],"overfitting.":[80],"We":[81],"address":[82],"limitations":[84],"introducing":[86],"benchmarking":[88],"framework":[89,101],"for":[90],"built":[94],"an":[96,147],"implementation-agnostic":[97,148],"evaluation":[98],"paradigm.":[99],"This":[100,160],"is":[102],"instantiated":[103],"through":[104],"RepoMod-Bench:":[105],"benchmark":[107,120,224],"21":[109],"real-world":[110],"with":[112,130,142],"standardized":[113,143],"interfaces,":[114,144],"spanning":[115],"8":[116],"programming":[117],"languages.":[118],"contains":[121],"1.6M":[122],"lines":[123],"(LOC)":[126],"11,616":[128],"tests,":[129],"sizes":[132],"ranging":[133],"14":[135],"211K":[137],"LOC.":[138,209],"By":[139],"targeting":[140],"we":[145],"utilize":[146],"test":[149,174],"suite":[150],"verify":[152],"functional":[153],"equivalence":[154],"between":[155],"target":[158],"implementations.":[159],"black-box":[161],"approach":[162],"ensures":[163],"verification":[164],"consistent":[166],"across":[167],"languages,":[168],"our":[170],"environment":[171],"hides":[172],"all":[173],"suites":[175],"prevent":[179],"shortcuts.":[181],"Evaluating":[182],"four":[183],"state-of-the-art":[184],"agent":[185],"configurations":[186],"reveals":[187],"sharp":[189],"scaling":[190],"collapse:":[191],"average":[192],"pass":[193],"rates":[194],"drop":[195],"91.3%":[197],"projects":[199,206],"under":[200],"10K":[201],"LOC":[202],"15.3%":[204],"exceeding":[207],"50K":[208],"These":[210],"results":[211],"demonstrate":[212],"that":[213],"at":[216,229],"scale":[217],"significant":[220],"open":[221],"challenge.":[222],"Our":[223],"available":[228],"https://github.com/Modelcode-ai/mcode-benchmark.":[230]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-28T00:00:00"}
