{"id":"https://openalex.org/W7160879234","doi":"https://doi.org/10.48550/arxiv.2605.06754","title":"ScarfBench: A Benchmark for Cross-Framework Application Migration in Enterprise Java","display_name":"ScarfBench: A Benchmark for Cross-Framework Application Migration in Enterprise Java","publication_year":2026,"publication_date":"2026-05-07","ids":{"openalex":"https://openalex.org/W7160879234","doi":"https://doi.org/10.48550/arxiv.2605.06754"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.06754","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06754","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.06754","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135896054","display_name":"Advait Pavuluri","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pavuluri, Advait","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115766850","display_name":"Bridget McGinn","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"McGinn, Bridget","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112617383","display_name":"Ashita Saxena","orcid":"https://orcid.org/0009-0001-5244-0695"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saxena, Ashita","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135832536","display_name":"George Safta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Safta, George","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135902448","display_name":"Srikanth Tamilselvam","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tamilselvam, Srikanth","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087072038","display_name":"Raju Pavuluri","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pavuluri, Raju","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068061267","display_name":"Michele Merler","orcid":"https://orcid.org/0000-0002-4358-8671"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Merler, Michele","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135840062","display_name":"Baishakhi Ray","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ray, Baishakhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135849255","display_name":"Rahul Krishna","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Krishna, Rahul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.3495999872684479,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.3495999872684479,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.298799991607666,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10639","display_name":"Advanced Software Engineering Methodologies","score":0.15129999816417694,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/code-refactoring","display_name":"Code refactoring","score":0.9258999824523926},{"id":"https://openalex.org/keywords/java","display_name":"Java","score":0.6858000159263611},{"id":"https://openalex.org/keywords/executable","display_name":"Executable","score":0.6826000213623047},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.6215999722480774},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.46810001134872437},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.4327000081539154},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.38370001316070557},{"id":"https://openalex.org/keywords/test-case","display_name":"Test case","score":0.38350000977516174},{"id":"https://openalex.org/keywords/dependency-graph","display_name":"Dependency graph","score":0.3310999870300293},{"id":"https://openalex.org/keywords/plug-in","display_name":"Plug-in","score":0.30959999561309814}],"concepts":[{"id":"https://openalex.org/C152752567","wikidata":"https://www.wikidata.org/wiki/Q116877","display_name":"Code refactoring","level":3,"score":0.9258999824523926},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7843999862670898},{"id":"https://openalex.org/C548217200","wikidata":"https://www.wikidata.org/wiki/Q251","display_name":"Java","level":2,"score":0.6858000159263611},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.6826000213623047},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.6215999722480774},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.6194000244140625},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.4772000014781952},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.46810001134872437},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.4327000081539154},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.38370001316070557},{"id":"https://openalex.org/C128942645","wikidata":"https://www.wikidata.org/wiki/Q1568346","display_name":"Test case","level":3,"score":0.38350000977516174},{"id":"https://openalex.org/C16311509","wikidata":"https://www.wikidata.org/wiki/Q4148050","display_name":"Dependency graph","level":3,"score":0.3310999870300293},{"id":"https://openalex.org/C4924752","wikidata":"https://www.wikidata.org/wiki/Q184148","display_name":"Plug-in","level":2,"score":0.30959999561309814},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.2976999878883362},{"id":"https://openalex.org/C2775941552","wikidata":"https://www.wikidata.org/wiki/Q25212305","display_name":"Isolation (microbiology)","level":2,"score":0.29580000042915344},{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.29120001196861267},{"id":"https://openalex.org/C2781009160","wikidata":"https://www.wikidata.org/wiki/Q735604","display_name":"AspectJ","level":4,"score":0.2883000075817108},{"id":"https://openalex.org/C2780069185","wikidata":"https://www.wikidata.org/wiki/Q7977945","display_name":"Equivalence (formal languages)","level":2,"score":0.28529998660087585},{"id":"https://openalex.org/C19768560","wikidata":"https://www.wikidata.org/wiki/Q320727","display_name":"Dependency (UML)","level":2,"score":0.27970001101493835},{"id":"https://openalex.org/C105446022","wikidata":"https://www.wikidata.org/wiki/Q445962","display_name":"Legacy system","level":3,"score":0.27129998803138733},{"id":"https://openalex.org/C101317890","wikidata":"https://www.wikidata.org/wiki/Q940053","display_name":"Software maintenance","level":4,"score":0.27070000767707825},{"id":"https://openalex.org/C154504017","wikidata":"https://www.wikidata.org/wiki/Q853614","display_name":"Identifier","level":2,"score":0.27070000767707825},{"id":"https://openalex.org/C145644426","wikidata":"https://www.wikidata.org/wiki/Q169411","display_name":"Unified Modeling Language","level":3,"score":0.2689000070095062},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.26840001344680786},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2630000114440918},{"id":"https://openalex.org/C150202949","wikidata":"https://www.wikidata.org/wiki/Q107602","display_name":"Pointer (user interface)","level":2,"score":0.2621000111103058},{"id":"https://openalex.org/C2779639559","wikidata":"https://www.wikidata.org/wiki/Q7661178","display_name":"Symbolic execution","level":3,"score":0.26159998774528503},{"id":"https://openalex.org/C51929080","wikidata":"https://www.wikidata.org/wiki/Q2425187","display_name":"Codebase","level":3,"score":0.26010000705718994},{"id":"https://openalex.org/C97686452","wikidata":"https://www.wikidata.org/wiki/Q7604153","display_name":"Static analysis","level":2,"score":0.25429999828338623},{"id":"https://openalex.org/C199519371","wikidata":"https://www.wikidata.org/wiki/Q942695","display_name":"Source lines of code","level":3,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.06754","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06754","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.06754","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.06754","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.7037526965141296,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Java":[0,61],"remains":[1],"central":[2],"to":[3],"enterprise":[4,60],"software,":[5],"and":[6,29,39,74,91,94,108,141,169,174,193,202,209,226,234],"many":[7],"applications":[8,77],"outlive":[9],"their":[10],"original":[11],"architecture.":[12],"Migrating":[13],"them":[14],"across":[15,70,88,190],"frameworks":[16],"is":[17,64,124,188,197],"a":[18,53,104,109,116,137,182,217],"behavior-preserving":[19,56],"refactoring":[20,47,58,97],"spanning":[21,223],"build":[22],"configuration,":[23],"dependency":[24],"injection,":[25],"persistence,":[26],"request":[27],"handling,":[28],"deployment.":[30],"Existing":[31],"software-engineering":[32],"benchmarks":[33],"cover":[34],"bug":[35],"fixing,":[36],"feature":[37],"implementation,":[38],"language":[40],"or":[41],"version":[42],"modernization,":[43],"but":[44],"leave":[45],"cross-framework":[46,57],"largely":[48],"unmeasured.":[49],"We":[50,150,229],"introduce":[51],"ScarfBench,":[52],"benchmark":[54],"for":[55],"of":[59,177,212,219],"applications.":[62],"It":[63],"built":[65],"from":[66],"expert-written":[67],"implementation":[68,118],"triples":[69],"Spring,":[71],"Jakarta":[72],"EE,":[73],"Quarkus:":[75],"34":[76],"(29":[78],"focused":[79],"single-layer,":[80],"5":[81],"whole)":[82],"yielding":[83],"102":[84],"variants":[85],"(~151K":[86],"lines":[87],"1946":[89],"source":[90,106,121],"test":[92,164,227],"files)":[93],"204":[95,179],"directed":[96],"tasks.":[98],"Each":[99],"task":[100],"gives":[101],"an":[102,127],"agent":[103,113,235],"working":[105],"application":[107],"target":[110,117,139],"framework;":[111],"the":[112,120,131,146,178,198,231],"must":[114,133],"synthesize":[115],"preserving":[119],"behavior.":[122],"Correctness":[123],"evaluated":[125],"by":[126],"application-specific":[128],"executable":[129],"oracle:":[130],"candidate":[132],"compile,":[134],"deploy":[135],"in":[136],"containerized":[138],"runtime,":[140],"pass":[142,165],"behavioral":[143],"tests":[144],"over":[145],"application's":[147],"observable":[148],"interface.":[149],"evaluate":[151],"five":[152],"state-of-the-art":[153],"coding":[154],"agents":[155],"on":[156,166,171],"ScarfBench.":[157],"The":[158],"strongest":[159],"achieves":[160],"only":[161,175],"15.3%":[162],"aggregate":[163],"focused-layer":[167],"migrations":[168,204],"12.2%":[170],"whole":[172],"applications,":[173],"one":[176],"tasks":[180],"yields":[181],"fully":[183],"behaviorally":[184],"equivalent":[185],"target.":[186],"Difficulty":[187],"asymmetric":[189],"framework":[191],"directions":[192],"architectural":[194],"layers:":[195],"Spring&lt;-&gt;Quarkus":[196],"most":[199],"tractable":[200],"pair,":[201],"Jakarta-targeted":[203],"are":[205],"hardest.":[206],"From":[207],"LLM-as-a-judge":[208],"expert":[210],"adjudication":[211],"failed-task":[213],"traces,":[214],"we":[215],"derive":[216],"taxonomy":[218],"recurring":[220],"failure":[221],"categories":[222],"build,":[224],"deploy,":[225],"stages.":[228],"release":[230],"benchmark,":[232],"harness,":[233],"traces":[236],"at":[237],"https://scarfbench.info.":[238]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-12T00:00:00"}
