{"id":"https://openalex.org/W7159654435","doi":"https://doi.org/10.48550/arxiv.2604.27319","title":"REBENCH: A Procedural, Fair-by-Construction Benchmark for LLMs on Stripped-Binary Types and Names (Extended Version)","display_name":"REBENCH: A Procedural, Fair-by-Construction Benchmark for LLMs on Stripped-Binary Types and Names (Extended Version)","publication_year":2026,"publication_date":"2026-04-30","ids":{"openalex":"https://openalex.org/W7159654435","doi":"https://doi.org/10.48550/arxiv.2604.27319"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.27319","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.27319","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.27319","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037608453","display_name":"Jun Yeon Won","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Won, Jun Yeon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134983251","display_name":"Xin Jin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Xin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134945818","display_name":"Shiqing Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Shiqing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134942072","display_name":"Zhiqiang Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Zhiqiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.18050000071525574,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.18050000071525574,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.09059999883174896,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.07980000227689743,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7247999906539917},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.5339000225067139},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5102999806404114},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4869999885559082},{"id":"https://openalex.org/keywords/reverse-engineering","display_name":"Reverse engineering","score":0.4602000117301941},{"id":"https://openalex.org/keywords/call-stack","display_name":"Call stack","score":0.4117000102996826},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.39879998564720154}],"concepts":[{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7247999906539917},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6391000151634216},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.5339000225067139},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5102999806404114},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4869999885559082},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4747999906539917},{"id":"https://openalex.org/C207850805","wikidata":"https://www.wikidata.org/wiki/Q269608","display_name":"Reverse engineering","level":2,"score":0.4602000117301941},{"id":"https://openalex.org/C119024030","wikidata":"https://www.wikidata.org/wiki/Q759899","display_name":"Call stack","level":3,"score":0.4117000102996826},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.4025000035762787},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.39879998564720154},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.3847000002861023},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.37599998712539673},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.2915000021457672},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.287200003862381},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.2840999960899353},{"id":"https://openalex.org/C182365436","wikidata":"https://www.wikidata.org/wiki/Q50701","display_name":"Variable (mathematics)","level":2,"score":0.28130000829696655},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.2759999930858612},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2671999931335449},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.2639000117778778},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2513999938964844}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.27319","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.27319","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.27319","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.27319","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"have":[4],"achieved":[5],"remarkable":[6],"progress":[7,53],"in":[8,50,89,197],"recent":[9],"years,":[10],"driving":[11],"their":[12],"adoption":[13],"across":[14,168],"a":[15,61,83,99,113,128,141,178],"wide":[16],"range":[17],"of":[18,48,60,86,115,120,122,124,131,190],"domains,":[19],"including":[20],"computer":[21],"security.":[22],"In":[23],"reverse":[24,108,187],"engineering,":[25],"LLMs":[26,105,191],"are":[27],"increasingly":[28],"applied":[29],"to":[30,149,184],"critical":[31],"tasks":[32,169],"such":[33],"as":[34],"function":[35],"and":[36,40,72,81,127,136,192],"variable":[37],"name":[38],"recovery":[39],"type":[41],"inference.":[42],"However,":[43],"despite":[44],"the":[45,58,186,193],"rapid":[46],"growth":[47],"research":[49],"this":[51],"area,":[52],"has":[54],"been":[55],"hindered":[56],"by":[57],"absence":[59],"standardized":[62],"dataset.":[63],"Existing":[64],"studies":[65],"rely":[66],"on":[67,106],"disparate":[68],"datasets,":[69,117],"preprocessing":[70],"pipelines,":[71],"evaluation":[73,167],"metrics,":[74],"making":[75],"fair":[76,166],"comparisons":[77],"between":[78],"approaches":[79],"difficult":[80],"obscuring":[82],"clear":[84],"understanding":[85],"LLM":[87],"capabilities":[88],"binary":[90,107],"analysis.":[91],"To":[92],"address":[93],"these":[94],"challenges,":[95],"we":[96,181],"present":[97],"REBench,":[98],"comprehensive":[100],"benchmark":[101],"dataset":[102],"for":[103],"evaluating":[104],"engineering":[109,188],"tasks.":[110,199],"REBench":[111,139,183],"consolidates":[112],"superset":[114],"existing":[116],"comprising":[118],"hundreds":[119],"millions":[121],"lines":[123],"source":[125],"code":[126],"diverse":[129],"collection":[130],"binaries":[132],"spanning":[133],"multiple":[134],"architectures":[135],"optimization":[137],"levels.":[138],"adopts":[140],"knowledge-base-driven":[142],"methodology":[143],"that":[144,154,173],"stores":[145],"byte-level":[146],"stack":[147],"information":[148],"generate":[150],"ground":[151],"truth,":[152],"ensuring":[153],"task":[155],"difficulty":[156],"is":[157],"preserved":[158],"while":[159,170],"maintaining":[160],"universal":[161],"applicability.":[162],"This":[163],"design":[164],"enables":[165],"avoiding":[171],"simplifications":[172],"could":[174],"bias":[175],"results.":[176],"As":[177],"use":[179],"case,":[180],"apply":[182],"measure":[185],"performance":[189],"result":[194],"demonstrates":[195],"difficulties":[196],"complex":[198]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-02T00:00:00"}
