{"id":"https://openalex.org/W7134813417","doi":"https://doi.org/10.48550/arxiv.2603.08225","title":"Practical Type Inference: High-Throughput Recovery of Real-World Structures and Function Signatures","display_name":"Practical Type Inference: High-Throughput Recovery of Real-World Structures and Function Signatures","publication_year":2026,"publication_date":"2026-03-09","ids":{"openalex":"https://openalex.org/W7134813417","doi":"https://doi.org/10.48550/arxiv.2603.08225"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.08225","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128633979","display_name":"Lukas Seidel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Seidel, Lukas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128676575","display_name":"Sam Thomas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Thomas, Sam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5066077721","display_name":"Konrad Rieck","orcid":"https://orcid.org/0000-0002-5054-8758"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rieck, Konrad","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.22419999539852142,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.22419999539852142,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.10750000178813934,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.07429999858140945,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6603999733924866},{"id":"https://openalex.org/keywords/type-inference","display_name":"Type inference","score":0.5595999956130981},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.5436000227928162},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5356000065803528},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5238000154495239},{"id":"https://openalex.org/keywords/realization","display_name":"Realization (probability)","score":0.5224999785423279},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.4309000074863434},{"id":"https://openalex.org/keywords/struct","display_name":"struct","score":0.42559999227523804},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.4203000068664551}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6983000040054321},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6603999733924866},{"id":"https://openalex.org/C198370458","wikidata":"https://www.wikidata.org/wiki/Q586459","display_name":"Type inference","level":3,"score":0.5595999956130981},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.5436000227928162},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5356000065803528},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5238000154495239},{"id":"https://openalex.org/C2781089630","wikidata":"https://www.wikidata.org/wiki/Q21856745","display_name":"Realization (probability)","level":2,"score":0.5224999785423279},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.45989999175071716},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4309000074863434},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4293999969959259},{"id":"https://openalex.org/C2776142590","wikidata":"https://www.wikidata.org/wiki/Q1164699","display_name":"struct","level":2,"score":0.42559999227523804},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.4203000068664551},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.41920000314712524},{"id":"https://openalex.org/C2777299769","wikidata":"https://www.wikidata.org/wiki/Q3707858","display_name":"Type (biology)","level":2,"score":0.41620001196861267},{"id":"https://openalex.org/C2779696439","wikidata":"https://www.wikidata.org/wiki/Q7512811","display_name":"Signature (topology)","level":2,"score":0.40939998626708984},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.35569998621940613},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.33570000529289246},{"id":"https://openalex.org/C2778067643","wikidata":"https://www.wikidata.org/wiki/Q166507","display_name":"Interval (graph theory)","level":2,"score":0.3314000070095062},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33000001311302185},{"id":"https://openalex.org/C75291252","wikidata":"https://www.wikidata.org/wiki/Q1315756","display_name":"TRACE (psycholinguistics)","level":2,"score":0.274399995803833},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.2712000012397766},{"id":"https://openalex.org/C113364801","wikidata":"https://www.wikidata.org/wiki/Q26674","display_name":"High fidelity","level":2,"score":0.2639999985694885},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.263700008392334},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.2551000118255615},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.2538999915122986},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2517000138759613}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.08225","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.08225","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.08225","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.08225","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"recovery":[1],"of":[2,93,125,140],"types":[3],"from":[4],"stripped":[5],"binaries":[6],"is":[7,49,58,115],"a":[8,170],"key":[9],"to":[10,30,90,165,182],"exact":[11],"decompilation,":[12],"yet":[13],"its":[14],"practical":[15],"realization":[16],"suffers.":[17],"For":[18],"composite":[19],"structures":[20],"in":[21,61,85,96,117,187],"particular,":[22],"both":[23],"layout":[24],"and":[25,78,108],"semantic":[26],"fidelity":[27],"are":[28],"required":[29],"enable":[31],"end-to-end":[32],"reconstruction.":[33],"Many":[34],"existing":[35],"approaches":[36],"either":[37],"synthesize":[38],"layouts":[39],"or":[40],"infer":[41],"names":[42],"post-hoc,":[43],"which":[44],"weakens":[45],"downstream":[46],"usability.":[47],"This":[48],"further":[50],"aggravated":[51],"by":[52,147],"an":[53,67,130],"excessive":[54],"runtime":[55],"overhead":[56],"that":[57,71,160,178],"especially":[59],"prohibitive":[60],"automated":[62,86],"environments.":[63],"We":[64],"present":[65],"XTRIDE,":[66],"improved":[68],"n-gram-based":[69,161],"approach":[70,181],"focuses":[72],"on":[73,143,173],"practicality:":[74],"highly":[75],"optimized":[76,131],"throughput":[77],"actionable":[79],"confidence":[80],"scores":[81],"allow":[82],"for":[83],"deployment":[84],"pipelines.":[87],"When":[88],"compared":[89],"the":[91,94,122,137,141,144],"state":[92,139],"art":[95,142],"struct":[97,127],"recovery,":[98],"our":[99,113,134],"method":[100],"achieves":[101],"comparable":[102],"performance":[103],"while":[104],"being":[105],"between":[106],"70":[107],"2300":[109],"times":[110],"faster.":[111],"As":[112],"inference":[114,154],"grounded":[116],"real-world":[118],"types,":[119],"we":[120,158,176],"achieve":[121],"highest":[123],"ratio":[124],"fully-correct":[126],"layouts.":[128],"With":[129],"training":[132],"regimen,":[133],"model":[135],"outperforms":[136],"current":[138],"DIRT":[145],"dataset":[146],"5.09":[148],"percentage":[149],"points,":[150],"achieving":[151],"90.15%":[152],"type":[153,162],"accuracy":[155],"overall.":[156],"Furthermore,":[157],"show":[159,177],"prediction":[163],"generalizes":[164],"function":[166,183],"signature":[167],"recovery:":[168],"conducting":[169],"case":[171],"study":[172],"embedded":[174],"firmware,":[175],"this":[179],"efficient":[180],"similarity":[184],"can":[185],"assist":[186],"typical":[188],"reverse":[189],"engineering":[190],"tasks.":[191]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-11T00:00:00"}
