{"id":"https://openalex.org/W4411232016","doi":"https://doi.org/10.1109/jiot.2025.3579231","title":"Binary Code Similarity Detection via LLM-Based Source Code Conversion","display_name":"Binary Code Similarity Detection via LLM-Based Source Code Conversion","publication_year":2025,"publication_date":"2025-06-12","ids":{"openalex":"https://openalex.org/W4411232016","doi":"https://doi.org/10.1109/jiot.2025.3579231"},"language":"en","primary_location":{"id":"doi:10.1109/jiot.2025.3579231","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2025.3579231","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114155127","display_name":"Bangrui Wan","orcid":null},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bangrui Wan","raw_affiliation_strings":["School of Big Data and Software Engineering, Chongqing University, Chongqing, China"],"raw_orcid":"https://orcid.org/0009-0001-0769-2527","affiliations":[{"raw_affiliation_string":"School of Big Data and Software Engineering, Chongqing University, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100437635","display_name":"Shiyu Wang","orcid":"https://orcid.org/0000-0003-1904-6781"},"institutions":[{"id":"https://openalex.org/I10535382","display_name":"Chongqing University of Posts and Telecommunications","ror":"https://ror.org/03dgaqz26","country_code":"CN","type":"education","lineage":["https://openalex.org/I10535382"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiyu Wang","raw_affiliation_strings":["School of Software Engineering, Chongqing University of Posts and Telecommunications, Chongqing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Software Engineering, Chongqing University of Posts and Telecommunications, Chongqing, China","institution_ids":["https://openalex.org/I10535382"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zheng Wei","orcid":null},"institutions":[{"id":"https://openalex.org/I10535382","display_name":"Chongqing University of Posts and Telecommunications","ror":"https://ror.org/03dgaqz26","country_code":"CN","type":"education","lineage":["https://openalex.org/I10535382"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zheng Wei","raw_affiliation_strings":["School of Software Engineering, Chongqing University of Posts and Telecommunications, Chongqing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Software Engineering, Chongqing University of Posts and Telecommunications, Chongqing, China","institution_ids":["https://openalex.org/I10535382"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082630903","display_name":"Jiangping Huang","orcid":"https://orcid.org/0000-0002-0288-6824"},"institutions":[{"id":"https://openalex.org/I10535382","display_name":"Chongqing University of Posts and Telecommunications","ror":"https://ror.org/03dgaqz26","country_code":"CN","type":"education","lineage":["https://openalex.org/I10535382"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiangping Huang","raw_affiliation_strings":["School of Software Engineering, Chongqing University of Posts and Telecommunications, Chongqing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Software Engineering, Chongqing University of Posts and Telecommunications, Chongqing, China","institution_ids":["https://openalex.org/I10535382"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007408033","display_name":"Chunqiang Hu","orcid":"https://orcid.org/0000-0001-5825-2241"},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunqiang Hu","raw_affiliation_strings":["School of Big Data and Software Engineering, Chongqing University, Chongqing, China"],"raw_orcid":"https://orcid.org/0000-0001-5825-2241","affiliations":[{"raw_affiliation_string":"School of Big Data and Software Engineering, Chongqing University, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.7179,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.94603423,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"12","issue":"24","first_page":"51842","last_page":"51853"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12479","display_name":"Web Application Security Vulnerabilities","score":0.98580002784729,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12479","display_name":"Web Application Security Vulnerabilities","score":0.98580002784729,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9829999804496765,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9797000288963318,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7955923676490784},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5962302088737488},{"id":"https://openalex.org/keywords/source-code","display_name":"Source code","score":0.5551420450210571},{"id":"https://openalex.org/keywords/binary-code","display_name":"Binary code","score":0.4970689117908478},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.43527013063430786},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3216836750507355},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.31064271926879883},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.09329423308372498},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08423104882240295}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7955923676490784},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5962302088737488},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.5551420450210571},{"id":"https://openalex.org/C63435697","wikidata":"https://www.wikidata.org/wiki/Q864135","display_name":"Binary code","level":3,"score":0.4970689117908478},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.43527013063430786},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3216836750507355},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.31064271926879883},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.09329423308372498},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08423104882240295},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/jiot.2025.3579231","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2025.3579231","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5241027089","display_name":null,"funder_award_id":"CSTB2023TIAD-STX0034","funder_id":"https://openalex.org/F4320336612","funder_display_name":"Science and Technology Innovation Foundation of Harbin"},{"id":"https://openalex.org/G5461883845","display_name":null,"funder_award_id":"CSTB2024NSCQ-LZX0084","funder_id":"https://openalex.org/F4320323172","funder_display_name":"Natural Science Foundation of Chongqing"},{"id":"https://openalex.org/G6005639586","display_name":null,"funder_award_id":"62372075","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7516134290","display_name":null,"funder_award_id":"CSTB2023TIAD-STX0034","funder_id":"https://openalex.org/F4320321550","funder_display_name":"Chongqing Science and Technology Commission"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321550","display_name":"Chongqing Science and Technology Commission","ror":"https://ror.org/05w9erc61"},{"id":"https://openalex.org/F4320323172","display_name":"Natural Science Foundation of Chongqing","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320336612","display_name":"Science and Technology Innovation Foundation of Harbin","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W2041839827","https://openalex.org/W2532962075","https://openalex.org/W2577142429","https://openalex.org/W2618635610","https://openalex.org/W2749008552","https://openalex.org/W2886694146","https://openalex.org/W2901689459","https://openalex.org/W2926178846","https://openalex.org/W3007413911","https://openalex.org/W3108936298","https://openalex.org/W3127424491","https://openalex.org/W3177323791","https://openalex.org/W4285586654","https://openalex.org/W4310494122","https://openalex.org/W4322766882","https://openalex.org/W4324007217","https://openalex.org/W4362615084","https://openalex.org/W4381050433","https://openalex.org/W4386211610","https://openalex.org/W4386608469","https://openalex.org/W4387344039","https://openalex.org/W4390067041","https://openalex.org/W4402667093","https://openalex.org/W4407678844"],"related_works":["https://openalex.org/W3081644756","https://openalex.org/W2134880816","https://openalex.org/W2111298487","https://openalex.org/W4308157887","https://openalex.org/W2510680828","https://openalex.org/W2765199869","https://openalex.org/W2055498716","https://openalex.org/W1984130439","https://openalex.org/W4386075138","https://openalex.org/W2371359060"],"abstract_inverted_index":{"Binary":[0],"Code":[1],"Similarity":[2],"Detection":[3],"(BCSD),":[4],"a":[5,80,86],"technique":[6],"for":[7,22],"assessing":[8],"the":[9,41,50,61,104,116,129,136,193],"similarity":[10,66,117,131,134,184],"between":[11,68,118,186],"two":[12,38,120],"given":[13],"binary":[14,53,69,93,121,187],"code":[15,54,70,94,97,109,122,188],"snippets,":[16],"holds":[17],"significant":[18],"value":[19],"in":[20,172],"searching":[21],"vulnerable":[23,173],"functions":[24,123],"within":[25,176],"embedded":[26],"device":[27,179],"firmware,":[28],"which":[29,56],"is":[30],"typically":[31],"closed-source.":[32],"However,":[33],"existing":[34],"BCSD":[35,82],"approaches":[36],"face":[37],"major":[39],"challenges:":[40],"irreversible":[42],"loss":[43],"of":[44,52,135,152,195],"semantic":[45],"and":[46,60,71,110,132,156,164,189],"structural":[47],"information":[48],"during":[49],"process":[51],"compilation,":[55],"affects":[57],"detection":[58,67,185,196],"performance;":[59],"inability":[62],"to":[63,91,106],"directly":[64],"perform":[65],"source":[72,96,113,138,190],"code.":[73,114,139],"In":[74],"this":[75],"paper,":[76],"we":[77],"present":[78],"Bin2SrcSim,":[79],"novel":[81],"approach":[83],"that":[84,144],"employs":[85],"Large":[87],"Language":[88],"Model":[89],"(LLM)":[90],"convert":[92],"into":[95,112],"representations.":[98],"Bin2SrcSim":[99,145,167,182],"fine-tunes":[100],"an":[101],"LLM":[102],"at":[103],"function-level":[105],"transform":[107],"assembly":[108],"pseudocode":[111],"Consequently,":[115],"any":[119],"can":[124],"be":[125],"assessed":[126],"by":[127],"calculating":[128],"cosine":[130],"Jaccard":[133],"transformed":[137],"The":[140],"experimental":[141],"results":[142],"demonstrate":[143],"outperforms":[146],"all":[147],"baselines,":[148],"achieving":[149],"Recall@1":[150],"scores":[151],"0.82,":[153],"0.83,":[154],"0.93,":[155],"0.81":[157],"across":[158],"various":[159],"scenarios":[160],"involving":[161],"cross-architecture,":[162],"cross-compiler,":[163],"cross-optimization":[165],"levels.":[166],"also":[168],"demonstrates":[169],"satisfactory":[170],"performance":[171],"function":[174],"search":[175],"real-world":[177],"IoT":[178],"firmware.":[180],"Moreover,":[181],"supports":[183],"code,":[191],"expanding":[192],"scope":[194],"applications.":[197]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
