{"id":"https://openalex.org/W4415428521","doi":"https://doi.org/10.3233/faia251283","title":"ASMA-Tune: Unlocking LLMs\u2019 Assembly Code Comprehension via Structural-Semantic Instruction Tuning","display_name":"ASMA-Tune: Unlocking LLMs\u2019 Assembly Code Comprehension via Structural-Semantic Instruction Tuning","publication_year":2025,"publication_date":"2025-10-21","ids":{"openalex":"https://openalex.org/W4415428521","doi":"https://doi.org/10.3233/faia251283"},"language":null,"primary_location":{"id":"doi:10.3233/faia251283","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251283","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.3233/faia251283","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033623381","display_name":"X. Christine Wang","orcid":"https://orcid.org/0000-0002-1557-9583"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xinyi Wang","raw_affiliation_strings":["Nankai University (College of Cryptology and Cyber Science, Nankai University), TKLNDST (Tianjin Key Laboratory of Network and Data Security Technology) & DISSEC (Key Laboratory of Data and Intelligent System Security, Ministry of Education, China), Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Nankai University (College of Cryptology and Cyber Science, Nankai University), TKLNDST (Tianjin Key Laboratory of Network and Data Security Technology) & DISSEC (Key Laboratory of Data and Intelligent System Security, Ministry of Education, China), Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059024183","display_name":"Jiashui Wang","orcid":"https://orcid.org/0000-0002-3608-888X"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiashui Wang","raw_affiliation_strings":["Ant Group","Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Ant Group","institution_ids":[]},{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085904321","display_name":"Jiangtao Su","orcid":"https://orcid.org/0000-0002-5152-7318"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinbo Su","raw_affiliation_strings":["Renmin University of China"],"affiliations":[{"raw_affiliation_string":"Renmin University of China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100360160","display_name":"Ke Wang","orcid":"https://orcid.org/0000-0003-4508-1302"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ke Wang","raw_affiliation_strings":["Renmin University of China"],"affiliations":[{"raw_affiliation_string":"Renmin University of China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102027852","display_name":"Peng Chen","orcid":"https://orcid.org/0009-0006-4802-2382"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Chen","raw_affiliation_strings":["University of the Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"University of the Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107947108","display_name":"Yanming Liu","orcid":"https://orcid.org/0009-0000-7895-3547"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanming Liu","raw_affiliation_strings":["Zhejiang University"],"affiliations":[{"raw_affiliation_string":"Zhejiang University","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057532144","display_name":"Long Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Long Liu","raw_affiliation_strings":["Ant Group"],"affiliations":[{"raw_affiliation_string":"Ant Group","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100674281","display_name":"Xiang Li","orcid":"https://orcid.org/0000-0002-6482-2535"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiang Li","raw_affiliation_strings":["Nankai University (College of Cryptology and Cyber Science, Nankai University), TKLNDST (Tianjin Key Laboratory of Network and Data Security Technology) & DISSEC (Key Laboratory of Data and Intelligent System Security, Ministry of Education, China), Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Nankai University (College of Cryptology and Cyber Science, Nankai University), TKLNDST (Tianjin Key Laboratory of Network and Data Security Technology) & DISSEC (Key Laboratory of Data and Intelligent System Security, Ministry of Education, China), Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100322753","display_name":"Yan Wang","orcid":"https://orcid.org/0000-0002-6475-5045"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yangdong Wang","raw_affiliation_strings":["Ant Group"],"affiliations":[{"raw_affiliation_string":"Ant Group","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101830428","display_name":"Qiyuan Chen","orcid":"https://orcid.org/0009-0009-0701-8784"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qiyuan Chen","raw_affiliation_strings":["Ant Group"],"affiliations":[{"raw_affiliation_string":"Ant Group","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052511548","display_name":"R. H. Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rongze Chen","raw_affiliation_strings":["Nankai University (College of Cryptology and Cyber Science, Nankai University), TKLNDST (Tianjin Key Laboratory of Network and Data Security Technology) & DISSEC (Key Laboratory of Data and Intelligent System Security, Ministry of Education, China), Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Nankai University (College of Cryptology and Cyber Science, Nankai University), TKLNDST (Tianjin Key Laboratory of Network and Data Security Technology) & DISSEC (Key Laboratory of Data and Intelligent System Security, Ministry of Education, China), Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005646333","display_name":"Chunfu Jia","orcid":"https://orcid.org/0000-0002-5588-9690"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunfu Jia","raw_affiliation_strings":["Nankai University (College of Cryptology and Cyber Science, Nankai University), TKLNDST (Tianjin Key Laboratory of Network and Data Security Technology) & DISSEC (Key Laboratory of Data and Intelligent System Security, Ministry of Education, China), Tianjin, China"],"affiliations":[{"raw_affiliation_string":"Nankai University (College of Cryptology and Cyber Science, Nankai University), TKLNDST (Tianjin Key Laboratory of Network and Data Security Technology) & DISSEC (Key Laboratory of Data and Intelligent System Security, Ministry of Education, China), Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5033623381"],"corresponding_institution_ids":["https://openalex.org/I205237279"],"apc_list":null,"apc_paid":null,"fwci":6.4467,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.97046352,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11159","display_name":"Manufacturing Process and Optimization","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11159","display_name":"Manufacturing Process and Optimization","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9746999740600586,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9101999998092651,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.676800012588501},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.5634999871253967},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5045999884605408},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4853000044822693},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.47859999537467957},{"id":"https://openalex.org/keywords/assembly-language","display_name":"Assembly language","score":0.4587000012397766},{"id":"https://openalex.org/keywords/program-comprehension","display_name":"Program comprehension","score":0.424699991941452},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4203999936580658},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.41370001435279846},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.3944000005722046}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.771399974822998},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.676800012588501},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.5634999871253967},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5045999884605408},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4853000044822693},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.47859999537467957},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4756999909877777},{"id":"https://openalex.org/C50831359","wikidata":"https://www.wikidata.org/wiki/Q165436","display_name":"Assembly language","level":3,"score":0.4587000012397766},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42649999260902405},{"id":"https://openalex.org/C2777561058","wikidata":"https://www.wikidata.org/wiki/Q2652119","display_name":"Program comprehension","level":4,"score":0.424699991941452},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4203999936580658},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.41370001435279846},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.3944000005722046},{"id":"https://openalex.org/C2776187449","wikidata":"https://www.wikidata.org/wiki/Q1513879","display_name":"Natural language generation","level":3,"score":0.3806999921798706},{"id":"https://openalex.org/C63435697","wikidata":"https://www.wikidata.org/wiki/Q864135","display_name":"Binary code","level":3,"score":0.3792000114917755},{"id":"https://openalex.org/C2779439875","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Natural language understanding","level":3,"score":0.3767000138759613},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.35339999198913574},{"id":"https://openalex.org/C2776865275","wikidata":"https://www.wikidata.org/wiki/Q311666","display_name":"Projector","level":2,"score":0.35260000824928284},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.35249999165534973},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3522999882698059},{"id":"https://openalex.org/C133162039","wikidata":"https://www.wikidata.org/wiki/Q1061077","display_name":"Code generation","level":3,"score":0.34790000319480896},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3174000084400177},{"id":"https://openalex.org/C18552078","wikidata":"https://www.wikidata.org/wiki/Q255615","display_name":"Code-switching","level":2,"score":0.3140999972820282},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.30219998955726624},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.29989999532699585},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.2987000048160553},{"id":"https://openalex.org/C83479923","wikidata":"https://www.wikidata.org/wiki/Q2063748","display_name":"Universal Networking Language","level":4,"score":0.28299999237060547},{"id":"https://openalex.org/C77660490","wikidata":"https://www.wikidata.org/wiki/Q244916","display_name":"Intermediate language","level":3,"score":0.2720000147819519},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.26330000162124634},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.2621000111103058},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.25220000743865967},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.25110000371932983},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/faia251283","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251283","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.3233/faia251283","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251283","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Assembly":[0,65],"code":[1,157],"analysis":[2,56],"and":[3,23,102,125,139,145,148],"comprehension":[4,121],"play":[5],"critical":[6],"roles":[7],"in":[8,54,119],"applications":[9],"like":[10],"reverse":[11],"engineering,":[12],"yet":[13,57],"they":[14],"face":[15],"substantial":[16],"challenges":[17],"due":[18],"to":[19,161],"low":[20],"information":[21],"density":[22],"a":[24,83],"lack":[25],"of":[26],"explicit":[27],"syntactic":[28],"structures.":[29],"While":[30],"traditional":[31],"masked":[32],"language":[33,43,48,108],"modeling":[34],"(MLM)":[35],"approaches":[36],"do":[37],"not":[38],"explicitly":[39],"focus":[40],"on":[41,142],"natural":[42,107],"interaction,":[44],"emerging":[45],"decoder-focused":[46],"large":[47],"models":[49,136],"(LLMs)":[50],"demonstrate":[51,112],"partial":[52],"success":[53],"binary":[55],"remain":[58],"underexplored":[59],"for":[60],"holistic":[61],"comprehension.":[62],"We":[63],"present":[64],"Augmented":[66],"Tuning":[67],"(ASMA-Tune),":[68],"an":[69],"end-to-end":[70],"structural-semantic":[71],"instruction":[72],"tuning":[73],"framework":[74],"that":[75],"synergizes":[76],"encoder":[77,89],"architecture":[78],"with":[79,98,122,155],"decoder-based":[80],"LLMs":[81],"through":[82],"projector":[84,95],"module,":[85],"where":[86],"the":[87,94,99,103],"assembly":[88,120],"extracts":[90],"hardware-level":[91],"structural":[92],"features,":[93],"bridges":[96],"representations":[97],"semantic":[100],"space,":[101],"instruction-tuned":[104],"LLM":[105],"preserves":[106],"capabilities.":[109],"Experimental":[110],"results":[111],"three":[113],"key":[114],"advantages:":[115],"(1)":[116],"State-of-the-art":[117],"performance":[118],"+39.7%":[123],"Recall@1":[124,138],"+17.8%":[126],"MRR":[127,141],"improvements":[128],"over":[129],"GPT-4-Turbo,":[130],"(2)":[131],"Consistent":[132],"enhancements":[133],"across":[134,163],"base":[135],"(24.6\u2013107.4%":[137],"15.2\u2013106.3%":[140],"Qwen2.5-Coder,":[143],"Deepseek-Coder":[144],"CodeLlama":[146],"variants),":[147],"(3)":[149],"Superior":[150],"instruction-following":[151],"capabilities":[152],"(41.5%\u2013118%":[153],"improvements)":[154],"controlled":[156],"generation":[158],"degradation":[159],"(\u20138.9%":[160],"\u201335%":[162],"architectures).":[164]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-24T00:00:00"}
