{"id":"https://openalex.org/W7125629137","doi":"https://doi.org/10.1109/jiot.2026.3654102","title":"Adaptive Pruning for Large Language Models With Structural Importance Awareness","display_name":"Adaptive Pruning for Large Language Models With Structural Importance Awareness","publication_year":2026,"publication_date":"2026-01-23","ids":{"openalex":"https://openalex.org/W7125629137","doi":"https://doi.org/10.1109/jiot.2026.3654102"},"language":"en","primary_location":{"id":"doi:10.1109/jiot.2026.3654102","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2026.3654102","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123818525","display_name":"Haotian Zheng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haotian Zheng","raw_affiliation_strings":["Shenzhen Future Network of Intelligence Institute (FNii-Shenzhen), The Chinese University of Hong Kong, Shenzhen, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Future Network of Intelligence Institute (FNii-Shenzhen), The Chinese University of Hong Kong, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I4210116924"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123671884","display_name":"Jinke Ren","orcid":null},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinke Ren","raw_affiliation_strings":["School of Science and Engineering, FNii-Shenzhen, and Guangdong Provincial Key Laboratory of Future Networks of Intelligence, The Chinese University of Hong Kong, Shenzhen, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"School of Science and Engineering, FNii-Shenzhen, and Guangdong Provincial Key Laboratory of Future Networks of Intelligence, The Chinese University of Hong Kong, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I4210116924"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101198400","display_name":"Yatong Han","orcid":null},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yatong Han","raw_affiliation_strings":["FNii-Shenzhen, The Chinese University of Hong Kong, Shenzhen, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"FNii-Shenzhen, The Chinese University of Hong Kong, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I4210116924"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123810731","display_name":"Yushan Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yushan Sun","raw_affiliation_strings":["National Key Laboratory of Autonomous Marine Vehicle Technology, Harbin Engineering University, Harbin, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Autonomous Marine Vehicle Technology, Harbin Engineering University, Harbin, China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049587970","display_name":"Ruichen Zhang","orcid":"https://orcid.org/0000-0002-6859-3645"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Ruichen Zhang","raw_affiliation_strings":["College of Computing and Data Science, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"College of Computing and Data Science, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123786077","display_name":"Wenbo Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wenbo Zhang","raw_affiliation_strings":["Hangzhou RoboCT Technology Development Company Ltd., Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Hangzhou RoboCT Technology Development Company Ltd., Hangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089372152","display_name":"Z. Merrick Li","orcid":"https://orcid.org/0000-0002-7421-4779"},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhen Li","raw_affiliation_strings":["School of Science and Engineering, FNii-Shenzhen, and Guangdong Provincial Key Laboratory of Future Networks of Intelligence, The Chinese University of Hong Kong, Shenzhen, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"School of Science and Engineering, FNii-Shenzhen, and Guangdong Provincial Key Laboratory of Future Networks of Intelligence, The Chinese University of Hong Kong, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I4210116924"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123796573","display_name":"Dusit Niyato","orcid":null},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Dusit Niyato","raw_affiliation_strings":["College of Computing and Data Science, Nanyang Technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"College of Computing and Data Science, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009164482","display_name":"Shuguang Cui","orcid":"https://orcid.org/0000-0003-2608-775X"},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuguang Cui","raw_affiliation_strings":["School of Science and Engineering, FNii-Shenzhen, and Guangdong Provincial Key Laboratory of Future Networks of Intelligence, The Chinese University of Hong Kong, Shenzhen, Guangdong, China"],"affiliations":[{"raw_affiliation_string":"School of Science and Engineering, FNii-Shenzhen, and Guangdong Provincial Key Laboratory of Future Networks of Intelligence, The Chinese University of Hong Kong, Shenzhen, Guangdong, China","institution_ids":["https://openalex.org/I4210116924"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5123818525"],"corresponding_institution_ids":["https://openalex.org/I4210116924"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.19721716,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"13","issue":"7","first_page":"14882","last_page":"14897"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.23899999260902405,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.23899999260902405,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.1891999989748001,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.043699998408555984,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5555999875068665},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.5533999800682068},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.45190000534057617},{"id":"https://openalex.org/keywords/context-model","display_name":"Context model","score":0.40070000290870667},{"id":"https://openalex.org/keywords/language-understanding","display_name":"Language understanding","score":0.39100000262260437},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.33160001039505005}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8273000121116638},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6439999938011169},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5555999875068665},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.5533999800682068},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4803999960422516},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.45190000534057617},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4465999901294708},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.40070000290870667},{"id":"https://openalex.org/C2983448237","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Language understanding","level":2,"score":0.39100000262260437},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.33160001039505005},{"id":"https://openalex.org/C129792486","wikidata":"https://www.wikidata.org/wiki/Q1050419","display_name":"Language identification","level":3,"score":0.32600000500679016},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3107999861240387},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2906000018119812},{"id":"https://openalex.org/C179603123","wikidata":"https://www.wikidata.org/wiki/Q1941921","display_name":"Modeling language","level":3,"score":0.29030001163482666},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.25600001215934753},{"id":"https://openalex.org/C3020028006","wikidata":"https://www.wikidata.org/wiki/Q9158","display_name":"Electronic mail","level":2,"score":0.25540000200271606}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/jiot.2026.3654102","is_oa":false,"landing_page_url":"https://doi.org/10.1109/jiot.2026.3654102","pdf_url":null,"source":{"id":"https://openalex.org/S2480266640","display_name":"IEEE Internet of Things Journal","issn_l":"2327-4662","issn":["2327-4662","2372-2541"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Internet of Things Journal","raw_type":"journal-article"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/212005","is_oa":false,"landing_page_url":"https://hdl.handle.net/10356/212005","pdf_url":null,"source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4636031687259674,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1566289585","https://openalex.org/W1632114991","https://openalex.org/W2890894339","https://openalex.org/W2946609015","https://openalex.org/W2996908057","https://openalex.org/W2998617917","https://openalex.org/W4285294723","https://openalex.org/W4386083031","https://openalex.org/W4393147854","https://openalex.org/W4399768834","https://openalex.org/W4400945784","https://openalex.org/W4401635364","https://openalex.org/W4401726555","https://openalex.org/W4402670757","https://openalex.org/W4404134026","https://openalex.org/W4404918643","https://openalex.org/W4405717632","https://openalex.org/W4405887239","https://openalex.org/W4405934565","https://openalex.org/W4406458045","https://openalex.org/W4415799087","https://openalex.org/W7133233472"],"related_works":[],"abstract_inverted_index":{"The":[0],"recent":[1],"advancements":[2],"in":[3,95],"large":[4],"language":[5,11],"models":[6],"(LLMs)":[7],"have":[8],"significantly":[9],"enhanced":[10],"understanding":[12],"and":[13,36,58,167,186,191],"content":[14],"generation":[15],"capabilities.":[16],"However,":[17],"the":[18,92,141,144,150,194,218,223],"deployment":[19,239],"of":[20,25,101,143,152,183,232],"LLMs":[21,62,161],"on":[22,115,158,188,203,240],"resource-constrained":[23,241],"Internet":[24],"Things":[26],"(IoT)":[27],"devices":[28],"remains":[29],"challenging":[30],"due":[31],"to":[32,55,74,90,123,217],"their":[33],"substantial":[34],"computational":[35,57],"storage":[37,59],"requirements.":[38],"To":[39,148],"address":[40,91],"this":[41],"issue,":[42],"we":[43,154],"propose":[44],"a":[45,86,109,128,204,229],"novel":[46],"LLM":[47,81,145],"pruning":[48,53,126,195,230],"method,":[49],"termed":[50],"structurally-aware":[51],"adaptive":[52],"(SAAP),":[54],"reduce":[56],"costs":[60],"for":[61,80,104,139,237],"while":[63],"maintaining":[64],"model":[65],"performance.":[66],"Specifically,":[67],"SAAP":[68,107,132,174,200,221],"first":[69],"leverages":[70],"maximum":[71],"likelihood":[72],"estimation":[73],"calibrate":[75],"traditional":[76],"structural":[77,102],"importance":[78,103,111,121],"metrics":[79],"pruning.":[82,147],"Next,":[83],"it":[84],"employs":[85],"Bayesian":[87],"fusion":[88],"approach":[89],"predictive":[93],"uncertainty":[94],"multi-granularity":[96],"metrics,":[97],"enabling":[98],"accurate":[99],"assessments":[100],"LLMs.":[105],"Then,":[106],"introduces":[108],"cross-layer":[110],"alignment":[112],"mechanism":[113],"based":[114],"quantile":[116],"mapping,":[117],"which":[118],"normalizes":[119],"layer-wise":[120],"scores":[122],"ensure":[124],"consistent":[125],"from":[127],"global":[129],"perspective.":[130],"Furthermore,":[131],"develops":[133],"an":[134],"efficient":[135],"block-wise":[136],"fine-tuning":[137],"strategy":[138],"enhancing":[140],"performance":[142],"after":[146],"validate":[149],"effectiveness":[151],"SAAP,":[153],"conduct":[155],"extensive":[156],"experiments":[157],"nine":[159],"open-source":[160],"across":[162],"two":[163],"representative":[164],"tasks\u2014language":[165],"modeling":[166],"zero-shot":[168],"classification.":[169],"Experimental":[170],"results":[171,213],"show":[172],"that":[173,215],"consistently":[175],"outperforms":[176],"several":[177],"baseline":[178],"methods,":[179],"achieving":[180],"accuracy":[181],"improvements":[182],"2.5%,":[184],"2.63%,":[185],"2.44%":[187],"LLaMA-7B,":[189],"Vicuna-7B,":[190],"LLaMA-13B":[192],"when":[193],"ratio":[196,231],"is":[197,201],"50%.":[198],"Finally,":[199],"implemented":[202],"testbed\u2014NVIDIA":[205],"Jetson":[206],"AGX":[207],"Orin":[208],"32GB":[209],"Developer":[210],"Kit.":[211],"Test":[212],"demonstrate":[214],"compared":[216],"foundation":[219],"LLM,":[220],"enhances":[222],"inference":[224],"speed":[225],"by":[226],"86.86%":[227],"at":[228],"50%,":[233],"highlighting":[234],"its":[235],"potential":[236],"practical":[238],"IoT":[242],"devices.":[243]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2026-01-26T00:00:00"}
