{"id":"https://openalex.org/W4415492722","doi":"https://doi.org/10.1142/s0218001425580042","title":"Efficient Compression of Large Language Model based on Hybrid Layer and Channel Pruning","display_name":"Efficient Compression of Large Language Model based on Hybrid Layer and Channel Pruning","publication_year":2025,"publication_date":"2025-10-24","ids":{"openalex":"https://openalex.org/W4415492722","doi":"https://doi.org/10.1142/s0218001425580042"},"language":"en","primary_location":{"id":"doi:10.1142/s0218001425580042","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0218001425580042","pdf_url":null,"source":{"id":"https://openalex.org/S41486457","display_name":"International Journal of Pattern Recognition and Artificial Intelligence","issn_l":"0218-0014","issn":["0218-0014","1793-6381"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Pattern Recognition and Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052034358","display_name":"Ruixuan Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]},{"id":"https://openalex.org/I17442442","display_name":"State Grid Corporation of China (China)","ror":"https://ror.org/05twwhs70","country_code":"CN","type":"company","lineage":["https://openalex.org/I17442442"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruixuan Lu","raw_affiliation_strings":["School of Electrical Engineering and Automation, Anhui University, Hefei, Anhui 230039, P.\u00a0R.\u00a0China","State Grid Anhui Electric Power Co., Ltd. Information and Communication Branch, Hefei, Anhui 230061, P.\u00a0R.\u00a0China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Automation, Anhui University, Hefei, Anhui 230039, P.\u00a0R.\u00a0China","institution_ids":["https://openalex.org/I143868143"]},{"raw_affiliation_string":"State Grid Anhui Electric Power Co., Ltd. Information and Communication Branch, Hefei, Anhui 230061, P.\u00a0R.\u00a0China","institution_ids":["https://openalex.org/I17442442"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049652197","display_name":"Kun Jing","orcid":"https://orcid.org/0000-0001-9028-8869"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kun Jing","raw_affiliation_strings":["School of Internet, Anhui University, Hefei, Anhui 230039, P.\u00a0R.\u00a0China"],"raw_orcid":"https://orcid.org/0000-0001-9028-8869","affiliations":[{"raw_affiliation_string":"School of Internet, Anhui University, Hefei, Anhui 230039, P.\u00a0R.\u00a0China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024606762","display_name":"Shichuan Ding","orcid":"https://orcid.org/0000-0001-6435-8210"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shichuan Ding","raw_affiliation_strings":["School of Electrical Engineering and Automation, Anhui University, Hefei, Anhui 230039, P.\u00a0R.\u00a0China"],"raw_orcid":"https://orcid.org/0000-0001-6435-8210","affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Automation, Anhui University, Hefei, Anhui 230039, P.\u00a0R.\u00a0China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017935525","display_name":"Zhaohong Jia","orcid":"https://orcid.org/0000-0001-6607-7025"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhaohong Jia","raw_affiliation_strings":["School of Internet, Anhui University, Hefei, Anhui 230039, P.\u00a0R.\u00a0China"],"raw_orcid":"https://orcid.org/0000-0001-6607-7025","affiliations":[{"raw_affiliation_string":"School of Internet, Anhui University, Hefei, Anhui 230039, P.\u00a0R.\u00a0China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034197623","display_name":"Jun Hang","orcid":"https://orcid.org/0000-0003-2950-431X"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Hang","raw_affiliation_strings":["School of Electrical Engineering and Automation, Anhui University, Hefei, Anhui 230039, P.\u00a0R.\u00a0China"],"raw_orcid":"https://orcid.org/0000-0003-2950-431X","affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Automation, Anhui University, Hefei, Anhui 230039, P.\u00a0R.\u00a0China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052525241","display_name":"Xiaoping Huang","orcid":"https://orcid.org/0009-0002-1627-0219"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoping Huang","raw_affiliation_strings":["School of Internet, Anhui University, Hefei, Anhui 230039, P.\u00a0R.\u00a0China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Internet, Anhui University, Hefei, Anhui 230039, P.\u00a0R.\u00a0China","institution_ids":["https://openalex.org/I143868143"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14327233,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"39","issue":"16","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.8919000029563904,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.8919000029563904,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.8195000290870667,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.7631000280380249,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.8949000239372253},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5360000133514404},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.5360000133514404},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5349000096321106},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.4814000129699707},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.4810999929904938},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.453000009059906},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.42289999127388}],"concepts":[{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.8949000239372253},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8282999992370605},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.5360000133514404},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5360000133514404},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5349000096321106},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.4814000129699707},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4810999929904938},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.453000009059906},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44929999113082886},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.42289999127388},{"id":"https://openalex.org/C2221639","wikidata":"https://www.wikidata.org/wiki/Q2877","display_name":"Discrete cosine transform","level":3,"score":0.4050999879837036},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.39649999141693115},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.388700008392334},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37310001254081726},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.3264000117778778},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.31130000948905945},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.29750001430511475},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.29750001430511475},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.29249998927116394},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2702000141143799},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2653000056743622},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2531999945640564}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1142/s0218001425580042","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0218001425580042","pdf_url":null,"source":{"id":"https://openalex.org/S41486457","display_name":"International Journal of Pattern Recognition and Artificial Intelligence","issn_l":"0218-0014","issn":["0218-0014","1793-6381"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Pattern Recognition and Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W2064675550","https://openalex.org/W2110485445","https://openalex.org/W3130144398","https://openalex.org/W4285340871","https://openalex.org/W4385571335","https://openalex.org/W4385948838","https://openalex.org/W4391857750","https://openalex.org/W4404460707","https://openalex.org/W4404918643"],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2],"(LLMs)":[3],"are":[4],"constrained":[5],"by":[6,138],"their":[7,59],"large":[8],"parameter":[9],"size":[10],"and":[11,31,52,105,125,152],"high":[12],"computational":[13],"resource":[14],"consumption,":[15],"making":[16],"deployment":[17,30,61],"on":[18,50,73,88,103,149,156],"terminal":[19],"devices":[20],"with":[21],"limited":[22],"computing":[23],"resources":[24],"difficult.":[25],"This":[26],"severely":[27],"hinders":[28],"the":[29,132],"application":[32],"of":[33],"LLMs":[34],"in":[35,62,82],"power":[36,63],"grid":[37,64],"systems.":[38,65],"To":[39],"address":[40],"this,":[41],"we":[42],"propose":[43],"a":[44,79,110,117,143],"hybrid":[45],"structured":[46,150],"pruning":[47,54,112,124,127,158],"method":[48,67,115],"based":[49,72,87],"layer":[51],"channel":[53],"to":[55,93,122],"compress":[56],"LLMs,":[57],"enabling":[58],"efficient":[60],"Our":[66,140],"first":[68],"removes":[69],"noncritical":[70],"layers":[71],"inter-layer":[74],"cosine":[75],"similarity,":[76],"thereby":[77],"achieving":[78],"significant":[80],"reduction":[81],"model":[83,95,133],"parameters.":[84],"Then":[85],"channel-pruning":[86],"PCA":[89],"is":[90,136],"employed,":[91],"aiming":[92],"improve":[94],"inference":[96,134],"speed":[97,135],"while":[98],"preserving":[99],"performance.":[100],"Experimental":[101],"results":[102],"Wikitext2":[104],"PTB":[106],"demonstrate":[107],"that":[108],"at":[109],"30%":[111],"rate,":[113],"our":[114],"exhibits":[116],"superior":[118],"performance":[119],"retention":[120],"compared":[121],"single-layer":[123],"channel-wise":[126],"methods.":[128],"For":[129],"generation":[130],"tasks,":[131],"increased":[137],"5.91%.":[139],"work":[141],"provides":[142],"novel":[144],"insight":[145],"for":[146],"future":[147],"research":[148,155],"pruning,":[151],"inspires":[153],"more":[154],"composite":[157],"from":[159],"multi-dimensional":[160],"perspectives.":[161]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-24T00:00:00"}
