{"id":"https://openalex.org/W4416251594","doi":"https://doi.org/10.1109/ijcnn64981.2025.11227985","title":"Efficient LLMs with AMP: Attention Heads and MLP Pruning","display_name":"Efficient LLMs with AMP: Attention Heads and MLP Pruning","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4416251594","doi":"https://doi.org/10.1109/ijcnn64981.2025.11227985"},"language":null,"primary_location":{"id":"doi:10.1109/ijcnn64981.2025.11227985","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn64981.2025.11227985","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5107738951","display_name":"Leandro Giusti Mugnaini","orcid":null},"institutions":[{"id":"https://openalex.org/I4210129339","display_name":"Funda\u00e7\u00e3o Escola de Sociologia e Pol\u00edtica de S\u00e3o Paulo","ror":"https://ror.org/036rdqh43","country_code":"BR","type":"nonprofit","lineage":["https://openalex.org/I4210129339"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Leandro Giusti Mugnaini","raw_affiliation_strings":["Escola Polit&#x00E9;cnica"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Escola Polit&#x00E9;cnica","institution_ids":["https://openalex.org/I4210129339"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070659570","display_name":"Bruno Lopes Yamamoto","orcid":null},"institutions":[{"id":"https://openalex.org/I4210129339","display_name":"Funda\u00e7\u00e3o Escola de Sociologia e Pol\u00edtica de S\u00e3o Paulo","ror":"https://ror.org/036rdqh43","country_code":"BR","type":"nonprofit","lineage":["https://openalex.org/I4210129339"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Bruno Lopes Yamamoto","raw_affiliation_strings":["Escola Polit&#x00E9;cnica"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Escola Polit&#x00E9;cnica","institution_ids":["https://openalex.org/I4210129339"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017514975","display_name":"L. Alc\u00e1ntara","orcid":"https://orcid.org/0000-0001-8644-4443"},"institutions":[{"id":"https://openalex.org/I4210129339","display_name":"Funda\u00e7\u00e3o Escola de Sociologia e Pol\u00edtica de S\u00e3o Paulo","ror":"https://ror.org/036rdqh43","country_code":"BR","type":"nonprofit","lineage":["https://openalex.org/I4210129339"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Lucas Lauton de Alcantara","raw_affiliation_strings":["Escola Polit&#x00E9;cnica"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Escola Polit&#x00E9;cnica","institution_ids":["https://openalex.org/I4210129339"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120499611","display_name":"Victor Zacarias","orcid":null},"institutions":[{"id":"https://openalex.org/I2799978770","display_name":"X-Fab (Germany)","ror":"https://ror.org/030bh9196","country_code":"DE","type":"company","lineage":["https://openalex.org/I2799978770"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Victor Zacarias","raw_affiliation_strings":["Universidade de S&#x00E3;o Paulo,Instituto de Matem&#x00E1;tica e Estat&#x00ED;stica,S&#x00E3;o Paulo,Brazil"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universidade de S&#x00E3;o Paulo,Instituto de Matem&#x00E1;tica e Estat&#x00ED;stica,S&#x00E3;o Paulo,Brazil","institution_ids":["https://openalex.org/I2799978770"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085487887","display_name":"Edson Bollis","orcid":"https://orcid.org/0000-0002-0993-784X"},"institutions":[{"id":"https://openalex.org/I4210107081","display_name":"Xenobe Research Institute","ror":"https://ror.org/01pb5g963","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210107081"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Edson Bollis","raw_affiliation_strings":["Instituto de Ci&#x00EA;ncia e Tecnologia Ita&#x00FA; (ICTi),S&#x00E3;o Paulo,Brazil"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Instituto de Ci&#x00EA;ncia e Tecnologia Ita&#x00FA; (ICTi),S&#x00E3;o Paulo,Brazil","institution_ids":["https://openalex.org/I4210107081"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038120583","display_name":"Lucas Francisco Amaral Orosco Pellicer","orcid":"https://orcid.org/0000-0003-2827-7602"},"institutions":[{"id":"https://openalex.org/I4210107081","display_name":"Xenobe Research Institute","ror":"https://ror.org/01pb5g963","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210107081"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lucas Pellicer","raw_affiliation_strings":["Instituto de Ci&#x00EA;ncia e Tecnologia Ita&#x00FA; (ICTi),S&#x00E3;o Paulo,Brazil"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Instituto de Ci&#x00EA;ncia e Tecnologia Ita&#x00FA; (ICTi),S&#x00E3;o Paulo,Brazil","institution_ids":["https://openalex.org/I4210107081"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069264027","display_name":"Anna Helena Reali Costa","orcid":"https://orcid.org/0000-0001-7309-4528"},"institutions":[{"id":"https://openalex.org/I4210129339","display_name":"Funda\u00e7\u00e3o Escola de Sociologia e Pol\u00edtica de S\u00e3o Paulo","ror":"https://ror.org/036rdqh43","country_code":"BR","type":"nonprofit","lineage":["https://openalex.org/I4210129339"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Anna Helena Reali Costa","raw_affiliation_strings":["Escola Polit&#x00E9;cnica"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Escola Polit&#x00E9;cnica","institution_ids":["https://openalex.org/I4210129339"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112859940","display_name":"Artur Jord\u00e3o","orcid":null},"institutions":[{"id":"https://openalex.org/I4210129339","display_name":"Funda\u00e7\u00e3o Escola de Sociologia e Pol\u00edtica de S\u00e3o Paulo","ror":"https://ror.org/036rdqh43","country_code":"BR","type":"nonprofit","lineage":["https://openalex.org/I4210129339"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Artur Jordao","raw_affiliation_strings":["Escola Polit&#x00E9;cnica"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Escola Polit&#x00E9;cnica","institution_ids":["https://openalex.org/I4210129339"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7588,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.89545935,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.20170000195503235,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.20170000195503235,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.10980000346899033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.10530000180006027,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.8294000029563904},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.618399977684021},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5939000248908997},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5738000273704529},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.49230000376701355},{"id":"https://openalex.org/keywords/automation","display_name":"Automation","score":0.424699991941452},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4230000078678131},{"id":"https://openalex.org/keywords/multilayer-perceptron","display_name":"Multilayer perceptron","score":0.4066999852657318}],"concepts":[{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.8294000029563904},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6887000203132629},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6830999851226807},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.618399977684021},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6173999905586243},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5939000248908997},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5738000273704529},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.49230000376701355},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.424699991941452},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4230000078678131},{"id":"https://openalex.org/C179717631","wikidata":"https://www.wikidata.org/wiki/Q2991667","display_name":"Multilayer perceptron","level":3,"score":0.4066999852657318},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.40450000762939453},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3747999966144562},{"id":"https://openalex.org/C60908668","wikidata":"https://www.wikidata.org/wiki/Q690207","display_name":"Perceptron","level":3,"score":0.37040001153945923},{"id":"https://openalex.org/C169900460","wikidata":"https://www.wikidata.org/wiki/Q2200417","display_name":"Cognition","level":2,"score":0.3603000044822693},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.3450999855995178},{"id":"https://openalex.org/C193221554","wikidata":"https://www.wikidata.org/wiki/Q5153664","display_name":"Commonsense reasoning","level":2,"score":0.34150001406669617},{"id":"https://openalex.org/C158600405","wikidata":"https://www.wikidata.org/wiki/Q5054566","display_name":"Causal inference","level":2,"score":0.31529998779296875},{"id":"https://openalex.org/C115086926","wikidata":"https://www.wikidata.org/wiki/Q17004651","display_name":"Causal reasoning","level":3,"score":0.27309998869895935}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn64981.2025.11227985","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn64981.2025.11227985","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W2946609015","https://openalex.org/W2996908057","https://openalex.org/W2998617917","https://openalex.org/W4223937247","https://openalex.org/W4312690709","https://openalex.org/W4393147854","https://openalex.org/W4401726555","https://openalex.org/W4402683730","https://openalex.org/W4404918643","https://openalex.org/W4415796952"],"related_works":[],"abstract_inverted_index":{"Deep":[0],"learning":[1],"drives":[2],"a":[3,65,88,154],"new":[4],"wave":[5],"in":[6,40,51,132,176],"computing":[7],"systems":[8],"and":[9,44,85,106,121,192],"triggers":[10],"the":[11,55,59,112,123,140,181],"automation":[12],"of":[13,125,183,188],"increasingly":[14],"complex":[15],"problems.":[16],"In":[17,77,136],"particular,":[18,137],"Large":[19],"Language":[20],"Models":[21],"(LLMs)":[22],"have":[23],"significantly":[24],"advanced":[25],"cognitive":[26],"tasks,":[27],"often":[28,129],"matching":[29],"or":[30,134],"even":[31],"surpassing":[32],"human-level":[33],"performance.":[34,164],"However,":[35],"their":[36],"extensive":[37],"parameters":[38],"result":[39],"high":[41],"computational":[42],"costs":[43],"slow":[45],"inference,":[46],"posing":[47],"challenges":[48],"for":[49,174],"deployment":[50,175],"resource-limited":[52],"settings.":[53],"Among":[54],"strategies":[56],"to":[57,149],"overcome":[58],"aforementioned":[60],"challenges,":[61],"pruning":[62,91,156],"emerges":[63],"as":[64],"successful":[66],"mechanism":[67],"since":[68],"it":[69,172],"reduces":[70],"model":[71],"size":[72],"while":[73],"maintaining":[74],"predictive":[75],"ability.":[76],"this":[78],"paper,":[79],"we":[80],"introduce":[81],"AMP:":[82],"Attention":[83,104],"Heads":[84],"MLP":[86],"Pruning,":[87],"novel":[89],"structured":[90],"method":[92],"that":[93],"efficiently":[94],"compresses":[95],"LLMs":[96],"by":[97,147],"removing":[98],"less":[99],"critical":[100],"structures":[101],"within":[102],"Multi-Head":[103],"(MHA)":[105],"Multilayer":[107],"Perceptron":[108],"(MLP).":[109],"By":[110],"projecting":[111],"input":[113],"data":[114],"onto":[115],"weights,":[116],"AMP":[117,138,166,184],"assesses":[118],"structural":[119],"importance":[120],"overcomes":[122],"limitations":[124],"existing":[126],"techniques,":[127],"which":[128],"fall":[130],"short":[131],"flexibility":[133,182],"efficiency.":[135],"surpasses":[139],"current":[141],"state-of-the-art":[142],"on":[143,161,185],"commonsense":[144],"reasoning":[145],"tasks":[146],"up":[148],"1.49":[150],"percentage":[151],"points,":[152],"achieving":[153],"30%":[155],"ratio":[157],"with":[158],"minimal":[159],"impact":[160],"zero-shot":[162],"task":[163],"Moreover,":[165],"also":[167],"improves":[168],"inference":[169],"speeds,":[170],"making":[171],"well-suited":[173],"resource-constrained":[177],"environments.":[178],"We":[179],"confirm":[180],"different":[186],"families":[187],"LLMs,":[189],"including":[190],"LLaMA":[191],"Phi.":[193]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-11-14T00:00:00"}
