{"id":"https://openalex.org/W3117731702","doi":"https://doi.org/10.1145/3437963.3441766","title":"Filter Pruning via Probabilistic Model-based Optimization for Accelerating Deep Convolutional Neural Networks","display_name":"Filter Pruning via Probabilistic Model-based Optimization for Accelerating Deep Convolutional Neural Networks","publication_year":2021,"publication_date":"2021-03-06","ids":{"openalex":"https://openalex.org/W3117731702","doi":"https://doi.org/10.1145/3437963.3441766","mag":"3117731702"},"language":"en","primary_location":{"id":"doi:10.1145/3437963.3441766","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3437963.3441766","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th ACM International Conference on Web Search and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100670298","display_name":"Qinghua Li","orcid":"https://orcid.org/0000-0001-5291-1445"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qinghua Li","raw_affiliation_strings":["Renmin University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100619237","display_name":"Cuiping Li","orcid":"https://orcid.org/0000-0003-0089-1045"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cuiping Li","raw_affiliation_strings":["Renmin University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100420423","display_name":"Hong Chen","orcid":"https://orcid.org/0000-0002-2035-6851"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hong Chen","raw_affiliation_strings":["Renmin University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100670298"],"corresponding_institution_ids":["https://openalex.org/I78988378"],"apc_list":null,"apc_paid":null,"fwci":0.3843,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.58264706,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"653","last_page":"661"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.702072024345398},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6694521903991699},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6589269042015076},{"id":"https://openalex.org/keywords/flops","display_name":"FLOPS","score":0.5675480961799622},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.5205617547035217},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.5012588500976562},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4884585440158844},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.47761791944503784},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.45364993810653687},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4399052560329437},{"id":"https://openalex.org/keywords/norm","display_name":"Norm (philosophy)","score":0.42127394676208496},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3465942144393921},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2689429521560669},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.0890498161315918},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.07005199790000916}],"concepts":[{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.702072024345398},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6694521903991699},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6589269042015076},{"id":"https://openalex.org/C3826847","wikidata":"https://www.wikidata.org/wiki/Q188768","display_name":"FLOPS","level":2,"score":0.5675480961799622},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.5205617547035217},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.5012588500976562},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4884585440158844},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.47761791944503784},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.45364993810653687},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4399052560329437},{"id":"https://openalex.org/C191795146","wikidata":"https://www.wikidata.org/wiki/Q3878446","display_name":"Norm (philosophy)","level":2,"score":0.42127394676208496},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3465942144393921},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2689429521560669},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.0890498161315918},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.07005199790000916},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3437963.3441766","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3437963.3441766","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 14th ACM International Conference on Web Search and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1935978687","https://openalex.org/W2072458630","https://openalex.org/W2117539524","https://openalex.org/W2125389748","https://openalex.org/W2141083508","https://openalex.org/W2142508340","https://openalex.org/W2147768505","https://openalex.org/W2302255633","https://openalex.org/W2554302513","https://openalex.org/W2604998962","https://openalex.org/W2798170643","https://openalex.org/W2798603777","https://openalex.org/W2808384944","https://openalex.org/W2928560789","https://openalex.org/W2962851801","https://openalex.org/W2963145730","https://openalex.org/W2963363373","https://openalex.org/W2964233199","https://openalex.org/W3007384386","https://openalex.org/W3014290610","https://openalex.org/W3104263540","https://openalex.org/W3177525997","https://openalex.org/W4233533910","https://openalex.org/W6819060087"],"related_works":["https://openalex.org/W2898360562","https://openalex.org/W3191582637","https://openalex.org/W3119066197","https://openalex.org/W4286251925","https://openalex.org/W3047530476","https://openalex.org/W4200040586","https://openalex.org/W2788715907","https://openalex.org/W2770717529","https://openalex.org/W2767651786","https://openalex.org/W2912288872"],"abstract_inverted_index":{"Accelerating":[0],"Deep":[1],"Convolutional":[2],"Neural":[3],"Networks(CNNs)":[4],"has":[5,20],"recently":[6],"received":[7],"ever-increasing":[8],"research":[9],"focus.":[10],"Among":[11],"various":[12],"approaches":[13,73],"proposed":[14,168],"in":[15,33,104,141,182],"the":[16,67,79,82,93,96,105,113,134,160,171,176,179,183,193,240],"literature,":[17],"filter":[18,86,109,121,242],"pruning":[19,60,122,139,148,154,161,172,184,243],"been":[21],"regarded":[22],"as":[23,99],"a":[24,119,142,147],"promising":[25],"solution,":[26],"which":[27],"is":[28,155,167,198],"due":[29],"to":[30,52,169,188],"its":[31],"advantage":[32],"significant":[34],"speedup":[35],"and":[36,43,61,153],"memory":[37],"reduction":[38],"of":[39,69,81,95,108,115,136,178,195],"both":[40],"network":[41],"model":[42,98,181],"intermediate":[44],"feature":[45],"maps.":[46],"Previous":[47],"works":[48],"utilized":[49],"\"smaller-norm-less-important\"":[50],"criterion":[51],"prune":[53,75,85],"filters":[54,76,83,140],"with":[55,87,212],"smaller":[56],"lp-norm":[57,89],"values":[58],"by":[59,138,157],"retraining":[62],"alternately.":[63],"However,":[64],"they":[65],"ignore":[66],"effects":[68],"$feedback:":[70],"most":[71],"current":[72],"that":[74,236],"only":[77],"consider":[78],"statistics":[80],"(e.g.,":[84],"small":[88],"values),":[90],"without":[91,230],"considering":[92],"performance":[94,177],"pruned":[97,180],"an":[100],"important":[101],"feedback":[102],"signal":[103],"next":[106],"iteration":[107],"pruning.":[110],"To":[111],"solve":[112],"problem":[114,135],"non-feedback,":[116],"we":[117],"propose":[118],"novel":[120],"method,":[123],"namely":[124],"Filter":[125],"Pruning":[126],"via":[127],"Probabilistic":[128],"Model-based":[129],"Optimization":[130],"(FPPMO).":[131],"FPPMO":[132,197,204,222,238],"solves":[133],"non-feedback":[137],"probabilistic":[143],"manner.":[144],"We":[145],"introduce":[146],"probability":[149,162,173],"for":[150],"each":[151],"filter,":[152],"guided":[156],"sampling":[158],"from":[159],"distribution.":[163],"An":[164],"optimization":[165],"method":[166],"update":[170],"based":[174],"on":[175,201,210,219,228],"process.":[185],"When":[186],"applied":[187],"two":[189],"image":[190],"classification":[191],"benchmarks,":[192],"effectiveness":[194],"our":[196,203,221,237],"validated.":[199],"Notably,":[200],"CIFAR-10,":[202],"reduces":[205,223],"more":[206,224],"than":[207,225],"57%":[208],"FLOPs":[209,227],"ResNet-110":[211],"even":[213],"0.08%":[214],"relative":[215],"accuracy":[216,232],"improvement.":[217],"Moreover,":[218],"ILSVRC-2012,":[220],"50%":[226],"ResNet-101":[229],"top-5":[231],"drop.":[233],"Which":[234],"proving":[235],"outperforms":[239],"state-of-the-art":[241],"method.":[244]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
