{"id":"https://openalex.org/W4415428411","doi":"https://doi.org/10.3233/faia251119","title":"PROM: Prioritize Reduction of Multiplications Over Lower Bit-Widths for Efficient CNNs","display_name":"PROM: Prioritize Reduction of Multiplications Over Lower Bit-Widths for Efficient CNNs","publication_year":2025,"publication_date":"2025-10-21","ids":{"openalex":"https://openalex.org/W4415428411","doi":"https://doi.org/10.3233/faia251119"},"language":null,"primary_location":{"id":"doi:10.3233/faia251119","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251119","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.3233/faia251119","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092991040","display_name":"Lukas Meiner","orcid":null},"institutions":[{"id":"https://openalex.org/I9341345","display_name":"University of L\u00fcbeck","ror":"https://ror.org/00t3r8h32","country_code":"DE","type":"education","lineage":["https://openalex.org/I9341345"]},{"id":"https://openalex.org/I889804353","display_name":"Robert Bosch (Germany)","ror":"https://ror.org/01fe0jt45","country_code":"DE","type":"company","lineage":["https://openalex.org/I889804353"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Lukas Meiner","raw_affiliation_strings":["Robert Bosch GmbH, Leonberg, Germany","Universit\u00e4t zu L\u00fcbeck, L\u00fcbeck, Germany"],"affiliations":[{"raw_affiliation_string":"Robert Bosch GmbH, Leonberg, Germany","institution_ids":["https://openalex.org/I889804353"]},{"raw_affiliation_string":"Universit\u00e4t zu L\u00fcbeck, L\u00fcbeck, Germany","institution_ids":["https://openalex.org/I9341345"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089696208","display_name":"Jens Mehnert","orcid":"https://orcid.org/0000-0002-0079-0036"},"institutions":[{"id":"https://openalex.org/I889804353","display_name":"Robert Bosch (Germany)","ror":"https://ror.org/01fe0jt45","country_code":"DE","type":"company","lineage":["https://openalex.org/I889804353"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jens Mehnert","raw_affiliation_strings":["Robert Bosch GmbH, Leonberg, Germany"],"affiliations":[{"raw_affiliation_string":"Robert Bosch GmbH, Leonberg, Germany","institution_ids":["https://openalex.org/I889804353"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112353924","display_name":"Alexandru Paul Condurache","orcid":null},"institutions":[{"id":"https://openalex.org/I9341345","display_name":"University of L\u00fcbeck","ror":"https://ror.org/00t3r8h32","country_code":"DE","type":"education","lineage":["https://openalex.org/I9341345"]},{"id":"https://openalex.org/I889804353","display_name":"Robert Bosch (Germany)","ror":"https://ror.org/01fe0jt45","country_code":"DE","type":"company","lineage":["https://openalex.org/I889804353"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Alexandru Paul Condurache","raw_affiliation_strings":["Robert Bosch GmbH, Leonberg, Germany","Universit\u00e4t zu L\u00fcbeck, L\u00fcbeck, Germany"],"affiliations":[{"raw_affiliation_string":"Robert Bosch GmbH, Leonberg, Germany","institution_ids":["https://openalex.org/I889804353"]},{"raw_affiliation_string":"Universit\u00e4t zu L\u00fcbeck, L\u00fcbeck, Germany","institution_ids":["https://openalex.org/I9341345"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5092991040"],"corresponding_institution_ids":["https://openalex.org/I889804353","https://openalex.org/I9341345"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.68119266,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9887999892234802,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9868999719619751,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pointwise","display_name":"Pointwise","score":0.7882999777793884},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.644599974155426},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5577999949455261},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.5045999884605408},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.4307999908924103},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.42100000381469727},{"id":"https://openalex.org/keywords/cost-reduction","display_name":"Cost reduction","score":0.4056999981403351},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.36809998750686646}],"concepts":[{"id":"https://openalex.org/C2777984123","wikidata":"https://www.wikidata.org/wiki/Q9248237","display_name":"Pointwise","level":2,"score":0.7882999777793884},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.644599974155426},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6301000118255615},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5577999949455261},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.5045999884605408},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.45969998836517334},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.4307999908924103},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.42100000381469727},{"id":"https://openalex.org/C2778820799","wikidata":"https://www.wikidata.org/wiki/Q3454688","display_name":"Cost reduction","level":2,"score":0.4056999981403351},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.36809998750686646},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3582000136375427},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.35740000009536743},{"id":"https://openalex.org/C137635306","wikidata":"https://www.wikidata.org/wiki/Q182667","display_name":"Pareto principle","level":2,"score":0.3314000070095062},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.3174000084400177},{"id":"https://openalex.org/C159423971","wikidata":"https://www.wikidata.org/wiki/Q177251","display_name":"Associative property","level":2,"score":0.3122999966144562},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2953999936580658},{"id":"https://openalex.org/C64452783","wikidata":"https://www.wikidata.org/wiki/Q1524945","display_name":"Ternary operation","level":2,"score":0.28870001435279846},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.2827000021934509},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.2718000113964081},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.27140000462532043},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.26820001006126404},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2628999948501587},{"id":"https://openalex.org/C70518039","wikidata":"https://www.wikidata.org/wiki/Q16000077","display_name":"Dimensionality reduction","level":2,"score":0.2612000107765198},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.25189998745918274}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/faia251119","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251119","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"}],"best_oa_location":{"id":"doi:10.3233/faia251119","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251119","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Convolutional":[0],"neural":[1],"networks":[2,80,204],"(CNNs)":[3],"are":[4,90],"crucial":[5],"for":[6,75,140,184,190],"computer":[7],"vision":[8],"tasks":[9],"on":[10,176,194],"resource-constrained":[11],"devices.":[12],"Quantization":[13],"effectively":[14,136],"compresses":[15],"these":[16],"models,":[17],"reducing":[18],"storage":[19,162,220],"size":[20,163],"and":[21,135,160,208,219],"energy":[22,150,185,217],"cost.":[23],"However,":[24],"in":[25],"modern":[26,77],"depthwise-separable":[27,78,202],"architectures,":[28],"the":[29,42,96,138,148,168,181,198],"computational":[30],"cost":[31,54,151,218],"is":[32,103],"distributed":[33],"unevenly":[34],"across":[35,132],"its":[36,161],"components,":[37],"with":[38,122],"pointwise":[39,88,120],"operations":[40],"being":[41],"most":[43],"expensive.":[44],"By":[45],"applying":[46],"a":[47,72,106,212],"general":[48],"quantization":[49,57],"scheme":[50],"to":[51,60,92,115,145,167,205,215],"this":[52,67],"imbalanced":[53],"distribution,":[55],"existing":[56],"approaches":[58],"fail":[59],"fully":[61],"exploit":[62],"potential":[63],"efficiency":[64],"gains.":[65],"To":[66],"end,":[68],"we":[69],"introduce":[70],"PROM,":[71],"straightforward":[73],"approach":[74],"quantizing":[76,113,201],"convolutional":[79,192,203],"by":[81,112,152,164],"selectively":[82],"using":[83],"two":[84],"distinct":[85],"bit-widths.":[86],"Specifically,":[87],"convolutions":[89,121],"quantized":[91,191],"ternary":[93,123,207],"weights,":[94,101,210],"while":[95,171],"remaining":[97],"modules":[98],"use":[99],"8-bit":[100,209],"which":[102,128],"achieved":[104],"through":[105],"simple":[107,213],"quantization-aware":[108],"training":[109],"procedure.":[110],"Additionally,":[111],"activations":[114],"8-bit,":[116],"our":[117],"method":[118,179],"transforms":[119],"weights":[124],"into":[125],"int8":[126],"additions,":[127],"enjoy":[129],"broad":[130],"support":[131],"hardware":[133],"platforms":[134],"eliminates":[137],"need":[139],"expensive":[141],"multiplications.":[142],"Applying":[143],"PROM":[144,196],"MobileNetV2":[146],"reduces":[147],"model\u2019s":[149],"more":[153],"than":[154],"an":[155],"order":[156],"of":[157,200],"magnitude":[158],"(23.9\u00d7)":[159],"2.7\u00d7":[165],"compared":[166],"float16":[169],"baseline":[170],"retaining":[172],"similar":[173],"classification":[174],"performance":[175],"ImageNet.":[177,195],"Our":[178],"advances":[180],"Pareto":[182],"frontier":[183],"consumption":[186],"vs.":[187],"top-1":[188],"accuracy":[189],"models":[193],"addresses":[197],"challenges":[199],"both":[206],"offering":[211],"way":[214],"reduce":[216],"size.":[221]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-24T00:00:00"}
