{"id":"https://openalex.org/W7152096143","doi":"https://doi.org/10.48550/arxiv.2604.05856","title":"Neural Network Pruning via QUBO Optimization","display_name":"Neural Network Pruning via QUBO Optimization","publication_year":2026,"publication_date":"2026-04-07","ids":{"openalex":"https://openalex.org/W7152096143","doi":"https://doi.org/10.48550/arxiv.2604.05856"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.05856","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05856","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.05856","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5095070141","display_name":"Osama Orabi","orcid":"https://orcid.org/0009-0000-0028-315X"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Orabi, Osama","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116325799","display_name":"Artur Zagitov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zagitov, Artur","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095070139","display_name":"Hadi Salloum","orcid":"https://orcid.org/0009-0005-6068-0532"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Salloum, Hadi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133184316","display_name":"Viktor A. Lobachev","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lobachev, Viktor A.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122390411","display_name":"Kasymkhan Khubiev","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Khubiev, Kasymkhan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5077533023","display_name":"Yaroslav Kholodov","orcid":"https://orcid.org/0000-0003-2466-1594"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kholodov, Yaroslav","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5095070141"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.28450000286102295,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.28450000286102295,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.1785999983549118,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.13030000030994415,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.6021000146865845},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.5393000245094299},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.48420000076293945},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.4555000066757202},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.450300008058548},{"id":"https://openalex.org/keywords/combinatorial-optimization","display_name":"Combinatorial optimization","score":0.4169999957084656},{"id":"https://openalex.org/keywords/optimization-problem","display_name":"Optimization problem","score":0.40790000557899475},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.39570000767707825},{"id":"https://openalex.org/keywords/submodular-set-function","display_name":"Submodular set function","score":0.38929998874664307}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6036999821662903},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.6021000146865845},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.5393000245094299},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.48420000076293945},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4634999930858612},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.4555000066757202},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.450300008058548},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.43070000410079956},{"id":"https://openalex.org/C52692508","wikidata":"https://www.wikidata.org/wiki/Q1333872","display_name":"Combinatorial optimization","level":2,"score":0.4169999957084656},{"id":"https://openalex.org/C137836250","wikidata":"https://www.wikidata.org/wiki/Q984063","display_name":"Optimization problem","level":2,"score":0.40790000557899475},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.39570000767707825},{"id":"https://openalex.org/C178621042","wikidata":"https://www.wikidata.org/wiki/Q7631710","display_name":"Submodular set function","level":2,"score":0.38929998874664307},{"id":"https://openalex.org/C51823790","wikidata":"https://www.wikidata.org/wiki/Q504353","display_name":"Greedy algorithm","level":2,"score":0.37709999084472656},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.37229999899864197},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.35040000081062317},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3456999957561493},{"id":"https://openalex.org/C3309286","wikidata":"https://www.wikidata.org/wiki/Q4907693","display_name":"Bilevel optimization","level":3,"score":0.3449999988079071},{"id":"https://openalex.org/C177179195","wikidata":"https://www.wikidata.org/wiki/Q7268372","display_name":"Quadratic unconstrained binary optimization","level":4,"score":0.33640000224113464},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33070001006126404},{"id":"https://openalex.org/C129844170","wikidata":"https://www.wikidata.org/wiki/Q41299","display_name":"Quadratic equation","level":2,"score":0.3149999976158142},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.3075999915599823},{"id":"https://openalex.org/C98036226","wikidata":"https://www.wikidata.org/wiki/Q7268356","display_name":"Quadratic assignment problem","level":3,"score":0.298799991607666},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.2987000048160553},{"id":"https://openalex.org/C115908005","wikidata":"https://www.wikidata.org/wiki/Q2668364","display_name":"Combinatorial explosion","level":2,"score":0.29670000076293945},{"id":"https://openalex.org/C21200559","wikidata":"https://www.wikidata.org/wiki/Q7451068","display_name":"Sensitivity (control systems)","level":2,"score":0.29649999737739563},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.2944999933242798},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.28299999237060547},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2824000120162964},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.2797999978065491},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.27559998631477356},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2687999904155731},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.2572000026702881}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.05856","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05856","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.05856","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05856","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Neural":[0],"network":[1,209],"pruning":[2,179],"can":[3],"be":[4],"formulated":[5],"as":[6,29],"a":[7,36,60,120,137,141,147],"combinatorial":[8,72,193,201],"optimization":[9,26,132],"problem,":[10],"yet":[11],"most":[12],"existing":[13],"approaches":[14],"rely":[15],"on":[16,50,162],"greedy":[17,177],"heuristics":[18],"that":[19,65,150,169],"ignore":[20],"complex":[21],"interactions":[22],"between":[23],"filters.":[24],"Formal":[25],"methods":[27],"such":[28],"Quadratic":[30],"Unconstrained":[31],"Binary":[32],"Optimization":[33],"(QUBO)":[34],"provide":[35],"principled":[37],"alternative":[38],"but":[39],"have":[40],"so":[41],"far":[42],"underperformed":[43],"due":[44],"to":[45,107,124],"oversimplified":[46],"objective":[47,106],"formulations":[48,202],"based":[49],"metrics":[51,79],"like":[52],"the":[53,90,99,104,131,152,157,163,170,197],"L1-norm.":[54],"In":[55],"this":[56],"work,":[57],"we":[58,135],"propose":[59],"unified":[61],"Hybrid":[62,172],"QUBO":[63,105,173],"framework":[64],"bridges":[66],"heuristic":[67],"importance":[68],"estimation":[69],"with":[70,184],"global":[71],"optimization.":[73],"Our":[74],"formulation":[75],"integrates":[76],"gradient-aware":[77],"sensitivity":[78],"-":[80,88,146],"specifically":[81],"first-order":[82],"Taylor":[83,178],"and":[84,113,180,206],"second-order":[85],"Fisher":[86],"information":[87],"into":[89],"linear":[91],"term,":[92],"while":[93],"utilizing":[94],"data-driven":[95],"activation":[96],"similarity":[97],"in":[98],"quadratic":[100],"term.":[101],"This":[102,195],"allows":[103],"jointly":[108],"capture":[109],"individual":[110],"filter":[111],"relevance":[112],"inter-filter":[114],"functional":[115],"redundancy.":[116],"We":[117],"further":[118,188],"introduce":[119],"dynamic":[121],"capacity-driven":[122],"search":[123],"strictly":[125],"enforce":[126],"target":[127],"sparsity":[128],"without":[129],"distorting":[130],"landscape.":[133],"Finally,":[134],"employ":[136],"two-stage":[138],"pipeline":[139],"featuring":[140],"Tensor-Train":[142],"(TT)":[143],"Refinement":[144,186],"stage":[145],"gradient-free":[148],"optimizer":[149],"fine-tunes":[151],"QUBO-derived":[153],"solution":[154],"directly":[155],"against":[156],"true":[158],"evaluation":[159],"metric.":[160],"Experiments":[161],"SIDD":[164],"image":[165],"denoising":[166],"dataset":[167],"demonstrate":[168],"proposed":[171],"significantly":[174],"outperforms":[175],"both":[176],"traditional":[181],"L1-based":[182],"QUBO,":[183],"TT":[185],"providing":[187],"consistent":[189],"gains":[190],"at":[191],"appropriate":[192],"scales.":[194],"highlights":[196],"potential":[198],"of":[199],"hybrid":[200],"for":[203],"robust,":[204],"scalable,":[205],"interpretable":[207],"neural":[208],"compression.":[210]},"counts_by_year":[],"updated_date":"2026-04-09T06:13:59.934233","created_date":"2026-04-09T00:00:00"}
