{"id":"https://openalex.org/W4409687655","doi":"https://doi.org/10.32604/cmc.2025.062980","title":"Reinforcement Learning for Solving the Knapsack Problem","display_name":"Reinforcement Learning for Solving the Knapsack Problem","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4409687655","doi":"https://doi.org/10.32604/cmc.2025.062980"},"language":"en","primary_location":{"id":"doi:10.32604/cmc.2025.062980","is_oa":true,"landing_page_url":"https://doi.org/10.32604/cmc.2025.062980","pdf_url":null,"source":{"id":"https://openalex.org/S4210191605","display_name":"Computers, materials & continua/Computers, materials & continua (Print)","issn_l":"1546-2218","issn":["1546-2218","1546-2226"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers, Materials &amp; Continua","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.32604/cmc.2025.062980","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019795083","display_name":"Zhenfu Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhenfu Zhang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026660809","display_name":"Haiyan Yin","orcid":"https://orcid.org/0009-0007-9576-9398"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haiyan Yin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Liudong Zuo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liudong Zuo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5014790039","display_name":"Pan Lai","orcid":"https://orcid.org/0000-0002-4967-5573"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pan Lai","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5019795083"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.2618,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.87886142,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"84","issue":"1","first_page":"919","last_page":"936"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11814","display_name":"Advanced Manufacturing and Logistics Optimization","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11814","display_name":"Advanced Manufacturing and Logistics Optimization","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12176","display_name":"Optimization and Packing Problems","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10551","display_name":"Scheduling and Optimization Algorithms","score":0.9800000190734863,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/knapsack-problem","display_name":"Knapsack problem","score":0.8880903124809265},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7815068960189819},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.6506840586662292},{"id":"https://openalex.org/keywords/continuous-knapsack-problem","display_name":"Continuous knapsack problem","score":0.5151461362838745},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.4968855679035187},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4514642059803009},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32315897941589355},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.29719021916389465},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.15994760394096375},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.06697586178779602}],"concepts":[{"id":"https://openalex.org/C113138325","wikidata":"https://www.wikidata.org/wiki/Q864457","display_name":"Knapsack problem","level":2,"score":0.8880903124809265},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7815068960189819},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.6506840586662292},{"id":"https://openalex.org/C94569963","wikidata":"https://www.wikidata.org/wiki/Q5165487","display_name":"Continuous knapsack problem","level":3,"score":0.5151461362838745},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4968855679035187},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4514642059803009},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32315897941589355},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.29719021916389465},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.15994760394096375},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.06697586178779602}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.32604/cmc.2025.062980","is_oa":true,"landing_page_url":"https://doi.org/10.32604/cmc.2025.062980","pdf_url":null,"source":{"id":"https://openalex.org/S4210191605","display_name":"Computers, materials & continua/Computers, materials & continua (Print)","issn_l":"1546-2218","issn":["1546-2218","1546-2226"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers, Materials &amp; Continua","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.32604/cmc.2025.062980","is_oa":true,"landing_page_url":"https://doi.org/10.32604/cmc.2025.062980","pdf_url":null,"source":{"id":"https://openalex.org/S4210191605","display_name":"Computers, materials & continua/Computers, materials & continua (Print)","issn_l":"1546-2218","issn":["1546-2218","1546-2226"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers, Materials &amp; Continua","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.5799999833106995,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W1586409345","https://openalex.org/W1776713878","https://openalex.org/W1968058578","https://openalex.org/W1972300623","https://openalex.org/W2089047615","https://openalex.org/W2101493843","https://openalex.org/W2128105951","https://openalex.org/W2145339207","https://openalex.org/W2257979135","https://openalex.org/W2890515088","https://openalex.org/W2919115771","https://openalex.org/W2991046523","https://openalex.org/W3192302584","https://openalex.org/W4283264203","https://openalex.org/W4383112908","https://openalex.org/W4390322843"],"related_works":["https://openalex.org/W246960280","https://openalex.org/W2087209118","https://openalex.org/W2168163332","https://openalex.org/W2005493932","https://openalex.org/W179363847","https://openalex.org/W2381035939","https://openalex.org/W2145407993","https://openalex.org/W2378557713","https://openalex.org/W2141701778","https://openalex.org/W3169691842"],"abstract_inverted_index":{"The":[0,213,233],"knapsack":[1,107],"problem":[2,8,36,47,64,86,108,193],"is":[3],"a":[4,98,120,158,257,273],"classical":[5],"combinatorial":[6],"optimization":[7,279],"widely":[9],"encountered":[10],"in":[11,33,161,183,226,250,262,281],"areas":[12],"such":[13,245],"as":[14,45,129,246],"logistics,":[15],"resource":[16],"allocation,":[17],"and":[18,27,43,57,125,136,270,287],"portfolio":[19],"optimization.":[20],"Traditional":[21],"methods,":[22],"including":[23],"dynamic":[24],"programming":[25],"(DP)":[26],"greedy":[28,70],"algorithms,":[29,168],"have":[30],"been":[31],"effective":[32],"solving":[34],"small":[35],"instances":[37],"but":[38,75,254],"often":[39],"struggle":[40],"with":[41],"scalability":[42],"efficiency":[44],"the":[46,67,80,85,106,111,115,133,146,165,198,201,209,219,223,247],"size":[48],"increases.":[49],"DP,":[50],"for":[51,62,191,276],"instance,":[52],"has":[53],"exponential":[54],"time":[55,288],"complexity":[56],"can":[58],"become":[59],"computationally":[60],"prohibitive":[61],"large":[63,91],"instances.":[65,194],"On":[66],"other":[68],"hand,":[69],"algorithms":[71],"offer":[72],"faster":[73],"solutions":[74],"may":[76],"not":[77,239],"always":[78],"yield":[79],"optimal":[81],"results,":[82],"especially":[83],"when":[84],"involves":[87],"complex":[88],"constraints":[89],"or":[90],"numbers":[92],"of":[93,145,185,200,215,222,231,252,267],"items.":[94,151],"This":[95,152,265],"paper":[96],"introduces":[97],"novel":[99,153],"reinforcement":[100],"learning":[101,116],"(RL)":[102],"approach":[103,238],"to":[104,132,141,157,164],"solve":[105],"by":[109,179,204],"enhancing":[110],"state":[112,154],"representation":[113,121],"within":[114],"environment.":[117],"We":[118],"propose":[119],"where":[122,284],"item":[123,137],"weights":[124],"volumes":[126],"are":[127,139,289],"expressed":[128],"ratios":[130],"relative":[131],"knapsack\u2019s":[134],"capacity,":[135],"values":[138],"normalized":[140],"represent":[142],"their":[143],"percentage":[144],"total":[147],"value":[148],"across":[149],"all":[150],"modification":[155],"leads":[156],"5%":[159],"improvement":[160,259],"accuracy":[162,229,269],"compared":[163],"state-of-the-art":[166],"RL-based":[167,175],"while":[169],"significantly":[170],"reducing":[171],"execution":[172],"time.":[173],"Our":[174],"method":[176],"outperforms":[177,241],"DP":[178,261],"over":[180],"9000":[181],"times":[182],"terms":[184,251],"speed,":[186],"making":[187],"it":[188],"highly":[189],"scalable":[190],"larger":[192],"Furthermore,":[195],"we":[196],"improve":[197],"performance":[199],"RL":[202,243],"model":[203,249],"incorporating":[205],"Noisy":[206,216],"layers":[207,217],"into":[208],"neural":[210],"network":[211],"architecture.":[212],"addition":[214],"enhances":[218],"exploration":[220],"capabilities":[221],"agent,":[224],"resulting":[225],"an":[227],"additional":[228],"boost":[230],"0.2%\u20130.5%.":[232],"results":[234],"demonstrate":[235],"that":[236],"our":[237],"only":[240],"existing":[242],"techniques,":[244],"Transformer":[248],"accuracy,":[253],"also":[255],"provides":[256],"substantial":[258],"than":[260],"computational":[263],"efficiency.":[264],"combination":[266],"enhanced":[268],"speed":[271],"presents":[272],"promising":[274],"solution":[275],"tackling":[277],"large-scale":[278],"problems":[280],"real-world":[282],"applications,":[283],"both":[285],"precision":[286],"critical":[290],"factors.":[291]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
