{"id":"https://openalex.org/W3093720865","doi":"https://doi.org/10.1088/2632-2153/abc328","title":"Reinforcement learning enhanced quantum-inspired algorithm for combinatorial optimization","display_name":"Reinforcement learning enhanced quantum-inspired algorithm for combinatorial optimization","publication_year":2020,"publication_date":"2020-10-20","ids":{"openalex":"https://openalex.org/W3093720865","doi":"https://doi.org/10.1088/2632-2153/abc328","mag":"3093720865"},"language":"en","primary_location":{"id":"doi:10.1088/2632-2153/abc328","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/abc328","pdf_url":"https://iopscience.iop.org/article/10.1088/2632-2153/abc328/pdf","source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://iopscience.iop.org/article/10.1088/2632-2153/abc328/pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033938244","display_name":"Dmitrii Beloborodov","orcid":null},"institutions":[{"id":"https://openalex.org/I4210139586","display_name":"Russian Quantum Center","ror":"https://ror.org/03v8t4025","country_code":"RU","type":"facility","lineage":["https://openalex.org/I4210139586"]}],"countries":["RU"],"is_corresponding":true,"raw_author_name":"Dmitrii Beloborodov","raw_affiliation_strings":["Russian Quantum Center, Moscow, Russia"],"affiliations":[{"raw_affiliation_string":"Russian Quantum Center, Moscow, Russia","institution_ids":["https://openalex.org/I4210139586"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043326371","display_name":"Alexander E. Ulanov","orcid":"https://orcid.org/0000-0003-2211-559X"},"institutions":[{"id":"https://openalex.org/I4210139586","display_name":"Russian Quantum Center","ror":"https://ror.org/03v8t4025","country_code":"RU","type":"facility","lineage":["https://openalex.org/I4210139586"]}],"countries":["RU"],"is_corresponding":false,"raw_author_name":"A E Ulanov","raw_affiliation_strings":["Russian Quantum Center, Moscow, Russia"],"affiliations":[{"raw_affiliation_string":"Russian Quantum Center, Moscow, Russia","institution_ids":["https://openalex.org/I4210139586"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059094093","display_name":"Jakob Foerster","orcid":"https://orcid.org/0000-0001-9688-2498"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jakob N Foerster","raw_affiliation_strings":["Department of Computer Science, University of Oxford, Oxford, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Oxford, Oxford, United Kingdom","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056879203","display_name":"Shimon Whiteson","orcid":null},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Shimon Whiteson","raw_affiliation_strings":["Department of Computer Science, University of Oxford, Oxford, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Oxford, Oxford, United Kingdom","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040418974","display_name":"A. I. Lvovsky","orcid":"https://orcid.org/0000-0003-3165-6654"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]},{"id":"https://openalex.org/I4210139586","display_name":"Russian Quantum Center","ror":"https://ror.org/03v8t4025","country_code":"RU","type":"facility","lineage":["https://openalex.org/I4210139586"]}],"countries":["GB","RU"],"is_corresponding":false,"raw_author_name":"A I Lvovsky","raw_affiliation_strings":["Department of Physics, University of Oxford, Oxford, United Kingdom","Russian Quantum Center, Moscow, Russia"],"affiliations":[{"raw_affiliation_string":"Department of Physics, University of Oxford, Oxford, United Kingdom","institution_ids":["https://openalex.org/I40120149"]},{"raw_affiliation_string":"Russian Quantum Center, Moscow, Russia","institution_ids":["https://openalex.org/I4210139586"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5033938244"],"corresponding_institution_ids":["https://openalex.org/I4210139586"],"apc_list":{"value":1600,"currency":"GBP","value_usd":1962},"apc_paid":{"value":1600,"currency":"GBP","value_usd":1962},"fwci":1.509,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.86584476,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"2","issue":"2","first_page":"025009","last_page":"025009"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12002","display_name":"Computability, Logic, AI Algorithms","score":0.970300018787384,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13182","display_name":"Quantum-Dot Cellular Automata","score":0.9606000185012817,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8688664436340332},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5464068055152893},{"id":"https://openalex.org/keywords/quantum","display_name":"Quantum","score":0.5141194462776184},{"id":"https://openalex.org/keywords/optimization-algorithm","display_name":"Optimization algorithm","score":0.48908430337905884},{"id":"https://openalex.org/keywords/combinatorial-optimization","display_name":"Combinatorial optimization","score":0.4115336835384369},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.40121346712112427},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.38837945461273193},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.29118359088897705},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.20888912677764893},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.11205399036407471},{"id":"https://openalex.org/keywords/quantum-mechanics","display_name":"Quantum mechanics","score":0.08264845609664917}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8688664436340332},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5464068055152893},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.5141194462776184},{"id":"https://openalex.org/C2987595161","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Optimization algorithm","level":2,"score":0.48908430337905884},{"id":"https://openalex.org/C52692508","wikidata":"https://www.wikidata.org/wiki/Q1333872","display_name":"Combinatorial optimization","level":2,"score":0.4115336835384369},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.40121346712112427},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38837945461273193},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.29118359088897705},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.20888912677764893},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.11205399036407471},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.08264845609664917}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1088/2632-2153/abc328","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/abc328","pdf_url":"https://iopscience.iop.org/article/10.1088/2632-2153/abc328/pdf","source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1088/2632-2153/abc328","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/abc328","pdf_url":"https://iopscience.iop.org/article/10.1088/2632-2153/abc328/pdf","source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.6200000047683716,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G4905048667","display_name":null,"funder_award_id":"19-71-10092","funder_id":"https://openalex.org/F4320324099","funder_display_name":"Russian Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320324099","display_name":"Russian Science Foundation","ror":"https://ror.org/03y2gwe85"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3093720865.pdf","grobid_xml":"https://content.openalex.org/works/W3093720865.grobid-xml"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W1501413300","https://openalex.org/W1568345435","https://openalex.org/W1981276685","https://openalex.org/W2010526455","https://openalex.org/W2013520638","https://openalex.org/W2024060531","https://openalex.org/W2042214415","https://openalex.org/W2118518847","https://openalex.org/W2138537392","https://openalex.org/W2281273319","https://openalex.org/W2507756961","https://openalex.org/W2533968486","https://openalex.org/W2538025098","https://openalex.org/W2607264901","https://openalex.org/W2612690371","https://openalex.org/W2617411258","https://openalex.org/W2736601468","https://openalex.org/W2772709170","https://openalex.org/W2809824610","https://openalex.org/W2810649880","https://openalex.org/W2897628955","https://openalex.org/W2899130070","https://openalex.org/W2914109135","https://openalex.org/W2922429874","https://openalex.org/W2948610381","https://openalex.org/W2951846985","https://openalex.org/W2953054324","https://openalex.org/W2963867952","https://openalex.org/W2964054038","https://openalex.org/W2970706905","https://openalex.org/W2990613907","https://openalex.org/W2995206647","https://openalex.org/W3104153566","https://openalex.org/W3104824731","https://openalex.org/W3143219376"],"related_works":["https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W4380318855","https://openalex.org/W2138720691","https://openalex.org/W2031695474","https://openalex.org/W2586732548","https://openalex.org/W3049728571","https://openalex.org/W3102694108","https://openalex.org/W4309955903","https://openalex.org/W3013871151"],"abstract_inverted_index":{"Quantum":[0],"hardware":[1],"and":[2,88,130,135],"quantum-inspired":[3,34],"algorithms":[4,14],"are":[5],"becoming":[6],"increasingly":[7],"popular":[8],"for":[9,20],"combinatorial":[10],"optimization.":[11],"However,":[12],"these":[13],"may":[15],"require":[16],"careful":[17],"hyperparameter":[18,138],"tuning":[19,57],"each":[21],"problem":[22,99,126],"instance.":[23],"We":[24,70],"use":[25],"a":[26,33,72,81,136],"reinforcement":[27],"learning":[28,107],"agent":[29,52,91,110],"in":[30],"conjunction":[31],"with":[32,62,127],"algorithm":[35,55],"to":[36,46,123],"solve":[37],"the":[38,47,54,63,90,124],"Ising":[39,125],"energy":[40],"minimization":[41],"problem,":[42],"which":[43],"is":[44],"equivalent":[45],"Maximum":[48],"Cut":[49],"problem.":[50],"The":[51,95],"controls":[53],"by":[56,104],"one":[58],"of":[59,65,85],"its":[60],"parameters":[61],"goal":[64],"improving":[66],"recently":[67],"seen":[68],"solutions.":[69],"propose":[71],"new":[73],"Rescaled":[74],"Ranked":[75],"Reward":[76],"(R3)":[77],"method":[78],"that":[79],"enables":[80],"stable":[82],"single-player":[83],"version":[84],"self-play":[86],"training":[87,96],"helps":[89],"escape":[92],"local":[93],"optima.":[94],"on":[97,112],"any":[98],"instance":[100],"can":[101],"be":[102],"accelerated":[103],"applying":[105],"transfer":[106],"from":[108],"an":[109],"trained":[111],"randomly":[113],"generated":[114],"problems.":[115],"Our":[116],"approach":[117],"allows":[118],"sampling":[119],"high":[120,128],"quality":[121],"solutions":[122],"probability":[129],"outperforms":[131],"both":[132],"baseline":[133],"heuristics":[134],"black-box":[137],"optimization":[139],"approach.":[140]},"counts_by_year":[{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
