{"id":"https://openalex.org/W2773252567","doi":"https://doi.org/10.1109/smc.2017.8122616","title":"Advances in quantum reinforcement learning","display_name":"Advances in quantum reinforcement learning","publication_year":2017,"publication_date":"2017-10-01","ids":{"openalex":"https://openalex.org/W2773252567","doi":"https://doi.org/10.1109/smc.2017.8122616","mag":"2773252567"},"language":"en","primary_location":{"id":"doi:10.1109/smc.2017.8122616","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc.2017.8122616","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1811.08676","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069043772","display_name":"Vedran Dunjko","orcid":"https://orcid.org/0000-0002-2632-7955"},"institutions":[{"id":"https://openalex.org/I4210120293","display_name":"Max Planck Institute of Quantum Optics","ror":"https://ror.org/01vekys64","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210120293"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Vedran Dunjko","raw_affiliation_strings":["Institute for Theoretical Physics, Max Planck Institute of Quantum Optics, Garching, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute for Theoretical Physics, Max Planck Institute of Quantum Optics, Garching, Germany","institution_ids":["https://openalex.org/I4210120293"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101524935","display_name":"Jacob M. Taylor","orcid":"https://orcid.org/0000-0003-0493-5594"},"institutions":[{"id":"https://openalex.org/I4210151733","display_name":"Joint Quantum Institute","ror":"https://ror.org/04xz38214","country_code":"US","type":"facility","lineage":["https://openalex.org/I1321296531","https://openalex.org/I1343035065","https://openalex.org/I4210151733","https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jacob M. Taylor","raw_affiliation_strings":["Joint Quantum Institute & NIST, Maryland, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Joint Quantum Institute & NIST, Maryland, USA","institution_ids":["https://openalex.org/I4210151733"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009007803","display_name":"Hans J. Briegel","orcid":"https://orcid.org/0000-0002-9065-1565"},"institutions":[{"id":"https://openalex.org/I189712700","display_name":"University of Konstanz","ror":"https://ror.org/0546hnb39","country_code":"DE","type":"education","lineage":["https://openalex.org/I189712700"]},{"id":"https://openalex.org/I190249584","display_name":"Universit\u00e4t Innsbruck","ror":"https://ror.org/054pv6659","country_code":"AT","type":"education","lineage":["https://openalex.org/I190249584"]}],"countries":["AT","DE"],"is_corresponding":false,"raw_author_name":"Hans J. Briegel","raw_affiliation_strings":["University of Innsbruck Innsbruck 6020, Austria, and Department of Philosophy, University of Konstanz, Konstanz, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Innsbruck Innsbruck 6020, Austria, and Department of Philosophy, University of Konstanz, Konstanz, Germany","institution_ids":["https://openalex.org/I190249584","https://openalex.org/I189712700"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":3.5111,"has_fulltext":false,"cited_by_count":77,"citation_normalized_percentile":{"value":0.94378362,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"282","last_page":"287"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10020","display_name":"Quantum Information and Cryptography","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9003355503082275},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7205447554588318},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5719015598297119},{"id":"https://openalex.org/keywords/quantum","display_name":"Quantum","score":0.5177509188652039},{"id":"https://openalex.org/keywords/quantum-machine-learning","display_name":"Quantum machine learning","score":0.5129110813140869},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5026223659515381},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.47694316506385803},{"id":"https://openalex.org/keywords/quantum-computer","display_name":"Quantum computer","score":0.26353463530540466},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09216240048408508},{"id":"https://openalex.org/keywords/quantum-mechanics","display_name":"Quantum mechanics","score":0.08110129833221436}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9003355503082275},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7205447554588318},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5719015598297119},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.5177509188652039},{"id":"https://openalex.org/C2779094486","wikidata":"https://www.wikidata.org/wiki/Q18811578","display_name":"Quantum machine learning","level":4,"score":0.5129110813140869},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5026223659515381},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.47694316506385803},{"id":"https://openalex.org/C58053490","wikidata":"https://www.wikidata.org/wiki/Q176555","display_name":"Quantum computer","level":3,"score":0.26353463530540466},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09216240048408508},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.08110129833221436},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/smc.2017.8122616","is_oa":false,"landing_page_url":"https://doi.org/10.1109/smc.2017.8122616","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Systems, Man, and Cybernetics (SMC)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1811.08676","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1811.08676","pdf_url":"https://arxiv.org/pdf/1811.08676","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1811.08676","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1811.08676","pdf_url":"https://arxiv.org/pdf/1811.08676","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.8199999928474426,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W118877790","https://openalex.org/W199424061","https://openalex.org/W1823319392","https://openalex.org/W1968493380","https://openalex.org/W1994630055","https://openalex.org/W2031056773","https://openalex.org/W2051446825","https://openalex.org/W2062938319","https://openalex.org/W2079905842","https://openalex.org/W2100483895","https://openalex.org/W2103956991","https://openalex.org/W2111790732","https://openalex.org/W2121863487","https://openalex.org/W2121981260","https://openalex.org/W2127830251","https://openalex.org/W2153887174","https://openalex.org/W2257979135","https://openalex.org/W2266138411","https://openalex.org/W2489886790","https://openalex.org/W2521267242","https://openalex.org/W2590232898","https://openalex.org/W2623293810","https://openalex.org/W2914656440","https://openalex.org/W2949945034","https://openalex.org/W2962688653","https://openalex.org/W3145497935","https://openalex.org/W3217033513","https://openalex.org/W4214717370","https://openalex.org/W4298644983"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W4387806146","https://openalex.org/W2982197950","https://openalex.org/W2981886227","https://openalex.org/W4320521261","https://openalex.org/W4284897515","https://openalex.org/W3111799909"],"abstract_inverted_index":{"In":[0,120],"recent":[1],"times,":[2],"there":[3],"has":[4],"been":[5],"much":[6],"interest":[7],"in":[8,15,31,34,39,49,65,156,175],"quantum":[9,42,60,130,180],"enhancements":[10,61],"of":[11,18,28,71,98,125,128,140,163,167,179],"machine":[12],"learning,":[13,24,29],"specifically":[14],"the":[16,69,96,126,134,157,164,168],"context":[17],"data":[19],"mining":[20],"and":[21,57,159],"analysis.":[22],"Reinforcement":[23],"an":[25],"interactive":[26],"form":[27],"is,":[30,82],"turn,":[32],"vital":[33],"artificial":[35],"intelligence-type":[36],"applications.":[37],"Also":[38],"this":[40],"case,":[41],"mechanics":[43],"was":[44],"shown":[45],"to":[46,77,102,115],"be":[47,63,113,173],"useful,":[48],"certain":[50],"instances.":[51],"Here,":[52],"we":[53,122,144],"elucidate":[54],"these":[55,151],"results,":[56],"show":[58,107],"that":[59,81,84,108],"can":[62,112],"achieved":[64],"a":[66,147],"new":[67],"setting:":[68],"setting":[70],"learning":[72,89,132],"models":[73,90,94,111],"which":[74,149],"learn":[75],"how":[76],"improve":[78],"themselves":[79],"-":[80],"those":[83],"metalearn.":[85],"While":[86],"not":[87],"all":[88,92],"meta-learn,":[91],"non-trivial":[93],"have":[95],"potential":[97],"being":[99],"\"lifted\",":[100],"enhanced,":[101],"meta-learning":[103],"models.":[104],"Our":[105],"results":[106],"also":[109],"such":[110],"quantum-enhanced":[114],"make":[116],"even":[117],"better":[118],"learners.":[119],"parallel,":[121],"address":[123],"one":[124],"bottlenecks":[127],"current":[129],"reinforcement":[131,181],"approaches:":[133],"need":[135],"for":[136],"so-called":[137],"oracularized":[138],"variants":[139],"task":[141],"environments.":[142,169],"Here":[143],"elaborate":[145],"on":[146],"method":[148],"realizes":[150],"variants,":[152],"with":[153,160],"minimal":[154],"changes":[155],"setting,":[158],"no":[161],"corruption":[162],"operative":[165],"specification":[166],"This":[170],"result":[171],"may":[172],"important":[174],"near-term":[176],"experimental":[177],"demonstrations":[178],"learning.":[182]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":16},{"year":2020,"cited_by_count":9},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
