{"id":"https://openalex.org/W4364377871","doi":"https://doi.org/10.1007/s42484-023-00101-8","title":"Policy gradients using variational quantum circuits","display_name":"Policy gradients using variational quantum circuits","publication_year":2023,"publication_date":"2023-04-11","ids":{"openalex":"https://openalex.org/W4364377871","doi":"https://doi.org/10.1007/s42484-023-00101-8"},"language":"en","primary_location":{"id":"doi:10.1007/s42484-023-00101-8","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s42484-023-00101-8","pdf_url":"https://link.springer.com/content/pdf/10.1007/s42484-023-00101-8.pdf","source":{"id":"https://openalex.org/S4210217596","display_name":"Quantum Machine Intelligence","issn_l":"2524-4906","issn":["2524-4906","2524-4914"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Quantum Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s42484-023-00101-8.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035661885","display_name":"Andr\u00e9 Sequeira","orcid":"https://orcid.org/0000-0002-6659-9277"},"institutions":[{"id":"https://openalex.org/I121345201","display_name":"Instituto de Engenharia de Sistemas e Computadores Investiga\u00e7\u00e3o e Desenvolvimento","ror":"https://ror.org/04mqy3p58","country_code":"PT","type":"nonprofit","lineage":["https://openalex.org/I121345201","https://openalex.org/I4210125590"]},{"id":"https://openalex.org/I4210141319","display_name":"International Iberian Nanotechnology Laboratory","ror":"https://ror.org/04dv3aq25","country_code":"PT","type":"facility","lineage":["https://openalex.org/I4210141319"]},{"id":"https://openalex.org/I4210166615","display_name":"INESC TEC","ror":"https://ror.org/05fa8ka61","country_code":"PT","type":"nonprofit","lineage":["https://openalex.org/I4210125590","https://openalex.org/I4210166615"]},{"id":"https://openalex.org/I99682543","display_name":"University of Minho","ror":"https://ror.org/037wpkx04","country_code":"PT","type":"education","lineage":["https://openalex.org/I99682543"]}],"countries":["PT"],"is_corresponding":true,"raw_author_name":"Andr\u00e9 Sequeira","raw_affiliation_strings":["Department of Informatics, University of Minho, Braga, Portugal","HASLab, INESC TEC, Braga, Portugal","International Nanotechnology Laboratory (INL), Braga, Portugal"],"raw_orcid":"https://orcid.org/0000-0002-6659-9277","affiliations":[{"raw_affiliation_string":"Department of Informatics, University of Minho, Braga, Portugal","institution_ids":["https://openalex.org/I99682543"]},{"raw_affiliation_string":"HASLab, INESC TEC, Braga, Portugal","institution_ids":["https://openalex.org/I121345201","https://openalex.org/I4210166615"]},{"raw_affiliation_string":"International Nanotechnology Laboratory (INL), Braga, Portugal","institution_ids":["https://openalex.org/I4210141319"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014275814","display_name":"Lu\u00eds Paulo Santos","orcid":"https://orcid.org/0000-0003-4466-1129"},"institutions":[{"id":"https://openalex.org/I121345201","display_name":"Instituto de Engenharia de Sistemas e Computadores Investiga\u00e7\u00e3o e Desenvolvimento","ror":"https://ror.org/04mqy3p58","country_code":"PT","type":"nonprofit","lineage":["https://openalex.org/I121345201","https://openalex.org/I4210125590"]},{"id":"https://openalex.org/I4210141319","display_name":"International Iberian Nanotechnology Laboratory","ror":"https://ror.org/04dv3aq25","country_code":"PT","type":"facility","lineage":["https://openalex.org/I4210141319"]},{"id":"https://openalex.org/I4210166615","display_name":"INESC TEC","ror":"https://ror.org/05fa8ka61","country_code":"PT","type":"nonprofit","lineage":["https://openalex.org/I4210125590","https://openalex.org/I4210166615"]},{"id":"https://openalex.org/I99682543","display_name":"University of Minho","ror":"https://ror.org/037wpkx04","country_code":"PT","type":"education","lineage":["https://openalex.org/I99682543"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Luis Paulo Santos","raw_affiliation_strings":["Department of Informatics, University of Minho, Braga, Portugal","HASLab, INESC TEC, Braga, Portugal","International Nanotechnology Laboratory (INL), Braga, Portugal"],"raw_orcid":"https://orcid.org/0000-0003-4466-1129","affiliations":[{"raw_affiliation_string":"Department of Informatics, University of Minho, Braga, Portugal","institution_ids":["https://openalex.org/I99682543"]},{"raw_affiliation_string":"HASLab, INESC TEC, Braga, Portugal","institution_ids":["https://openalex.org/I121345201","https://openalex.org/I4210166615"]},{"raw_affiliation_string":"International Nanotechnology Laboratory (INL), Braga, Portugal","institution_ids":["https://openalex.org/I4210141319"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062334330","display_name":"Lu\u00ad\u00eds Soares Barbosa","orcid":"https://orcid.org/0000-0002-5037-2588"},"institutions":[{"id":"https://openalex.org/I121345201","display_name":"Instituto de Engenharia de Sistemas e Computadores Investiga\u00e7\u00e3o e Desenvolvimento","ror":"https://ror.org/04mqy3p58","country_code":"PT","type":"nonprofit","lineage":["https://openalex.org/I121345201","https://openalex.org/I4210125590"]},{"id":"https://openalex.org/I4210141319","display_name":"International Iberian Nanotechnology Laboratory","ror":"https://ror.org/04dv3aq25","country_code":"PT","type":"facility","lineage":["https://openalex.org/I4210141319"]},{"id":"https://openalex.org/I4210166615","display_name":"INESC TEC","ror":"https://ror.org/05fa8ka61","country_code":"PT","type":"nonprofit","lineage":["https://openalex.org/I4210125590","https://openalex.org/I4210166615"]},{"id":"https://openalex.org/I99682543","display_name":"University of Minho","ror":"https://ror.org/037wpkx04","country_code":"PT","type":"education","lineage":["https://openalex.org/I99682543"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Luis Soares Barbosa","raw_affiliation_strings":["Department of Informatics, University of Minho, Braga, Portugal","HASLab, INESC TEC, Braga, Portugal","International Nanotechnology Laboratory (INL), Braga, Portugal"],"raw_orcid":"https://orcid.org/0000-0002-5037-2588","affiliations":[{"raw_affiliation_string":"Department of Informatics, University of Minho, Braga, Portugal","institution_ids":["https://openalex.org/I99682543"]},{"raw_affiliation_string":"HASLab, INESC TEC, Braga, Portugal","institution_ids":["https://openalex.org/I121345201","https://openalex.org/I4210166615"]},{"raw_affiliation_string":"International Nanotechnology Laboratory (INL), Braga, Portugal","institution_ids":["https://openalex.org/I4210141319"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5035661885"],"corresponding_institution_ids":["https://openalex.org/I121345201","https://openalex.org/I4210141319","https://openalex.org/I4210166615","https://openalex.org/I99682543"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":3.8105,"has_fulltext":true,"cited_by_count":23,"citation_normalized_percentile":{"value":0.94562205,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":"5","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10020","display_name":"Quantum Information and Cryptography","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11804","display_name":"Quantum many-body systems","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7318245768547058},{"id":"https://openalex.org/keywords/parameterized-complexity","display_name":"Parameterized complexity","score":0.638516366481781},{"id":"https://openalex.org/keywords/quantum","display_name":"Quantum","score":0.6335196495056152},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5633887648582458},{"id":"https://openalex.org/keywords/quantum-circuit","display_name":"Quantum circuit","score":0.5077973008155823},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4985942840576172},{"id":"https://openalex.org/keywords/quantum-algorithm","display_name":"Quantum algorithm","score":0.49846696853637695},{"id":"https://openalex.org/keywords/electronic-circuit","display_name":"Electronic circuit","score":0.44928503036499023},{"id":"https://openalex.org/keywords/statistical-physics","display_name":"Statistical physics","score":0.4442101716995239},{"id":"https://openalex.org/keywords/ansatz","display_name":"Ansatz","score":0.44367364048957825},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.37653446197509766},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.36918914318084717},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33819878101348877},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.29172948002815247},{"id":"https://openalex.org/keywords/quantum-mechanics","display_name":"Quantum mechanics","score":0.21456009149551392},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.20792436599731445},{"id":"https://openalex.org/keywords/quantum-error-correction","display_name":"Quantum error correction","score":0.1808614730834961}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7318245768547058},{"id":"https://openalex.org/C165464430","wikidata":"https://www.wikidata.org/wiki/Q1570441","display_name":"Parameterized complexity","level":2,"score":0.638516366481781},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.6335196495056152},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5633887648582458},{"id":"https://openalex.org/C124148022","wikidata":"https://www.wikidata.org/wiki/Q2122210","display_name":"Quantum circuit","level":5,"score":0.5077973008155823},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4985942840576172},{"id":"https://openalex.org/C137019171","wikidata":"https://www.wikidata.org/wiki/Q2623817","display_name":"Quantum algorithm","level":3,"score":0.49846696853637695},{"id":"https://openalex.org/C134146338","wikidata":"https://www.wikidata.org/wiki/Q1815901","display_name":"Electronic circuit","level":2,"score":0.44928503036499023},{"id":"https://openalex.org/C121864883","wikidata":"https://www.wikidata.org/wiki/Q677916","display_name":"Statistical physics","level":1,"score":0.4442101716995239},{"id":"https://openalex.org/C130979935","wikidata":"https://www.wikidata.org/wiki/Q568954","display_name":"Ansatz","level":2,"score":0.44367364048957825},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.37653446197509766},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.36918914318084717},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33819878101348877},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.29172948002815247},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.21456009149551392},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.20792436599731445},{"id":"https://openalex.org/C51003876","wikidata":"https://www.wikidata.org/wiki/Q1536431","display_name":"Quantum error correction","level":4,"score":0.1808614730834961}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s42484-023-00101-8","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s42484-023-00101-8","pdf_url":"https://link.springer.com/content/pdf/10.1007/s42484-023-00101-8.pdf","source":{"id":"https://openalex.org/S4210217596","display_name":"Quantum Machine Intelligence","issn_l":"2524-4906","issn":["2524-4906","2524-4914"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Quantum Machine Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s42484-023-00101-8","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s42484-023-00101-8","pdf_url":"https://link.springer.com/content/pdf/10.1007/s42484-023-00101-8.pdf","source":{"id":"https://openalex.org/S4210217596","display_name":"Quantum Machine Intelligence","issn_l":"2524-4906","issn":["2524-4906","2524-4914"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Quantum Machine Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.5099999904632568}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4364377871.pdf"},"referenced_works_count":55,"referenced_works":["https://openalex.org/W32507011","https://openalex.org/W41554520","https://openalex.org/W1639600422","https://openalex.org/W1994630055","https://openalex.org/W2119717200","https://openalex.org/W2124269824","https://openalex.org/W2257979135","https://openalex.org/W2521267242","https://openalex.org/W2773252567","https://openalex.org/W2781738013","https://openalex.org/W2792315573","https://openalex.org/W2888774813","https://openalex.org/W2903221501","https://openalex.org/W2914552685","https://openalex.org/W2914809905","https://openalex.org/W2945680873","https://openalex.org/W2964155733","https://openalex.org/W2972032089","https://openalex.org/W2978899725","https://openalex.org/W2989847975","https://openalex.org/W3009313620","https://openalex.org/W3014487071","https://openalex.org/W3045093737","https://openalex.org/W3075559820","https://openalex.org/W3093944484","https://openalex.org/W3096052452","https://openalex.org/W3100931082","https://openalex.org/W3101427288","https://openalex.org/W3102731313","https://openalex.org/W3103145727","https://openalex.org/W3103766662","https://openalex.org/W3103898263","https://openalex.org/W3104428150","https://openalex.org/W3111162498","https://openalex.org/W3116019732","https://openalex.org/W3118210634","https://openalex.org/W3120939413","https://openalex.org/W3122688976","https://openalex.org/W3123348991","https://openalex.org/W3127561923","https://openalex.org/W3129458892","https://openalex.org/W3132743969","https://openalex.org/W3133779704","https://openalex.org/W3134827716","https://openalex.org/W3142041921","https://openalex.org/W3162607076","https://openalex.org/W3173713405","https://openalex.org/W3196475060","https://openalex.org/W3197289147","https://openalex.org/W3200849153","https://openalex.org/W3200900716","https://openalex.org/W3207479555","https://openalex.org/W4213212652","https://openalex.org/W4221149720","https://openalex.org/W4233413206"],"related_works":["https://openalex.org/W4309028366","https://openalex.org/W3203550463","https://openalex.org/W4306815925","https://openalex.org/W4281550036","https://openalex.org/W2906136444","https://openalex.org/W4310985960","https://openalex.org/W2037426566","https://openalex.org/W4375959436","https://openalex.org/W4388032411","https://openalex.org/W4289799474"],"abstract_inverted_index":{"Abstract":[0],"Variational":[1],"quantum":[2,9,41,88,103,120],"circuits":[3],"are":[4],"being":[5],"used":[6,97],"as":[7,49],"versatile":[8],"machine":[10],"learning":[11,23,56],"models.":[12],"Some":[13],"empirical":[14],"results":[15],"exhibit":[16],"an":[17,61],"advantage":[18],"in":[19,98,119],"supervised":[20],"and":[21,102],"generative":[22],"tasks.":[24],"However,":[25],"when":[26],"applied":[27],"to":[28,92],"reinforcement":[29,55],"learning,":[30],"less":[31],"is":[32],"known.":[33],"In":[34],"this":[35],"work,":[36],"we":[37,113],"considered":[38],"a":[39,45,54,72,107],"variational":[40],"circuit":[42],"composed":[43],"of":[44,53,64,75,81,109],"low-depth":[46],"hardware-efficient":[47],"ansatz":[48],"the":[50,65,78,110,115,124],"parameterized":[51],"policy":[52,66,121],"agent.":[57],"We":[58,83],"show":[59],"that":[60,86],"\ud835\udf16":[62],"-approximation":[63],"gradient":[67],"can":[68],"be":[69],"obtained":[70],"using":[71,105,123],"logarithmic":[73],"number":[74,80],"samples":[76],"concerning":[77],"total":[79],"parameters.":[82,111],"empirically":[84],"verify":[85],"such":[87],"models":[89],"behave":[90],"similarly":[91],"typical":[93],"classical":[94],"neural":[95],"networks":[96],"standard":[99],"benchmarking":[100],"environments":[101],"control,":[104],"only":[106],"fraction":[108],"Moreover,":[112],"study":[114],"barren":[116],"plateau":[117],"phenomenon":[118],"gradients":[122],"Fisher":[125],"information":[126],"matrix":[127],"spectrum.":[128]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":12},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":4}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
