{"id":"https://openalex.org/W4416874763","doi":"https://doi.org/10.1109/qce65121.2025.10326","title":"Quantum Reinforcement Learning by Adaptive Non-Local Observables","display_name":"Quantum Reinforcement Learning by Adaptive Non-Local Observables","publication_year":2025,"publication_date":"2025-08-30","ids":{"openalex":"https://openalex.org/W4416874763","doi":"https://doi.org/10.1109/qce65121.2025.10326"},"language":null,"primary_location":{"id":"doi:10.1109/qce65121.2025.10326","is_oa":false,"landing_page_url":"https://doi.org/10.1109/qce65121.2025.10326","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Quantum Computing and Engineering (QCE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100652782","display_name":"Hsin-Yi Lin","orcid":"https://orcid.org/0000-0001-5731-2353"},"institutions":[{"id":"https://openalex.org/I12524447","display_name":"Seton Hall University","ror":"https://ror.org/007tn5k56","country_code":"US","type":"education","lineage":["https://openalex.org/I12524447"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hsin-Yi Lin","raw_affiliation_strings":["Seton Hall University,Department of Mathematics and Computer Science,South Orange,NJ,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Seton Hall University,Department of Mathematics and Computer Science,South Orange,NJ,USA","institution_ids":["https://openalex.org/I12524447"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021414038","display_name":"Samuel Yen-Chi Chen","orcid":"https://orcid.org/0000-0003-0114-4826"},"institutions":[{"id":"https://openalex.org/I166794780","display_name":"Wells Fargo (United States)","ror":"https://ror.org/037r2ff59","country_code":"US","type":"company","lineage":["https://openalex.org/I166794780"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Samuel Yen-Chi Chen","raw_affiliation_strings":["Wells Fargo,New York,NY,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Wells Fargo,New York,NY,USA","institution_ids":["https://openalex.org/I166794780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034788095","display_name":"H. Eric Tseng","orcid":"https://orcid.org/0000-0001-9544-4226"},"institutions":[{"id":"https://openalex.org/I200870766","display_name":"Brookhaven National Laboratory","ror":"https://ror.org/02ex6cf31","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I200870766","https://openalex.org/I39565521","https://openalex.org/I4210142672"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Huan-Hsin Tseng","raw_affiliation_strings":["Brookhaven National Laboratory,AI &#x0026; ML Department,Upton,NY,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Brookhaven National Laboratory,AI &#x0026; ML Department,Upton,NY,USA","institution_ids":["https://openalex.org/I200870766"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048176207","display_name":"Shinjae Yoo","orcid":"https://orcid.org/0000-0003-4378-6448"},"institutions":[{"id":"https://openalex.org/I200870766","display_name":"Brookhaven National Laboratory","ror":"https://ror.org/02ex6cf31","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I200870766","https://openalex.org/I39565521","https://openalex.org/I4210142672"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shinjae Yoo","raw_affiliation_strings":["Brookhaven National Laboratory,AI &#x0026; ML Department,Upton,NY,USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Brookhaven National Laboratory,AI &#x0026; ML Department,Upton,NY,USA","institution_ids":["https://openalex.org/I200870766"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7588,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.89740663,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"241","last_page":"246"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.919700026512146,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.919700026512146,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11804","display_name":"Quantum many-body systems","score":0.026100000366568565,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10020","display_name":"Quantum Information and Cryptography","score":0.01549999974668026,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/observable","display_name":"Observable","score":0.8420000076293945},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8108000159263611},{"id":"https://openalex.org/keywords/quantum","display_name":"Quantum","score":0.5986999869346619},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5968000292778015},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5285000205039978},{"id":"https://openalex.org/keywords/temporal-difference-learning","display_name":"Temporal difference learning","score":0.46790000796318054},{"id":"https://openalex.org/keywords/asynchronous-communication","display_name":"Asynchronous communication","score":0.4377000033855438},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.41370001435279846},{"id":"https://openalex.org/keywords/quantum-gate","display_name":"Quantum gate","score":0.37610000371932983}],"concepts":[{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.8420000076293945},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8108000159263611},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.5986999869346619},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5968000292778015},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5461999773979187},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5285000205039978},{"id":"https://openalex.org/C196340769","wikidata":"https://www.wikidata.org/wiki/Q7698910","display_name":"Temporal difference learning","level":3,"score":0.46790000796318054},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.4377000033855438},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.41370001435279846},{"id":"https://openalex.org/C58849907","wikidata":"https://www.wikidata.org/wiki/Q2118982","display_name":"Quantum gate","level":4,"score":0.37610000371932983},{"id":"https://openalex.org/C124148022","wikidata":"https://www.wikidata.org/wiki/Q2122210","display_name":"Quantum circuit","level":5,"score":0.36230000853538513},{"id":"https://openalex.org/C150072547","wikidata":"https://www.wikidata.org/wiki/Q212923","display_name":"Memristor","level":2,"score":0.34060001373291016},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3345000147819519},{"id":"https://openalex.org/C2778926657","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum system","level":3,"score":0.329800009727478},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.31610000133514404},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.30820000171661377},{"id":"https://openalex.org/C134146338","wikidata":"https://www.wikidata.org/wiki/Q1815901","display_name":"Electronic circuit","level":2,"score":0.3050000071525574},{"id":"https://openalex.org/C58053490","wikidata":"https://www.wikidata.org/wiki/Q176555","display_name":"Quantum computer","level":3,"score":0.3041999936103821},{"id":"https://openalex.org/C107464732","wikidata":"https://www.wikidata.org/wiki/Q235781","display_name":"Adaptive control","level":3,"score":0.3041999936103821},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.2971000075340271},{"id":"https://openalex.org/C184720557","wikidata":"https://www.wikidata.org/wiki/Q7825049","display_name":"Topology (electrical circuits)","level":2,"score":0.29269999265670776},{"id":"https://openalex.org/C137019171","wikidata":"https://www.wikidata.org/wiki/Q2623817","display_name":"Quantum algorithm","level":3,"score":0.2775999903678894},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2720000147819519},{"id":"https://openalex.org/C15706264","wikidata":"https://www.wikidata.org/wiki/Q230883","display_name":"Quantum state","level":3,"score":0.2685000002384186},{"id":"https://openalex.org/C73586568","wikidata":"https://www.wikidata.org/wiki/Q2600211","display_name":"Parameter space","level":2,"score":0.26170000433921814}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/qce65121.2025.10326","is_oa":false,"landing_page_url":"https://doi.org/10.1109/qce65121.2025.10326","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Quantum Computing and Engineering (QCE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5720546791","display_name":null,"funder_award_id":"DE-AC02-05CH11231,HEPERCAP0033786","funder_id":"https://openalex.org/F4320317220","funder_display_name":"National Energy Research Scientific Computing Center"}],"funders":[{"id":"https://openalex.org/F4320317220","display_name":"National Energy Research Scientific Computing Center","ror":"https://ror.org/05v3mvq14"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W2015811642","https://openalex.org/W2145339207","https://openalex.org/W2275410481","https://openalex.org/W2559394418","https://openalex.org/W2755255888","https://openalex.org/W2781738013","https://openalex.org/W2790388700","https://openalex.org/W2798434869","https://openalex.org/W2896712926","https://openalex.org/W2898401615","https://openalex.org/W2954939433","https://openalex.org/W2980446414","https://openalex.org/W2990961515","https://openalex.org/W3045093737","https://openalex.org/W3075559820","https://openalex.org/W3093944484","https://openalex.org/W3111162498","https://openalex.org/W3141755656","https://openalex.org/W3196514226","https://openalex.org/W4213212652","https://openalex.org/W4313566505","https://openalex.org/W4386336967","https://openalex.org/W4392305618","https://openalex.org/W4399493235","https://openalex.org/W4410770879"],"related_works":[],"abstract_inverted_index":{"Hybrid":[0],"quantum-classical":[1],"frameworks":[2],"leverage":[3],"quantum":[4,11,30,92],"computing":[5],"for":[6,29],"machine":[7],"learning;":[8],"however,":[9],"variational":[10],"circuits":[12],"(VQCs)":[13],"are":[14],"limited":[15],"by":[16],"local":[17],"measurements.":[18,40],"We":[19],"introduce":[20],"an":[21],"adaptive":[22,72,86],"non-local":[23],"observable":[24],"(ANO)":[25],"paradigm":[26],"within":[27],"VQCs":[28],"reinforcement":[31,95],"learning":[32],"(QRL),":[33],"jointly":[34],"optimizing":[35],"circuit":[36,80],"parameters":[37],"and":[38,53],"multi-qubit":[39,87],"The":[41],"ANO-VQC":[42],"architecture":[43],"serves":[44],"as":[45],"the":[46,75],"function":[47,76],"approximator":[48],"in":[49,94],"Deep":[50],"Q-Network":[51],"(DQN)":[52],"Asynchronous":[54],"Advantage":[55],"Actor-Critic":[56],"(A3C)":[57],"algorithms.":[58],"On":[59],"multiple":[60],"benchmark":[61],"tasks,":[62],"ANOVQC":[63],"agents":[64],"outperform":[65],"baseline":[66],"VQCs.":[67],"Ablation":[68],"studies":[69],"reveal":[70],"that":[71,85],"measurements":[73],"enhance":[74],"space":[77],"without":[78],"increasing":[79],"depth.":[81],"Our":[82],"results":[83],"demonstrate":[84],"observables":[88],"can":[89],"enable":[90],"practical":[91],"advantages":[93],"learning.":[96]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-12-01T00:00:00"}
