{"id":"https://openalex.org/W7160421993","doi":"https://doi.org/10.48550/arxiv.2605.03434","title":"Quantum Hierarchical Reinforcement Learning via Variational Quantum Circuits","display_name":"Quantum Hierarchical Reinforcement Learning via Variational Quantum Circuits","publication_year":2026,"publication_date":"2026-05-05","ids":{"openalex":"https://openalex.org/W7160421993","doi":"https://doi.org/10.48550/arxiv.2605.03434"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.03434","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.03434","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.03434","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135441709","display_name":"Yu-Ting Lee","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lee, Yu-Ting","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135512157","display_name":"Samuel Yen-Chi Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Samuel Yen-Chi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135447208","display_name":"Fu-Chieh Chang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chang, Fu-Chieh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.96670001745224,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.96670001745224,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10020","display_name":"Quantum Information and Cryptography","score":0.01600000075995922,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11804","display_name":"Quantum many-body systems","score":0.002899999963119626,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7786999940872192},{"id":"https://openalex.org/keywords/quantum","display_name":"Quantum","score":0.6180999875068665},{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.5827999711036682},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.462799996137619},{"id":"https://openalex.org/keywords/quantum-algorithm","display_name":"Quantum algorithm","score":0.4498000144958496},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.44179999828338623},{"id":"https://openalex.org/keywords/quantum-machine-learning","display_name":"Quantum machine learning","score":0.37459999322891235},{"id":"https://openalex.org/keywords/quantum-system","display_name":"Quantum system","score":0.3718000054359436},{"id":"https://openalex.org/keywords/quantum-computer","display_name":"Quantum computer","score":0.37139999866485596},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3677999973297119}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7786999940872192},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6187000274658203},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.6180999875068665},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.5827999711036682},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.462799996137619},{"id":"https://openalex.org/C137019171","wikidata":"https://www.wikidata.org/wiki/Q2623817","display_name":"Quantum algorithm","level":3,"score":0.4498000144958496},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4431000053882599},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.44179999828338623},{"id":"https://openalex.org/C2779094486","wikidata":"https://www.wikidata.org/wiki/Q18811578","display_name":"Quantum machine learning","level":4,"score":0.37459999322891235},{"id":"https://openalex.org/C2778926657","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum system","level":3,"score":0.3718000054359436},{"id":"https://openalex.org/C58053490","wikidata":"https://www.wikidata.org/wiki/Q176555","display_name":"Quantum computer","level":3,"score":0.37139999866485596},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3677999973297119},{"id":"https://openalex.org/C184720557","wikidata":"https://www.wikidata.org/wiki/Q7825049","display_name":"Topology (electrical circuits)","level":2,"score":0.35120001435279846},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3472000062465668},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.34139999747276306},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.3411000072956085},{"id":"https://openalex.org/C124148022","wikidata":"https://www.wikidata.org/wiki/Q2122210","display_name":"Quantum circuit","level":5,"score":0.3231000006198883},{"id":"https://openalex.org/C50897621","wikidata":"https://www.wikidata.org/wiki/Q2665508","display_name":"Hybrid system","level":2,"score":0.31310001015663147},{"id":"https://openalex.org/C58849907","wikidata":"https://www.wikidata.org/wiki/Q2118982","display_name":"Quantum gate","level":4,"score":0.31130000948905945},{"id":"https://openalex.org/C134146338","wikidata":"https://www.wikidata.org/wiki/Q1815901","display_name":"Electronic circuit","level":2,"score":0.30979999899864197},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.28679999709129333},{"id":"https://openalex.org/C186468114","wikidata":"https://www.wikidata.org/wiki/Q836478","display_name":"Quantum network","level":4,"score":0.2766999900341034},{"id":"https://openalex.org/C67820243","wikidata":"https://www.wikidata.org/wiki/Q179164","display_name":"Unitary state","level":2,"score":0.27059999108314514},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.2687999904155731},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.25929999351501465},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.257999986410141},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.2563999891281128},{"id":"https://openalex.org/C199185054","wikidata":"https://www.wikidata.org/wiki/Q552299","display_name":"Chain (unit)","level":2,"score":0.2563999891281128},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.2547000050544739},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.2524000108242035},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.03434","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.03434","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.03434","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.03434","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.6646456122398376}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,8,20],"is":[2,21],"one":[3],"of":[4,135],"the":[5,65,136],"most":[6],"challenging":[7],"paradigms":[9],"where":[10],"efficacy":[11],"and":[12,85],"efficiency":[13],"gains":[14],"are":[15],"extremely":[16],"valuable.":[17],"Hierarchical":[18],"reinforcement":[19,40],"a":[22,50,59,96,100],"variant":[23],"that":[24,95,121],"leverages":[25],"temporal":[26],"abstraction":[27],"to":[28,46,111],"structure":[29],"decision-making.":[30],"While":[31],"parametrized":[32],"quantum":[33,76,101,122,137],"computations":[34],"have":[35],"shown":[36],"success":[37],"in":[38],"non-hierarchical":[39],"learning,":[41],"whether":[42],"these":[43],"advantages":[44],"adapt":[45],"hierarchical":[47,61,149],"decision-making":[48],"remains":[49],"critical":[51],"open":[52],"question.":[53],"In":[54],"this":[55],"work,":[56],"we":[57],"develop":[58],"hybrid":[60,69,97,148],"agent":[62,70,98],"based":[63],"on":[64,89],"option-critic":[66],"architecture.":[67],"This":[68],"substitutes":[71],"classical":[72,106],"components":[73],"with":[74],"variational":[75],"circuits":[77,138],"for":[78,146],"feature":[79,102],"extractors,":[80],"option-value":[81,123],"functions,":[82,84],"termination":[83],"intra-option":[86],"policies.":[87],"Evaluated":[88],"standard":[90],"benchmarking":[91],"environments,":[92],"results":[93],"show":[94],"utilizing":[99],"extractor":[103],"can":[104],"outperform":[105],"baselines":[107],"while":[108],"saving":[109],"up":[110],"66\\%":[112],"trainable":[113],"parameters.":[114],"We":[115],"also":[116],"identify":[117],"an":[118],"architectural":[119,133],"bottleneck":[120],"estimation":[124],"severely":[125],"degrades":[126],"performance.":[127,140],"Further":[128],"ablation":[129],"studies":[130],"reveal":[131],"how":[132],"choices":[134],"affect":[139],"Our":[141],"work":[142],"establishes":[143],"design":[144],"principles":[145],"parameter-efficient":[147],"agents.":[150]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-07T00:00:00"}
