{"id":"https://openalex.org/W3138349270","doi":"https://doi.org/10.1007/s11633-021-1278-z","title":"Optimal Policies for Quantum Markov Decision Processes","display_name":"Optimal Policies for Quantum Markov Decision Processes","publication_year":2021,"publication_date":"2021-03-19","ids":{"openalex":"https://openalex.org/W3138349270","doi":"https://doi.org/10.1007/s11633-021-1278-z","mag":"3138349270"},"language":"en","primary_location":{"id":"doi:10.1007/s11633-021-1278-z","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11633-021-1278-z","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11633-021-1278-z.pdf","source":{"id":"https://openalex.org/S28082686","display_name":"International Journal of Automation and Computing","issn_l":"1476-8186","issn":["1476-8186","1751-8520"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Automation and Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s11633-021-1278-z.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023088481","display_name":"Mingsheng Ying","orcid":"https://orcid.org/0000-0003-4847-702X"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210096034","display_name":"Centre for Quantum Computation and Communication Technology","ror":"https://ror.org/00rnbty21","country_code":"AU","type":"facility","lineage":["https://openalex.org/I1337719021","https://openalex.org/I165143802","https://openalex.org/I2801453606","https://openalex.org/I4210096034","https://openalex.org/I4210132349"]},{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["AU","CN"],"is_corresponding":true,"raw_author_name":"Ming-Sheng Ying","raw_affiliation_strings":["Centre for Quantum Software and Information, University of Technology, Sydney, NSW, 2007, Australia","Department of Computer Science and Technology, Tsinghua University, Beijing, 100084, China","State Key Laboratory of Computer Science, Institute of Software, Chinese Academy of Sciences, Beijing, 100190, China","Department of Computer Science and Technology, Tsinghua University, Beijing, China","Centre for Quantum Software and Information, University of Technology, Sydney, Australia","State Key Laboratory of Computer Science, Institute of Software, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-4847-702X","affiliations":[{"raw_affiliation_string":"Centre for Quantum Software and Information, University of Technology, Sydney, NSW, 2007, Australia","institution_ids":["https://openalex.org/I4210096034","https://openalex.org/I114017466"]},{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, Beijing, 100084, China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"State Key Laboratory of Computer Science, Institute of Software, Chinese Academy of Sciences, Beijing, 100190, China","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Centre for Quantum Software and Information, University of Technology, Sydney, Australia","institution_ids":["https://openalex.org/I4210096034","https://openalex.org/I114017466"]},{"raw_affiliation_string":"State Key Laboratory of Computer Science, Institute of Software, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022869475","display_name":"Yuan Feng","orcid":"https://orcid.org/0000-0002-3097-3896"},"institutions":[{"id":"https://openalex.org/I114017466","display_name":"University of Technology Sydney","ror":"https://ror.org/03f0f6041","country_code":"AU","type":"education","lineage":["https://openalex.org/I114017466"]},{"id":"https://openalex.org/I4210096034","display_name":"Centre for Quantum Computation and Communication Technology","ror":"https://ror.org/00rnbty21","country_code":"AU","type":"facility","lineage":["https://openalex.org/I1337719021","https://openalex.org/I165143802","https://openalex.org/I2801453606","https://openalex.org/I4210096034","https://openalex.org/I4210132349"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Yuan Feng","raw_affiliation_strings":["Centre for Quantum Software and Information, University of Technology, Sydney, NSW, 2007, Australia","Centre for Quantum Software and Information, University of Technology, Sydney, Australia"],"raw_orcid":"https://orcid.org/0000-0002-3097-3896","affiliations":[{"raw_affiliation_string":"Centre for Quantum Software and Information, University of Technology, Sydney, NSW, 2007, Australia","institution_ids":["https://openalex.org/I4210096034","https://openalex.org/I114017466"]},{"raw_affiliation_string":"Centre for Quantum Software and Information, University of Technology, Sydney, Australia","institution_ids":["https://openalex.org/I4210096034","https://openalex.org/I114017466"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075583677","display_name":"Shenggang Ying","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210128818","display_name":"Institute of Software","ror":"https://ror.org/033dfsn42","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210128818"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sheng-Gang Ying","raw_affiliation_strings":["State Key Laboratory of Computer Science, Institute of Software, Chinese Academy of Sciences, Beijing, 100190, China","State Key Laboratory of Computer Science, Institute of Software, Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-5052-5142","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Computer Science, Institute of Software, Chinese Academy of Sciences, Beijing, 100190, China","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I19820366"]},{"raw_affiliation_string":"State Key Laboratory of Computer Science, Institute of Software, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210128818","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5023088481"],"corresponding_institution_ids":["https://openalex.org/I114017466","https://openalex.org/I19820366","https://openalex.org/I4210096034","https://openalex.org/I4210128818","https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":1.2593,"has_fulltext":true,"cited_by_count":13,"citation_normalized_percentile":{"value":0.83326231,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":"18","issue":"3","first_page":"410","last_page":"421"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10020","display_name":"Quantum Information and Cryptography","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.879537045955658},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7898920774459839},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6289659738540649},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.6080582737922668},{"id":"https://openalex.org/keywords/dynamic-programming","display_name":"Dynamic programming","score":0.507843554019928},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.49985790252685547},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.486186683177948},{"id":"https://openalex.org/keywords/decision-problem","display_name":"Decision problem","score":0.45365986227989197},{"id":"https://openalex.org/keywords/quantum-computer","display_name":"Quantum computer","score":0.42186439037323},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.41739022731781006},{"id":"https://openalex.org/keywords/markov-model","display_name":"Markov model","score":0.41660308837890625},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.3987525701522827},{"id":"https://openalex.org/keywords/management-science","display_name":"Management science","score":0.3742695152759552},{"id":"https://openalex.org/keywords/quantum","display_name":"Quantum","score":0.36651116609573364},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2961443066596985},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2555958330631256},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.21307110786437988},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.21054130792617798},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09439122676849365}],"concepts":[{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.879537045955658},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7898920774459839},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6289659738540649},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.6080582737922668},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.507843554019928},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.49985790252685547},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.486186683177948},{"id":"https://openalex.org/C115988155","wikidata":"https://www.wikidata.org/wiki/Q3262192","display_name":"Decision problem","level":2,"score":0.45365986227989197},{"id":"https://openalex.org/C58053490","wikidata":"https://www.wikidata.org/wiki/Q176555","display_name":"Quantum computer","level":3,"score":0.42186439037323},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.41739022731781006},{"id":"https://openalex.org/C163836022","wikidata":"https://www.wikidata.org/wiki/Q6771326","display_name":"Markov model","level":3,"score":0.41660308837890625},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.3987525701522827},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.3742695152759552},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.36651116609573364},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2961443066596985},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2555958330631256},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.21307110786437988},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.21054130792617798},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09439122676849365},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s11633-021-1278-z","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11633-021-1278-z","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11633-021-1278-z.pdf","source":{"id":"https://openalex.org/S28082686","display_name":"International Journal of Automation and Computing","issn_l":"1476-8186","issn":["1476-8186","1751-8520"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Automation and Computing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s11633-021-1278-z","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11633-021-1278-z","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11633-021-1278-z.pdf","source":{"id":"https://openalex.org/S28082686","display_name":"International Journal of Automation and Computing","issn_l":"1476-8186","issn":["1476-8186","1751-8520"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Automation and Computing","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.800000011920929,"id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G1915554876","display_name":null,"funder_award_id":"DP160101652","funder_id":"https://openalex.org/F4320334704","funder_display_name":"Australian Research Council"},{"id":"https://openalex.org/G8331665637","display_name":null,"funder_award_id":"DP180100691","funder_id":"https://openalex.org/F4320334704","funder_display_name":"Australian Research Council"},{"id":"https://openalex.org/G8332624565","display_name":"\u91cf\u5b50\u7a0b\u5e8f\u8bbe\u8ba1\u7684\u7406\u8bba\u57fa\u7840","funder_award_id":"61832015","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321133","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35"},{"id":"https://openalex.org/F4320334704","display_name":"Australian Research Council","ror":"https://ror.org/05mmh0f86"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3138349270.pdf","grobid_xml":"https://content.openalex.org/works/W3138349270.grobid-xml"},"referenced_works_count":39,"referenced_works":["https://openalex.org/W294073838","https://openalex.org/W1546944959","https://openalex.org/W1630029119","https://openalex.org/W1835855307","https://openalex.org/W1971221192","https://openalex.org/W1981691276","https://openalex.org/W2011585646","https://openalex.org/W2032100464","https://openalex.org/W2032675708","https://openalex.org/W2101697221","https://openalex.org/W2107726111","https://openalex.org/W2117941808","https://openalex.org/W2119567691","https://openalex.org/W2121863487","https://openalex.org/W2127830251","https://openalex.org/W2128609675","https://openalex.org/W2168359464","https://openalex.org/W2314872319","https://openalex.org/W2521267242","https://openalex.org/W2559394418","https://openalex.org/W2773252567","https://openalex.org/W2787337287","https://openalex.org/W2792315573","https://openalex.org/W2797758148","https://openalex.org/W2918644153","https://openalex.org/W2939102864","https://openalex.org/W2954678526","https://openalex.org/W2962822640","https://openalex.org/W2963975928","https://openalex.org/W2964331425","https://openalex.org/W3022578515","https://openalex.org/W3038224590","https://openalex.org/W3099910066","https://openalex.org/W3101558632","https://openalex.org/W3102731313","https://openalex.org/W3119597650","https://openalex.org/W4210251360","https://openalex.org/W4214717370","https://openalex.org/W4298023569"],"related_works":["https://openalex.org/W2808418668","https://openalex.org/W4241327272","https://openalex.org/W2120406836","https://openalex.org/W1996214847","https://openalex.org/W2903299703","https://openalex.org/W2117282672","https://openalex.org/W4211224558","https://openalex.org/W4385342861","https://openalex.org/W1672382258","https://openalex.org/W1574958246"],"abstract_inverted_index":{"Abstract":[0],"Markov":[1],"decision":[2,12,48],"process":[3],"(MDP)":[4],"offers":[5],"a":[6,23,44],"general":[7],"framework":[8,25],"for":[9,26,58,65,83],"modelling":[10],"sequential":[11],"making":[13,49],"where":[14],"outcomes":[15],"are":[16],"random.":[17],"In":[18],"particular,":[19],"it":[20],"serves":[21],"as":[22,43],"mathematical":[24,45,81],"reinforcement":[27,84],"learning.":[28],"This":[29],"paper":[30,77],"introduces":[31],"an":[32],"extension":[33],"of":[34,47,70],"MDP,":[35],"namely":[36],"quantum":[37,51,90],"MDP":[38],"(qMDP),":[39],"that":[40],"can":[41],"serve":[42],"model":[46],"about":[50],"systems.":[52],"We":[53],"develop":[54],"dynamic":[55],"programming":[56],"algorithms":[57],"policy":[59],"evaluation":[60],"and":[61],"finding":[62],"optimal":[63],"policies":[64],"qMDPs":[66],"in":[67,75],"the":[68,89],"case":[69],"finite-horizon.":[71],"The":[72],"results":[73],"obtained":[74],"this":[76],"provide":[78],"some":[79],"useful":[80],"tools":[82],"learning":[85],"techniques":[86],"applied":[87],"to":[88],"world.":[91]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":4}],"updated_date":"2026-06-06T09:05:17.133730","created_date":"2025-10-10T00:00:00"}
