{"id":"https://openalex.org/W2523799074","doi":"https://doi.org/10.23919/acc.2017.7962986","title":"Quickest change detection approach to optimal control in Markov decision processes with model changes","display_name":"Quickest change detection approach to optimal control in Markov decision processes with model changes","publication_year":2017,"publication_date":"2017-05-01","ids":{"openalex":"https://openalex.org/W2523799074","doi":"https://doi.org/10.23919/acc.2017.7962986","mag":"2523799074"},"language":"en","primary_location":{"id":"doi:10.23919/acc.2017.7962986","is_oa":false,"landing_page_url":"https://doi.org/10.23919/acc.2017.7962986","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 American Control Conference (ACC)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1609.06757","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103110148","display_name":"Taposh Banerjee","orcid":"https://orcid.org/0000-0002-9550-8573"},"institutions":[{"id":"https://openalex.org/I136199984","display_name":"Harvard University","ror":"https://ror.org/03vek6s52","country_code":"US","type":"education","lineage":["https://openalex.org/I136199984"]},{"id":"https://openalex.org/I2801851002","display_name":"Harvard University Press","ror":"https://ror.org/006v7bf86","country_code":"US","type":"other","lineage":["https://openalex.org/I136199984","https://openalex.org/I2801851002"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Taposh Banerjee","raw_affiliation_strings":["LIDS, Harvard University, Cambridge, MA","School of Engineering and Applied Sciences, Harvard University, Cambridge, MA, United States of America"],"affiliations":[{"raw_affiliation_string":"LIDS, Harvard University, Cambridge, MA","institution_ids":["https://openalex.org/I2801851002"]},{"raw_affiliation_string":"School of Engineering and Applied Sciences, Harvard University, Cambridge, MA, United States of America","institution_ids":["https://openalex.org/I136199984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100348904","display_name":"Miao Liu","orcid":"https://orcid.org/0000-0002-6650-9972"},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Miao Liu","raw_affiliation_strings":["LIDS, Research Center, Yorktown Heights, New York","IBM T. J. Watson Research Center, Yorktown Heights, New York, United States of America"],"affiliations":[{"raw_affiliation_string":"LIDS, Research Center, Yorktown Heights, New York","institution_ids":[]},{"raw_affiliation_string":"IBM T. J. Watson Research Center, Yorktown Heights, New York, United States of America","institution_ids":["https://openalex.org/I4210114115"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011665886","display_name":"Jonathan P. How","orcid":"https://orcid.org/0000-0001-8576-1930"},"institutions":[{"id":"https://openalex.org/I4210143601","display_name":"Decision Systems (United States)","ror":"https://ror.org/0434dpa13","country_code":"US","type":"company","lineage":["https://openalex.org/I4210143601"]},{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jonathan P. How","raw_affiliation_strings":["Laboratory for Information and Decision Systems (LIDS), Massachusetts Institute of Technology, Cambridge, MA","Laboratory for Information and Decision Systems (LIDS), Massachusetts Institute of Technology, Cambridge, United States of America"],"affiliations":[{"raw_affiliation_string":"Laboratory for Information and Decision Systems (LIDS), Massachusetts Institute of Technology, Cambridge, MA","institution_ids":["https://openalex.org/I4210143601","https://openalex.org/I63966007"]},{"raw_affiliation_string":"Laboratory for Information and Decision Systems (LIDS), Massachusetts Institute of Technology, Cambridge, United States of America","institution_ids":["https://openalex.org/I4210143601","https://openalex.org/I63966007"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5103110148"],"corresponding_institution_ids":["https://openalex.org/I136199984","https://openalex.org/I2801851002"],"apc_list":null,"apc_paid":null,"fwci":0.6782,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.73934923,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"399","last_page":"405"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11443","display_name":"Advanced Statistical Process Monitoring","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1804","display_name":"Statistics, Probability and Uncertainty"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11443","display_name":"Advanced Statistical Process Monitoring","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1804","display_name":"Statistics, Probability and Uncertainty"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.9858999848365784,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/partially-observable-markov-decision-process","display_name":"Partially observable Markov decision process","score":0.7756353616714478},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.666862964630127},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6100417375564575},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.5942215323448181},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.5543555021286011},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.48319971561431885},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.47102078795433044},{"id":"https://openalex.org/keywords/decision-problem","display_name":"Decision problem","score":0.43437063694000244},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.42206236720085144},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.3680037260055542},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2951057255268097},{"id":"https://openalex.org/keywords/markov-model","display_name":"Markov model","score":0.2946195602416992},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.29357948899269104},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.27636733651161194},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2142675518989563},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.10448160767555237}],"concepts":[{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.7756353616714478},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.666862964630127},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6100417375564575},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.5942215323448181},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.5543555021286011},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.48319971561431885},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.47102078795433044},{"id":"https://openalex.org/C115988155","wikidata":"https://www.wikidata.org/wiki/Q3262192","display_name":"Decision problem","level":2,"score":0.43437063694000244},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.42206236720085144},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.3680037260055542},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2951057255268097},{"id":"https://openalex.org/C163836022","wikidata":"https://www.wikidata.org/wiki/Q6771326","display_name":"Markov model","level":3,"score":0.2946195602416992},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.29357948899269104},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.27636733651161194},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2142675518989563},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.10448160767555237},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.23919/acc.2017.7962986","is_oa":false,"landing_page_url":"https://doi.org/10.23919/acc.2017.7962986","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 American Control Conference (ACC)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1609.06757","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1609.06757","pdf_url":"https://arxiv.org/pdf/1609.06757","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:dspace.mit.edu:1721.1/114735","is_oa":true,"landing_page_url":"http://hdl.handle.net/1721.1/114735","pdf_url":null,"source":{"id":"https://openalex.org/S4306400425","display_name":"DSpace@MIT (Massachusetts Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I63966007","host_organization_name":"Massachusetts Institute of Technology","host_organization_lineage":["https://openalex.org/I63966007"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv","raw_type":"http://purl.org/eprint/type/ConferencePaper"},{"id":"doi:10.48550/arxiv.1609.06757","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1609.06757","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"},{"id":"mag:2523799074","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":null,"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":null}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1609.06757","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1609.06757","pdf_url":"https://arxiv.org/pdf/1609.06757","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.5600000023841858}],"awards":[],"funders":[{"id":"https://openalex.org/F4320308204","display_name":"Northrop Grumman","ror":"https://ror.org/05kewds18"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2523799074.pdf"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W60519195","https://openalex.org/W201409579","https://openalex.org/W1533983758","https://openalex.org/W1546020435","https://openalex.org/W1587845729","https://openalex.org/W1850608659","https://openalex.org/W1967128863","https://openalex.org/W1981904416","https://openalex.org/W2001825424","https://openalex.org/W2004094275","https://openalex.org/W2006650111","https://openalex.org/W2018319586","https://openalex.org/W2037420795","https://openalex.org/W2051903196","https://openalex.org/W2078273556","https://openalex.org/W2098432798","https://openalex.org/W2107726111","https://openalex.org/W2112072995","https://openalex.org/W2115524942","https://openalex.org/W2115597380","https://openalex.org/W2166426063","https://openalex.org/W2168342951","https://openalex.org/W2170341113","https://openalex.org/W2317700292","https://openalex.org/W2499002200","https://openalex.org/W2577420768","https://openalex.org/W2591832919","https://openalex.org/W2732645484","https://openalex.org/W4232896127","https://openalex.org/W4236243725","https://openalex.org/W6608186120","https://openalex.org/W6740804295","https://openalex.org/W7043203782"],"related_works":["https://openalex.org/W2964254877","https://openalex.org/W1527869850","https://openalex.org/W2964074953","https://openalex.org/W2408899602","https://openalex.org/W90968195","https://openalex.org/W2128775537","https://openalex.org/W2972441443","https://openalex.org/W2256566929","https://openalex.org/W1548514401","https://openalex.org/W2276878381","https://openalex.org/W1514031120","https://openalex.org/W2122187689","https://openalex.org/W2547295696","https://openalex.org/W3092636900","https://openalex.org/W2142410606","https://openalex.org/W2808013820","https://openalex.org/W3155179702","https://openalex.org/W2990691216","https://openalex.org/W3096263346","https://openalex.org/W3154040352"],"abstract_inverted_index":{"Optimal":[0],"control":[1,17],"in":[2,14,99,145,202],"non-stationary":[3,191],"Markov":[4],"decision":[5],"processes":[6],"(MDP)":[7],"is":[8,19,45,54,81,164,184],"a":[9,16,39,59,91,97,103,142,151,170,190],"challenging":[10],"problem.":[11],"The":[12,176],"aim":[13],"such":[15,113],"problem":[18,53,80,162],"to":[20,51,55,112,156],"maximize":[21],"the":[22,27,31,47,79,84,100,125,137,158,179,195,198],"long-term":[23],"discounted":[24],"reward":[25,32],"when":[26],"transition":[28],"dynamics":[29],"or":[30],"function":[33],"can":[34,140],"change":[35,43,88,98],"over":[36],"time.":[37],"When":[38],"prior":[40],"knowledge":[41],"of":[42,86,93,102,105,127,178],"statistics":[44],"available,":[46],"standard":[48],"Bayesian":[49,171,204],"approach":[50],"this":[52,77],"reformulate":[56],"it":[57,66],"as":[58],"partially":[60],"observable":[61],"MDP":[62,192],"(POMDP)":[63],"and":[64,149,194,205],"solve":[65,157],"using":[67],"approximate":[68],"POMDP":[69],"solvers,":[70],"which":[71],"are":[72],"typically":[73],"computationally":[74],"demanding.":[75],"In":[76],"paper,":[78],"analyzed":[82],"through":[83,186],"viewpoint":[85],"quickest":[87],"detection":[89],"(QCD),":[90],"set":[92],"tools":[94],"for":[95,129,167],"detecting":[96],"distribution":[101],"sequence":[104],"random":[106],"variables.":[107],"Current":[108],"methods":[109,201],"applying":[110],"QCD":[111,200],"problems":[114],"only":[115],"passively":[116],"detect":[117],"changes":[118],"by":[119],"following":[120],"prescribed":[121],"policies,":[122],"without":[123],"optimizing":[124],"choice":[126],"actions":[128],"long":[130,146],"term":[131,147],"performance.":[132],"We":[133],"demonstrate":[134],"that":[135],"ignoring":[136],"reward-detection":[138],"trade-off":[139],"cause":[141],"significant":[143],"loss":[144],"rewards,":[148],"propose":[150],"two":[152,181],"threshold":[153,182],"switching":[154],"strategy":[155,183,196],"issue.":[159],"A":[160],"non-Bayesian":[161,206],"formulation":[163,172],"also":[165],"proposed":[166,180],"scenarios":[168],"where":[169],"cannot":[173],"be":[174],"defined.":[175],"performance":[177],"examined":[185],"numerical":[187],"analysis":[188],"on":[189],"task,":[193],"outperforms":[197],"state-of-the-art":[199],"both":[203],"settings.":[207]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}