{"id":"https://openalex.org/W2620827312","doi":"https://doi.org/10.1177/0278364915581505","title":"Temporal logic motion control using actor\u2013critic methods","display_name":"Temporal logic motion control using actor\u2013critic methods","publication_year":2015,"publication_date":"2015-05-26","ids":{"openalex":"https://openalex.org/W2620827312","doi":"https://doi.org/10.1177/0278364915581505","mag":"2620827312"},"language":"en","primary_location":{"id":"doi:10.1177/0278364915581505","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0278364915581505","pdf_url":null,"source":{"id":"https://openalex.org/S73484101","display_name":"The International Journal of Robotics Research","issn_l":"0278-3649","issn":["0278-3649","1741-3176"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of Robotics Research","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100378632","display_name":"Jing Wang","orcid":"https://orcid.org/0000-0003-0182-0353"},"institutions":[{"id":"https://openalex.org/I111088046","display_name":"Boston University","ror":"https://ror.org/05qwgg493","country_code":"US","type":"education","lineage":["https://openalex.org/I111088046"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jing Wang","raw_affiliation_strings":["Division of System Engineering, Department of Mechanical Engineering, and Department of Electrical and Computer Engineering, Boston University, Boston, MA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Division of System Engineering, Department of Mechanical Engineering, and Department of Electrical and Computer Engineering, Boston University, Boston, MA, USA","institution_ids":["https://openalex.org/I111088046"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111565635","display_name":"Xuchu Ding","orcid":null},"institutions":[{"id":"https://openalex.org/I4210145666","display_name":"Embedded Systems (United States)","ror":"https://ror.org/04742eh45","country_code":"US","type":"company","lineage":["https://openalex.org/I4210145666"]},{"id":"https://openalex.org/I4401726811","display_name":"Hartford Financial Services (United States)","ror":"https://ror.org/00mwq1g96","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726811"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xuchu Ding","raw_affiliation_strings":["Embedded Systems and Networks Group, United Technologies Research Center, East Hartford, CT, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Embedded Systems and Networks Group, United Technologies Research Center, East Hartford, CT, USA","institution_ids":["https://openalex.org/I4210145666","https://openalex.org/I4401726811"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069564559","display_name":"Morteza Lahijanian","orcid":"https://orcid.org/0000-0001-7549-4365"},"institutions":[{"id":"https://openalex.org/I74775410","display_name":"Rice University","ror":"https://ror.org/008zs3103","country_code":"US","type":"education","lineage":["https://openalex.org/I74775410"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Morteza Lahijanian","raw_affiliation_strings":["Department of Computer Science, Rice University, Houston, TX, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Rice University, Houston, TX, USA","institution_ids":["https://openalex.org/I74775410"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075696701","display_name":"Ioannis Ch. Paschalidis","orcid":"https://orcid.org/0000-0002-3343-2913"},"institutions":[{"id":"https://openalex.org/I111088046","display_name":"Boston University","ror":"https://ror.org/05qwgg493","country_code":"US","type":"education","lineage":["https://openalex.org/I111088046"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ioannis Ch. Paschalidis","raw_affiliation_strings":["Division of System Engineering, Department of Mechanical Engineering, and Department of Electrical and Computer Engineering, Boston University, Boston, MA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Division of System Engineering, Department of Mechanical Engineering, and Department of Electrical and Computer Engineering, Boston University, Boston, MA, USA","institution_ids":["https://openalex.org/I111088046"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086742095","display_name":"C\u0103lin Belta","orcid":"https://orcid.org/0000-0002-7141-2657"},"institutions":[{"id":"https://openalex.org/I111088046","display_name":"Boston University","ror":"https://ror.org/05qwgg493","country_code":"US","type":"education","lineage":["https://openalex.org/I111088046"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Calin A. Belta","raw_affiliation_strings":["Division of System Engineering, Department of Mechanical Engineering, and Department of Electrical and Computer Engineering, Boston University, Boston, MA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Division of System Engineering, Department of Mechanical Engineering, and Department of Electrical and Computer Engineering, Boston University, Boston, MA, USA","institution_ids":["https://openalex.org/I111088046"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":4.8969,"has_fulltext":false,"cited_by_count":30,"citation_normalized_percentile":{"value":0.95546034,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"34","issue":"10","first_page":"1329","last_page":"1344"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10675","display_name":"Mechanical Circulatory Support Devices","score":0.9843000173568726,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.8219923377037048},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6943356990814209},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6037983894348145},{"id":"https://openalex.org/keywords/optimal-control","display_name":"Optimal control","score":0.5703661441802979},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5649059414863586},{"id":"https://openalex.org/keywords/dynamic-programming","display_name":"Dynamic programming","score":0.5442547798156738},{"id":"https://openalex.org/keywords/temporal-logic","display_name":"Temporal logic","score":0.5306289196014404},{"id":"https://openalex.org/keywords/linear-temporal-logic","display_name":"Linear temporal logic","score":0.5011422634124756},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.47264567017555237},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4657462537288666},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.4485104978084564},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4261954426765442},{"id":"https://openalex.org/keywords/temporal-difference-learning","display_name":"Temporal difference learning","score":0.42143648862838745},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.4114193618297577},{"id":"https://openalex.org/keywords/stochastic-control","display_name":"Stochastic control","score":0.41023150086402893},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3473926782608032},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.24086755514144897},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.16865292191505432},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.16844579577445984},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.15183097124099731}],"concepts":[{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.8219923377037048},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6943356990814209},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6037983894348145},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.5703661441802979},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5649059414863586},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.5442547798156738},{"id":"https://openalex.org/C25016198","wikidata":"https://www.wikidata.org/wiki/Q781833","display_name":"Temporal logic","level":2,"score":0.5306289196014404},{"id":"https://openalex.org/C4777664","wikidata":"https://www.wikidata.org/wiki/Q1536492","display_name":"Linear temporal logic","level":2,"score":0.5011422634124756},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.47264567017555237},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4657462537288666},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.4485104978084564},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4261954426765442},{"id":"https://openalex.org/C196340769","wikidata":"https://www.wikidata.org/wiki/Q7698910","display_name":"Temporal difference learning","level":3,"score":0.42143648862838745},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4114193618297577},{"id":"https://openalex.org/C170131372","wikidata":"https://www.wikidata.org/wiki/Q7617811","display_name":"Stochastic control","level":3,"score":0.41023150086402893},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3473926782608032},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.24086755514144897},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.16865292191505432},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.16844579577445984},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.15183097124099731},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":7,"locations":[{"id":"doi:10.1177/0278364915581505","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0278364915581505","pdf_url":null,"source":{"id":"https://openalex.org/S73484101","display_name":"The International Journal of Robotics Research","issn_l":"0278-3649","issn":["0278-3649","1741-3176"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of Robotics Research","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.712.8024","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.712.8024","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.rice.edu/%7Emml9/papers/ICRA2012.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.728.159","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.728.159","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://sites.bu.edu/paschalidis/files/2015/06/IJRR-AC-rev2-v1-final.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.750.4586","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.750.4586","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://arxiv.org/pdf/1202.2185.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.906.4268","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.906.4268","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://www.researchgate.net/profile/Jing_Wang33/publication/221663433_Temporal_Logic_Motion_Control_using_Actor-Critic_Methods/links/0912f510051c40dac8000000.pdf?origin%3Dpublication_detail","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.914.6638","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.914.6638","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://www.researchgate.net/profile/Jing_Wang33/publication/221663433_Temporal_Logic_Motion_Control_using_Actor-Critic_Methods/links/0912f510051c40dac8000000.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.921.2202","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.921.2202","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://sites.bu.edu/hyness/files/2014/05/dennis_icra2012_actor_critic.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.7799999713897705}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W195642197","https://openalex.org/W1266757872","https://openalex.org/W1482244486","https://openalex.org/W1496256885","https://openalex.org/W1498432697","https://openalex.org/W1576452626","https://openalex.org/W1579117491","https://openalex.org/W1597303641","https://openalex.org/W1752118222","https://openalex.org/W1854776945","https://openalex.org/W1964782533","https://openalex.org/W1967294943","https://openalex.org/W1970269621","https://openalex.org/W1994511055","https://openalex.org/W2009303086","https://openalex.org/W2016990484","https://openalex.org/W2020293036","https://openalex.org/W2020883449","https://openalex.org/W2049553644","https://openalex.org/W2078151802","https://openalex.org/W2091565802","https://openalex.org/W2098432798","https://openalex.org/W2104241562","https://openalex.org/W2115174789","https://openalex.org/W2119567691","https://openalex.org/W2121863487","https://openalex.org/W2124339220","https://openalex.org/W2130786035","https://openalex.org/W2153358971","https://openalex.org/W2156737235","https://openalex.org/W2157807654","https://openalex.org/W2163941698","https://openalex.org/W2165364079","https://openalex.org/W2334782222","https://openalex.org/W2502103274","https://openalex.org/W2913459036","https://openalex.org/W2963778636","https://openalex.org/W4210727445","https://openalex.org/W4214717370","https://openalex.org/W4307347247"],"related_works":["https://openalex.org/W2124110813","https://openalex.org/W3021103820","https://openalex.org/W2763487042","https://openalex.org/W2031188261","https://openalex.org/W4232446061","https://openalex.org/W4285022830","https://openalex.org/W2020883449","https://openalex.org/W3035590440","https://openalex.org/W3205267199","https://openalex.org/W4386081380"],"abstract_inverted_index":{"This":[0,127],"paper":[1],"considers":[2],"the":[3,23,33,45,48,62,67,71,76,93,98,124,134,163],"problem":[4,59,96],"of":[5,25,47,69,123,133,148,162],"deploying":[6],"a":[7,10,14,26,51,79,117,138,145],"robot":[8,34,57,135],"from":[9],"specification":[11],"given":[12],"as":[13,50,89,91],"temporal":[15,72,119],"logic":[16,73],"statement":[17],"about":[18],"some":[19],"properties":[20],"satisfied":[21],"by":[22],"regions":[24,46],"large,":[27],"partitioned":[28],"environment.":[29],"We":[30],"assume":[31],"that":[32,160],"has":[35],"noisy":[36],"sensors":[37],"and":[38,40,136],"actuators":[39],"model":[41],"its":[42],"motion":[43],"through":[44],"environment":[49],"Markov":[52],"decision":[53],"process":[54],"(MDP).":[55],"The":[56,150],"control":[58,63,140],"becomes":[60],"finding":[61],"policy":[64,141],"which":[65],"maximizes":[66],"probability":[68],"satisfying":[70],"task":[74],"on":[75,116,130],"MDP.":[77],"For":[78],"large":[80],"environment,":[81],"obtaining":[82],"transition":[83,151],"probabilities":[84,152],"for":[85,97],"each":[86],"state\u2013action":[87],"pair,":[88],"well":[90],"solving":[92],"necessary":[94],"optimization":[95],"optimal":[99,169],"policy,":[100],"are":[101,153],"computationally":[102],"intensive.":[103],"To":[104],"address":[105],"these":[106],"issues,":[107],"we":[108],"propose":[109],"an":[110,167],"approximate":[111],"dynamic":[112],"programming":[113],"framework":[114,128],"based":[115],"least-squares":[118],"difference":[120],"learning":[121],"method":[122],"actor\u2013critic":[125],"type.":[126],"operates":[129],"sample":[131],"paths":[132],"optimizes":[137],"randomized":[139],"with":[142],"respect":[143],"to":[144,166],"small":[146],"set":[147],"parameters.":[149],"obtained":[154],"only":[155],"when":[156],"needed.":[157],"Simulations":[158],"confirm":[159],"convergence":[161],"parameters":[164],"translates":[165],"approximately":[168],"policy.":[170]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
