{"id":"https://openalex.org/W4394627255","doi":"https://doi.org/10.1109/tnnls.2024.3379654","title":"Pontryagin\u2019s Minimum Principle-Guided RL for Minimum-Time Exploration of Spatiotemporal Fields","display_name":"Pontryagin\u2019s Minimum Principle-Guided RL for Minimum-Time Exploration of Spatiotemporal Fields","publication_year":2024,"publication_date":"2024-04-09","ids":{"openalex":"https://openalex.org/W4394627255","doi":"https://doi.org/10.1109/tnnls.2024.3379654","pmid":"https://pubmed.ncbi.nlm.nih.gov/38593018"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2024.3379654","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2024.3379654","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036876831","display_name":"Zhuo Li","orcid":"https://orcid.org/0000-0002-1958-024X"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]},{"id":"https://openalex.org/I50632499","display_name":"Chongqing University of Technology","ror":"https://ror.org/04vgbd477","country_code":"CN","type":"education","lineage":["https://openalex.org/I50632499"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhuo Li","raw_affiliation_strings":["National Key Laboratory of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","Beijing Institute of Technology Chongqing Innovation Center, Chongqing, China","School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]},{"raw_affiliation_string":"Beijing Institute of Technology Chongqing Innovation Center, Chongqing, China","institution_ids":["https://openalex.org/I50632499","https://openalex.org/I125839683"]},{"raw_affiliation_string":"School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100701131","display_name":"Jian Sun","orcid":"https://orcid.org/0000-0001-9898-3129"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]},{"id":"https://openalex.org/I50632499","display_name":"Chongqing University of Technology","ror":"https://ror.org/04vgbd477","country_code":"CN","type":"education","lineage":["https://openalex.org/I50632499"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Sun","raw_affiliation_strings":["National Key Laboratory of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China","Beijing Institute of Technology Chongqing Innovation Center, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]},{"raw_affiliation_string":"School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]},{"raw_affiliation_string":"Beijing Institute of Technology Chongqing Innovation Center, Chongqing, China","institution_ids":["https://openalex.org/I50632499","https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054312245","display_name":"Antonio G. Marqu\u00e9s","orcid":"https://orcid.org/0000-0002-4642-7718"},"institutions":[{"id":"https://openalex.org/I182083151","display_name":"Universidad Rey Juan Carlos","ror":"https://ror.org/01v5cv687","country_code":"ES","type":"education","lineage":["https://openalex.org/I182083151"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Antonio G. Marques","raw_affiliation_strings":["Department of Signal Theory and Communications, King Juan Carlos University, Madrid, Spain"],"affiliations":[{"raw_affiliation_string":"Department of Signal Theory and Communications, King Juan Carlos University, Madrid, Spain","institution_ids":["https://openalex.org/I182083151"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100367403","display_name":"Gang Wang","orcid":"https://orcid.org/0000-0002-7266-2412"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]},{"id":"https://openalex.org/I50632499","display_name":"Chongqing University of Technology","ror":"https://ror.org/04vgbd477","country_code":"CN","type":"education","lineage":["https://openalex.org/I50632499"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gang Wang","raw_affiliation_strings":["National Key Laboratory of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","Beijing Institute of Technology Chongqing Innovation Center, Chongqing, China","School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]},{"raw_affiliation_string":"Beijing Institute of Technology Chongqing Innovation Center, Chongqing, China","institution_ids":["https://openalex.org/I50632499","https://openalex.org/I125839683"]},{"raw_affiliation_string":"School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088962631","display_name":"Keyou You","orcid":"https://orcid.org/0000-0003-4355-5340"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Keyou You","raw_affiliation_strings":["Department of Automation and BNRist, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Automation and BNRist, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5036876831"],"corresponding_institution_ids":["https://openalex.org/I125839683","https://openalex.org/I50632499"],"apc_list":null,"apc_paid":null,"fwci":0.2493,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.46999609,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"36","issue":"3","first_page":"5375","last_page":"5387"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discretization","display_name":"Discretization","score":0.6577941179275513},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6200612187385559},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5941849946975708},{"id":"https://openalex.org/keywords/optimal-control","display_name":"Optimal control","score":0.5387367606163025},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5380252599716187},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.5089986324310303},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.41218191385269165},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.41163530945777893},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.37717700004577637},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.287853479385376}],"concepts":[{"id":"https://openalex.org/C73000952","wikidata":"https://www.wikidata.org/wiki/Q17007827","display_name":"Discretization","level":2,"score":0.6577941179275513},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6200612187385559},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5941849946975708},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.5387367606163025},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5380252599716187},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.5089986324310303},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.41218191385269165},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.41163530945777893},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.37717700004577637},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.287853479385376},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2024.3379654","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2024.3379654","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:38593018","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38593018","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.550000011920929,"display_name":"Climate action","id":"https://metadata.un.org/sdg/13"}],"awards":[{"id":"https://openalex.org/G2059183635","display_name":null,"funder_award_id":"61925303","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2493513157","display_name":null,"funder_award_id":"U23B2059","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2575069074","display_name":null,"funder_award_id":"62088101","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7093390570","display_name":null,"funder_award_id":"62303054","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W879905685","https://openalex.org/W1492326914","https://openalex.org/W1606119439","https://openalex.org/W1855169650","https://openalex.org/W2019738489","https://openalex.org/W2031521898","https://openalex.org/W2055014394","https://openalex.org/W2145339207","https://openalex.org/W2313274380","https://openalex.org/W2484646121","https://openalex.org/W2746553466","https://openalex.org/W2790049323","https://openalex.org/W2794499044","https://openalex.org/W2804397006","https://openalex.org/W2906829782","https://openalex.org/W2912964491","https://openalex.org/W2945053513","https://openalex.org/W2966982543","https://openalex.org/W2972296478","https://openalex.org/W3015470607","https://openalex.org/W3036859942","https://openalex.org/W3088197938","https://openalex.org/W3119447081","https://openalex.org/W3175147250","https://openalex.org/W3176761908","https://openalex.org/W3209083247","https://openalex.org/W4200630212","https://openalex.org/W4200635426","https://openalex.org/W4206602738","https://openalex.org/W4213246061","https://openalex.org/W4214717370","https://openalex.org/W4220741039","https://openalex.org/W4225390809","https://openalex.org/W4304480790","https://openalex.org/W4308637970","https://openalex.org/W4385834370","https://openalex.org/W6631190155","https://openalex.org/W6747473740","https://openalex.org/W6748839928"],"related_works":["https://openalex.org/W2006251942","https://openalex.org/W2364741597","https://openalex.org/W1492103595","https://openalex.org/W1864774435","https://openalex.org/W946352265","https://openalex.org/W3020787026","https://openalex.org/W2334479858","https://openalex.org/W2793786119","https://openalex.org/W1507702947","https://openalex.org/W2022062253"],"abstract_inverted_index":{"This":[0,115],"article":[1],"studies":[2],"the":[3,24,29,34,43,54,57,71,76,96,106,146,149,165],"trajectory":[4,125],"planning":[5,126,131],"problem":[6,26,109],"of":[7,33,45,148,160],"an":[8],"autonomous":[9],"vehicle":[10],"for":[11,80,85,105,173],"exploring":[12],"a":[13,18,46,61,120,130,138],"spatiotemporal":[14],"field":[15],"subject":[16],"to":[17,52,68,118],"constraint":[19],"on":[20,28,137],"cumulative":[21],"information.":[22],"Since":[23],"resulting":[25],"depends":[27],"signal":[30],"strength":[31],"distribution":[32],"field,":[35],"which":[36,86,128],"is":[37,66],"unknown":[38],"in":[39,158],"practice,":[40],"we":[41,94],"advocate":[42],"use":[44],"model-free":[47,77],"reinforcement":[48],"learning":[49,162],"(RL)":[50],"method":[51],"find":[53],"solution.":[55],"Given":[56],"vehicle's":[58,166],"dynamical":[59],"model,":[60],"critical":[62],"(and":[63],"open)":[64],"question":[65],"how":[67],"judiciously":[69],"merge":[70],"model-based":[72],"optimality":[73,103],"conditions":[74,104],"into":[75],"RL":[78,124,151],"framework":[79],"improved":[81],"efficiency":[82,163],"and":[83,153,164],"generalization,":[84],"this":[87],"work":[88],"provides":[89],"some":[90],"positive":[91],"results.":[92],"Specifically,":[93],"discretize":[95],"continuous":[97,139,174],"action":[98,140],"space":[99],"by":[100],"leveraging":[101],"analytic":[102],"minimum-time":[107],"optimization":[108],"via":[110],"Pontryagin's":[111],"minimum":[112],"principle":[113],"(PMP).":[114],"allows":[116],"us":[117],"develop":[119],"novel":[121],"discrete":[122],"PMP-based":[123,150],"algorithm,":[127],"learns":[129],"policy":[132],"faster":[133],"than":[134],"those":[135],"based":[136],"space.":[141],"Simulation":[142],"results:":[143],"1)":[144],"validate":[145],"effectiveness":[147],"algorithm":[152],"2)":[154],"demonstrate":[155],"its":[156],"advantages,":[157],"terms":[159],"both":[161],"exploration":[167],"time,":[168],"over":[169],"two":[170],"baseline":[171],"methods":[172],"control":[175],"inputs.":[176]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
