{"id":"https://openalex.org/W4402808998","doi":"https://doi.org/10.1109/tits.2024.3443397","title":"Cross-Observability Optimistic-Pessimistic Safe Reinforcement Learning for Interactive Motion Planning With Visual Occlusion","display_name":"Cross-Observability Optimistic-Pessimistic Safe Reinforcement Learning for Interactive Motion Planning With Visual Occlusion","publication_year":2024,"publication_date":"2024-09-24","ids":{"openalex":"https://openalex.org/W4402808998","doi":"https://doi.org/10.1109/tits.2024.3443397"},"language":"en","primary_location":{"id":"doi:10.1109/tits.2024.3443397","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/tits.2024.3443397","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102936751","display_name":"Xiaohui Hou","orcid":"https://orcid.org/0000-0002-5673-2396"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiaohui Hou","raw_affiliation_strings":["National Key Laboratory of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]},{"raw_affiliation_string":"School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Minggang Gan","orcid":"https://orcid.org/0000-0002-2163-2475"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Minggang Gan","raw_affiliation_strings":["National Key Laboratory of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]},{"raw_affiliation_string":"School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107837750","display_name":"Wei Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Wu","raw_affiliation_strings":["National Key Laboratory of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Autonomous Intelligent Unmanned Systems, School of Automation, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]},{"raw_affiliation_string":"School of Automation, National Key Laboratory of Autonomous Intelligent Unmanned Systems, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107939210","display_name":"Yuan Ji","orcid":"https://orcid.org/0000-0002-5991-2421"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yuan Ji","raw_affiliation_strings":["School of Mechanical and Aerospace Engineering, Nanyang Technological University, Jurong West, Singapore","School of Mechanical and Aerospace Engineering, Nanyang Technological University, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Mechanical and Aerospace Engineering, Nanyang Technological University, Jurong West, Singapore","institution_ids":["https://openalex.org/I172675005"]},{"raw_affiliation_string":"School of Mechanical and Aerospace Engineering, Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068593680","display_name":"Shiyue Zhao","orcid":"https://orcid.org/0000-0001-6742-2767"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiyue Zhao","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108047474","display_name":"Jie Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Chen","raw_affiliation_strings":["National Key Laboratory of Autonomous Intelligent Unmanned Systems, Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"National Key Laboratory of Autonomous Intelligent Unmanned Systems, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5102936751"],"corresponding_institution_ids":["https://openalex.org/I125839683"],"apc_list":null,"apc_paid":null,"fwci":0.4949,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.64982906,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"25","issue":"11","first_page":"17602","last_page":"17613"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9869999885559082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/observability","display_name":"Observability","score":0.9098224639892578},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6770885586738586},{"id":"https://openalex.org/keywords/pessimism","display_name":"Pessimism","score":0.6696197390556335},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.5295242667198181},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5147221684455872},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5084730386734009},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.4994361400604248},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4809398055076599},{"id":"https://openalex.org/keywords/occlusion","display_name":"Occlusion","score":0.45655080676078796},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.3264327049255371},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.20845511555671692},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.1370367407798767},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.10451328754425049}],"concepts":[{"id":"https://openalex.org/C36299963","wikidata":"https://www.wikidata.org/wiki/Q1369844","display_name":"Observability","level":2,"score":0.9098224639892578},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6770885586738586},{"id":"https://openalex.org/C9992130","wikidata":"https://www.wikidata.org/wiki/Q484954","display_name":"Pessimism","level":2,"score":0.6696197390556335},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.5295242667198181},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5147221684455872},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5084730386734009},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.4994361400604248},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4809398055076599},{"id":"https://openalex.org/C2776268601","wikidata":"https://www.wikidata.org/wiki/Q968808","display_name":"Occlusion","level":2,"score":0.45655080676078796},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.3264327049255371},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.20845511555671692},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.1370367407798767},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.10451328754425049},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C164705383","wikidata":"https://www.wikidata.org/wiki/Q10379","display_name":"Cardiology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tits.2024.3443397","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/tits.2024.3443397","pdf_url":null,"source":{"id":"https://openalex.org/S144771191","display_name":"IEEE Transactions on Intelligent Transportation Systems","issn_l":"1524-9050","issn":["1524-9050","1558-0016"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Transportation Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1127291761","display_name":null,"funder_award_id":"62303058","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W1965455100","https://openalex.org/W2000291746","https://openalex.org/W2020053297","https://openalex.org/W2039240409","https://openalex.org/W2890356250","https://openalex.org/W2949795681","https://openalex.org/W2951875426","https://openalex.org/W2962730596","https://openalex.org/W2963732412","https://openalex.org/W2965289613","https://openalex.org/W2970816301","https://openalex.org/W2970857152","https://openalex.org/W2971306529","https://openalex.org/W2990384329","https://openalex.org/W3012371209","https://openalex.org/W3016664689","https://openalex.org/W3065468121","https://openalex.org/W3081214244","https://openalex.org/W3090027660","https://openalex.org/W3090768122","https://openalex.org/W3093537939","https://openalex.org/W3127561923","https://openalex.org/W3164838844","https://openalex.org/W3200750070","https://openalex.org/W3203124669","https://openalex.org/W3208686011","https://openalex.org/W3209083247","https://openalex.org/W3215870255","https://openalex.org/W4220857253","https://openalex.org/W4221029045","https://openalex.org/W4229459602","https://openalex.org/W4285600734","https://openalex.org/W4292965203","https://openalex.org/W4296838344","https://openalex.org/W4312679374","https://openalex.org/W4322632270","https://openalex.org/W4366308958","https://openalex.org/W4386550196","https://openalex.org/W6634817459","https://openalex.org/W6747473740","https://openalex.org/W6838979500","https://openalex.org/W6847064673"],"related_works":["https://openalex.org/W2046459260","https://openalex.org/W2765830098","https://openalex.org/W2967463586","https://openalex.org/W1971989957","https://openalex.org/W2517338020","https://openalex.org/W3157641275","https://openalex.org/W4312300846","https://openalex.org/W4206221578","https://openalex.org/W3029572990","https://openalex.org/W2615757685"],"abstract_inverted_index":{"This":[0],"study":[1],"focuses":[2],"on":[3],"the":[4,47,54,61,83,91,109,115,118,135,140],"motion":[5,27],"planning":[6,28],"and":[7,38,58,60,72,86,95,142,147],"risk":[8,50],"evaluation":[9],"of":[10,46,51,117],"unprotected":[11],"left":[12],"turns":[13],"at":[14],"occluded":[15,52,124],"intersections":[16],"for":[17],"autonomous":[18],"vehicles.":[19,65],"In":[20],"this":[21],"paper,":[22],"we":[23],"present":[24],"an":[25,103],"interactive":[26],"controller":[29,120],"that":[30,134],"combines":[31],"Cross-Observability":[32],"Optimistic-Pessimistic":[33],"Safe":[34],"Reinforcement":[35],"Learning":[36],"(COOP-SRL)":[37],"Nonlinear":[39],"Model":[40],"Predictive":[41],"Control":[42],"(NMPC),":[43],"with":[44,127],"consideration":[45],"uncertain":[48],"potential":[49],"zone,":[53],"trade-off":[55],"between":[56,64],"safety":[57],"efficiency,":[59],"dynamic":[62],"interaction":[63],"The":[66],"proposed":[67,119,136],"COOP-SRL":[68],"algorithm":[69],"integrates":[70],"fully":[71],"partially":[73],"observable":[74],"policies":[75],"through":[76],"cross-observability":[77],"soft":[78],"imitation":[79],"learning":[80,88,112],"to":[81,101],"leverage":[82],"expert":[84],"guidance":[85],"improve":[87],"efficiency.":[89],"Moreover,":[90],"optimistic":[92],"exploration":[93,110],"policy":[94],"pessimism":[96],"safe":[97,105],"constraint":[98],"are":[99],"adopted":[100],"provide":[102],"adaptive":[104],"strategy":[106],"without":[107],"hindering":[108],"during":[111],"process.":[113],"Finally,":[114],"evaluations":[116],"were":[121],"conducted":[122],"in":[123,145],"intersection":[125],"scenarios":[126],"various":[128],"traffic":[129],"density":[130],"level,":[131],"which":[132],"indicate":[133],"method":[137],"outperforms":[138],"both":[139],"optimization-based":[141],"learning-based":[143],"baselines":[144],"qualitative":[146],"quantitative":[148],"indexes.":[149]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
