{"id":"https://openalex.org/W4404469647","doi":"https://doi.org/10.1109/tcyb.2024.3491582","title":"Safe Reinforcement Learning: Optimal Formation Control With Collision Avoidance of Multiple Satellite Systems","display_name":"Safe Reinforcement Learning: Optimal Formation Control With Collision Avoidance of Multiple Satellite Systems","publication_year":2024,"publication_date":"2024-11-18","ids":{"openalex":"https://openalex.org/W4404469647","doi":"https://doi.org/10.1109/tcyb.2024.3491582","pmid":"https://pubmed.ncbi.nlm.nih.gov/40030255"},"language":"en","primary_location":{"id":"doi:10.1109/tcyb.2024.3491582","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2024.3491582","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109377213","display_name":"Hui Yu","orcid":"https://orcid.org/0000-0001-7752-1355"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hui Yu","raw_affiliation_strings":["School of Electrical Engineering and Automation, Tianjin University, Tianjin, China"],"raw_orcid":"https://orcid.org/0000-0001-7752-1355","affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Automation, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044375216","display_name":"Liqian Dou","orcid":"https://orcid.org/0000-0002-3979-0420"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liqian Dou","raw_affiliation_strings":["School of Electrical Engineering and Automation, Tianjin University, Tianjin, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Automation, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100744361","display_name":"Xiuyun Zhang","orcid":"https://orcid.org/0000-0001-5309-6147"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiuyun Zhang","raw_affiliation_strings":["School of Electrical Engineering and Automation, Tianjin University, Tianjin, China"],"raw_orcid":"https://orcid.org/0000-0001-5309-6147","affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Automation, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070599005","display_name":"Jinna Li","orcid":"https://orcid.org/0000-0001-9985-6308"},"institutions":[{"id":"https://openalex.org/I166846921","display_name":"Liaoning Shihua University","ror":"https://ror.org/00k6c4h29","country_code":"CN","type":"education","lineage":["https://openalex.org/I166846921"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinna Li","raw_affiliation_strings":["School of Information and Control Engineering, Liaoning Petrochemical University, Fushun, China"],"raw_orcid":"https://orcid.org/0000-0001-9985-6308","affiliations":[{"raw_affiliation_string":"School of Information and Control Engineering, Liaoning Petrochemical University, Fushun, China","institution_ids":["https://openalex.org/I166846921"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073871408","display_name":"Qun Zong","orcid":"https://orcid.org/0000-0003-0734-6728"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qun Zong","raw_affiliation_strings":["School of Electrical Engineering and Automation, Tianjin University, Tianjin, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Automation, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5109377213"],"corresponding_institution_ids":["https://openalex.org/I162868743"],"apc_list":null,"apc_paid":null,"fwci":1.8931,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.86442566,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"55","issue":"1","first_page":"447","last_page":"459"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10040","display_name":"Adaptive Control of Nonlinear Systems","score":0.9797999858856201,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10040","display_name":"Adaptive Control of Nonlinear Systems","score":0.9797999858856201,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.9689000248908997,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.965399980545044,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.8380730748176575},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7378377318382263},{"id":"https://openalex.org/keywords/satellite","display_name":"Satellite","score":0.5364544987678528},{"id":"https://openalex.org/keywords/collision","display_name":"Collision","score":0.5342862606048584},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5142466425895691},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4760068356990814},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2684062719345093},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1989244520664215},{"id":"https://openalex.org/keywords/aerospace-engineering","display_name":"Aerospace engineering","score":0.18758484721183777},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.17835694551467896}],"concepts":[{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.8380730748176575},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7378377318382263},{"id":"https://openalex.org/C19269812","wikidata":"https://www.wikidata.org/wiki/Q26540","display_name":"Satellite","level":2,"score":0.5364544987678528},{"id":"https://openalex.org/C121704057","wikidata":"https://www.wikidata.org/wiki/Q352070","display_name":"Collision","level":2,"score":0.5342862606048584},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5142466425895691},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4760068356990814},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2684062719345093},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1989244520664215},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.18758484721183777},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.17835694551467896}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tcyb.2024.3491582","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2024.3491582","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},{"id":"pmid:40030255","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40030255","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on cybernetics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/13","display_name":"Climate action","score":0.550000011920929}],"awards":[{"id":"https://openalex.org/G6544682862","display_name":null,"funder_award_id":"62373268","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7915282223","display_name":null,"funder_award_id":"LJKZ0401","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8244373557","display_name":null,"funder_award_id":"62373273","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":57,"referenced_works":["https://openalex.org/W1966397236","https://openalex.org/W2148053762","https://openalex.org/W2422768215","https://openalex.org/W2793010390","https://openalex.org/W2802164917","https://openalex.org/W2921163467","https://openalex.org/W2955251534","https://openalex.org/W2998132146","https://openalex.org/W3010713425","https://openalex.org/W3019604371","https://openalex.org/W3048735518","https://openalex.org/W3088154325","https://openalex.org/W3094040002","https://openalex.org/W3094638344","https://openalex.org/W3111985883","https://openalex.org/W3200079785","https://openalex.org/W3200237136","https://openalex.org/W3202988211","https://openalex.org/W4200574011","https://openalex.org/W4206239199","https://openalex.org/W4214505998","https://openalex.org/W4226044131","https://openalex.org/W4226250466","https://openalex.org/W4226255370","https://openalex.org/W4226413402","https://openalex.org/W4281752204","https://openalex.org/W4281790942","https://openalex.org/W4282940153","https://openalex.org/W4285117024","https://openalex.org/W4285411083","https://openalex.org/W4285613161","https://openalex.org/W4288064487","https://openalex.org/W4304479610","https://openalex.org/W4307230233","https://openalex.org/W4312559581","https://openalex.org/W4312617036","https://openalex.org/W4312639110","https://openalex.org/W4312722722","https://openalex.org/W4312735521","https://openalex.org/W4315630992","https://openalex.org/W4318770958","https://openalex.org/W4321366636","https://openalex.org/W4361767099","https://openalex.org/W4367016649","https://openalex.org/W4376456298","https://openalex.org/W4385325555","https://openalex.org/W4386182399","https://openalex.org/W4386432124","https://openalex.org/W4388872609","https://openalex.org/W4389105021","https://openalex.org/W4390547652","https://openalex.org/W4391164217","https://openalex.org/W4391305776","https://openalex.org/W4392399520","https://openalex.org/W4393240950","https://openalex.org/W4395028215","https://openalex.org/W4400770777"],"related_works":["https://openalex.org/W4317634134","https://openalex.org/W2981729160","https://openalex.org/W4310743282","https://openalex.org/W4306904969","https://openalex.org/W2743212448","https://openalex.org/W1819938260","https://openalex.org/W2340892746","https://openalex.org/W3163022373","https://openalex.org/W2742483371","https://openalex.org/W3005999311"],"abstract_inverted_index":{"This":[0],"article":[1],"addresses":[2],"the":[3,32,35,48,51,60,65,71,81,91,110,113,129,134,140,145],"collision":[4,57],"avoidance":[5,78],"and":[6,47,79,125,131,142],"formation":[7,73,115,124],"control":[8,116],"problem":[9],"for":[10],"multisatellite":[11,72],"systems.":[12],"A":[13,95],"novel":[14],"safe":[15,85],"reinforcement":[16],"learning":[17,38],"(RL)":[18],"algorithm":[19,33,87,136,147],"based":[20],"on":[21],"an":[22,122],"adaptive":[23,36,123],"dynamic":[24],"programming":[25],"framework":[26],"is":[27,62,88,98],"proposed.":[28],"The":[29],"highlights":[30],"of":[31,50,133,144],"are":[34,137,148],"distance-varying":[37,96],"method":[39],"to":[40,55],"integrate":[41],"online":[42],"data":[43,46],"with":[44,105,121],"historical":[45],"usage":[49],"barrier":[52],"function":[53,68],"(BF)":[54],"achieve":[56,76],"avoidance.":[58],"First,":[59],"BF":[61],"introduced":[63],"into":[64],"designed":[66],"cost":[67,111],"such":[69],"that":[70],"system":[74],"can":[75,118],"obstacle":[77],"guarantee":[80],"safety.":[82],"Next,":[83],"a":[84],"RL":[86],"developed":[89],"through":[90],"critic":[92],"network":[93],"structure.":[94],"weight":[97],"introduced,":[99],"which":[100],"combines":[101],"experience":[102],"replay":[103],"samples":[104],"extrapolation":[106],"samples.":[107],"By":[108],"minimizing":[109],"function,":[112],"optimal":[114],"policy":[117],"be":[119],"obtained":[120],"self-learning":[126],"ability.":[127],"Then,":[128],"stability":[130],"safety":[132],"proposed":[135,146],"analyzed.":[138],"Finally,":[139],"effectiveness":[141],"superiority":[143],"verified":[149],"by":[150],"numerical":[151],"simulations.":[152]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":4}],"updated_date":"2025-12-27T23:08:20.325037","created_date":"2025-10-10T00:00:00"}
