{"id":"https://openalex.org/W7141354855","doi":"https://doi.org/10.1109/lra.2026.3678453","title":"Continual Reinforcement Learning Framework for Scalable Collision Avoidance and Mitigation System With Packing Strategy","display_name":"Continual Reinforcement Learning Framework for Scalable Collision Avoidance and Mitigation System With Packing Strategy","publication_year":2026,"publication_date":"2026-03-27","ids":{"openalex":"https://openalex.org/W7141354855","doi":"https://doi.org/10.1109/lra.2026.3678453"},"language":null,"primary_location":{"id":"doi:10.1109/lra.2026.3678453","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2026.3678453","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113325722","display_name":"Joonhee Lim","orcid":null},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Joonhee Lim","raw_affiliation_strings":["KAIST, Daejeon, Republic of Korea"],"raw_orcid":"https://orcid.org/0009-0000-2248-194X","affiliations":[{"raw_affiliation_string":"KAIST, Daejeon, Republic of Korea","institution_ids":["https://openalex.org/I157485424"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100828218","display_name":"Jangho Shin","orcid":null},"institutions":[{"id":"https://openalex.org/I49946491","display_name":"Hyundai Motors (South Korea)","ror":"https://ror.org/016kvft77","country_code":"KR","type":"company","lineage":["https://openalex.org/I197312522","https://openalex.org/I49946491"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jangho Shin","raw_affiliation_strings":["Hyundai Motor Company, Hwaseong, Republic of Korea"],"raw_orcid":"https://orcid.org/0009-0003-2635-5811","affiliations":[{"raw_affiliation_string":"Hyundai Motor Company, Hwaseong, Republic of Korea","institution_ids":["https://openalex.org/I49946491"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5091555350","display_name":"Dongsuk Kum","orcid":"https://orcid.org/0000-0002-2590-4845"},"institutions":[{"id":"https://openalex.org/I157485424","display_name":"Korea Advanced Institute of Science and Technology","ror":"https://ror.org/05apxxy63","country_code":"KR","type":"education","lineage":["https://openalex.org/I157485424"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Dongsuk Kum","raw_affiliation_strings":["KAIST, Daejeon, Republic of Korea"],"raw_orcid":"https://orcid.org/0000-0002-2590-4845","affiliations":[{"raw_affiliation_string":"KAIST, Daejeon, Republic of Korea","institution_ids":["https://openalex.org/I157485424"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.42946798,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"11","issue":"5","first_page":"6264","last_page":"6271"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.22830000519752502,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.22830000519752502,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.15080000460147858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.08860000222921371,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.637499988079071},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.5218999981880188},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.42899999022483826},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.3474000096321106},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.3312000036239624},{"id":"https://openalex.org/keywords/collision","display_name":"Collision","score":0.32899999618530273}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.637499988079071},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6169000267982483},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.5218999981880188},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.42899999022483826},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3474000096321106},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3312000036239624},{"id":"https://openalex.org/C121704057","wikidata":"https://www.wikidata.org/wiki/Q352070","display_name":"Collision","level":2,"score":0.32899999618530273},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.3197999894618988},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31380000710487366},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.29809999465942383},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.2842999994754791},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.2711000144481659},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.27059999108314514},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.2671999931335449},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.2648000121116638},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2574000060558319}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2026.3678453","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2026.3678453","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/13","score":0.8697197437286377,"display_name":"Climate action"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Collision":[0],"Avoidance":[1],"and":[2,22,79,128,174],"Mitigation":[3],"System":[4],"(CAMS)":[5],"in":[6],"autonomous":[7],"driving":[8,55,134],"systems":[9],"is":[10],"crucial":[11],"for":[12,33,39,72,126,159],"ensuring":[13],"safety":[14],"by":[15,145],"formulating":[16],"strategies":[17],"to":[18,47,122,142,186],"address":[19],"various":[20],"collisions":[21],"planning":[23,31],"the":[24,43,96,102,106],"trajectory":[25],"accordingly.":[26],"Although":[27],"recent":[28],"learning-based":[29],"motion":[30,124],"methods":[32],"CAMS":[34,73,127],"have":[35],"shown":[36],"promising":[37],"results":[38],"specific":[40,94],"collision":[41,171,178],"scenarios,":[42,95],"question":[44],"of":[45,86,104],"how":[46],"continually":[48,99],"scale":[49],"up":[50,101],"their":[51],"knowledge":[52,85,144],"across":[53,132],"different":[54],"environments":[56],"has":[57],"not":[58],"yet":[59],"been":[60],"thoroughly":[61],"investigated.":[62],"In":[63],"this":[64,119],"paper,":[65],"we":[66],"propose":[67],"a":[68,90,123,139,147,168,175,194],"scalable":[69],"learning":[70,78,120],"framework":[71,121],"that":[74,149],"combines":[75],"deep":[76],"reinforcement":[77],"continual":[80,160],"learning.":[81],"By":[82],"sequentially":[83],"packing":[84],"new":[87,133],"scenarios":[88,105],"into":[89],"model":[91,107,148,195],"trained":[92,115,188],"on":[93,113,152,189],"proposed":[97],"method":[98],"scales":[100],"range":[103],"can":[108],"handle":[109],"while":[110],"maintaining":[111],"performance":[112,184],"previously":[114],"scenarios.":[116],"We":[117],"apply":[118],"planner":[125],"evaluate":[129],"its":[130],"scalability":[131],"environments.":[135],"This":[136],"approach":[137,182],"demonstrates":[138],"significant":[140],"ability":[141],"pack":[143],"outperforming":[146],"jointly":[150],"trains":[151],"all":[153],"scenarios\u2014typically":[154],"considered":[155],"an":[156],"upper":[157],"bound":[158],"learning\u2014in":[161],"about":[162,196],"2.4\u00d7":[163],"fewer":[164],"training":[165],"steps,":[166],"with":[167,193],"4.19%":[169],"higher":[170],"avoidance":[172],"rate":[173],"12.02%":[176],"lower":[177],"impact.":[179],"Moreover,":[180],"our":[181],"achieves":[183],"close":[185],"models":[187],"each":[190],"scenario":[191],"individually,":[192],"5.8\u00d7":[197],"smaller.":[198]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-28T00:00:00"}
