{"id":"https://openalex.org/W4226188445","doi":"https://doi.org/10.1109/robio54168.2021.9739455","title":"Robot Navigation with Interaction-based Deep Reinforcement Learning","display_name":"Robot Navigation with Interaction-based Deep Reinforcement Learning","publication_year":2021,"publication_date":"2021-12-27","ids":{"openalex":"https://openalex.org/W4226188445","doi":"https://doi.org/10.1109/robio54168.2021.9739455"},"language":"en","primary_location":{"id":"doi:10.1109/robio54168.2021.9739455","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio54168.2021.9739455","pdf_url":null,"source":{"id":"https://openalex.org/S4363607846","display_name":"2021 IEEE International Conference on Robotics and Biomimetics (ROBIO)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103022180","display_name":"Yu Zhai","orcid":"https://orcid.org/0009-0005-6660-1268"},"institutions":[{"id":"https://openalex.org/I25757504","display_name":"China University of Mining and Technology","ror":"https://ror.org/01xt2dr21","country_code":"CN","type":"education","lineage":["https://openalex.org/I25757504"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yu Zhai","raw_affiliation_strings":["China University of Mining and Technology,Jiangsu,China,221008"],"affiliations":[{"raw_affiliation_string":"China University of Mining and Technology,Jiangsu,China,221008","institution_ids":["https://openalex.org/I25757504"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021924831","display_name":"Yanzi Miao","orcid":"https://orcid.org/0000-0002-2688-7477"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210164862","display_name":"Artificial Intelligence in Medicine (Canada)","ror":"https://ror.org/05p590m36","country_code":"CA","type":"company","lineage":["https://openalex.org/I4210164862"]},{"id":"https://openalex.org/I25757504","display_name":"China University of Mining and Technology","ror":"https://ror.org/01xt2dr21","country_code":"CN","type":"education","lineage":["https://openalex.org/I25757504"]}],"countries":["CA","CN"],"is_corresponding":false,"raw_author_name":"Yanzi Miao","raw_affiliation_strings":["The Artificial Intelligence Research Institute,Department of Information and Control Engineering,China","University of Mining and Technology, Jiangsu, China","Department of Information and Control Engineering, The Artificial Intelligence Research Institute, China"],"affiliations":[{"raw_affiliation_string":"The Artificial Intelligence Research Institute,Department of Information and Control Engineering,China","institution_ids":["https://openalex.org/I4210164862","https://openalex.org/I4210100255"]},{"raw_affiliation_string":"University of Mining and Technology, Jiangsu, China","institution_ids":["https://openalex.org/I25757504"]},{"raw_affiliation_string":"Department of Information and Control Engineering, The Artificial Intelligence Research Institute, China","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5107772128","display_name":"Hesheng Wang","orcid":"https://orcid.org/0000-0002-9959-1634"},"institutions":[{"id":"https://openalex.org/I1327237609","display_name":"Ministry of Education of the People's Republic of China","ror":"https://ror.org/01mv9t934","country_code":"CN","type":"funder","lineage":["https://openalex.org/I1327237609","https://openalex.org/I4210127390"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]},{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hesheng Wang","raw_affiliation_strings":["Shanghai Jiao Tong University,Department of Automation, Institute of Medical Robotics, Key Laboratory of System Control and Information Processing of Ministry of Education, Key Laboratory of Marine Intelligent Equipment and System of Ministry of Education,Shanghai,China,200240","The Beijing Advanced Innovation Center for Intelligent Robots and Systems, Beijing Institute of Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,Department of Automation, Institute of Medical Robotics, Key Laboratory of System Control and Information Processing of Ministry of Education, Key Laboratory of Marine Intelligent Equipment and System of Ministry of Education,Shanghai,China,200240","institution_ids":["https://openalex.org/I1327237609","https://openalex.org/I183067930"]},{"raw_affiliation_string":"The Beijing Advanced Innovation Center for Intelligent Robots and Systems, Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5103022180"],"corresponding_institution_ids":["https://openalex.org/I25757504"],"apc_list":null,"apc_paid":null,"fwci":0.7392,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.74658972,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"70","issue":null,"first_page":"1974","last_page":"1979"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11500","display_name":"Evacuation and Crowd Dynamics","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8514143228530884},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7431583404541016},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.7121549844741821},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.627690315246582},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5716068744659424},{"id":"https://openalex.org/keywords/mobile-robot-navigation","display_name":"Mobile robot navigation","score":0.5209183096885681},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.5177444815635681},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.44814392924308777},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.44739049673080444},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.4135957956314087},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.3925105631351471},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3312230408191681},{"id":"https://openalex.org/keywords/collision","display_name":"Collision","score":0.31230446696281433},{"id":"https://openalex.org/keywords/robot-control","display_name":"Robot control","score":0.2601137161254883},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.06451603770256042}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8514143228530884},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7431583404541016},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.7121549844741821},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.627690315246582},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5716068744659424},{"id":"https://openalex.org/C26990112","wikidata":"https://www.wikidata.org/wiki/Q6887224","display_name":"Mobile robot navigation","level":5,"score":0.5209183096885681},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5177444815635681},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.44814392924308777},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.44739049673080444},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.4135957956314087},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.3925105631351471},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3312230408191681},{"id":"https://openalex.org/C121704057","wikidata":"https://www.wikidata.org/wiki/Q352070","display_name":"Collision","level":2,"score":0.31230446696281433},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.2601137161254883},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.06451603770256042},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/robio54168.2021.9739455","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio54168.2021.9739455","pdf_url":null,"source":{"id":"https://openalex.org/S4363607846","display_name":"2021 IEEE International Conference on Robotics and Biomimetics (ROBIO)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335769","display_name":"Graduate Research and Innovation Projects of Jiangsu Province","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null},{"id":"https://openalex.org/F4320337504","display_name":"Research and Development","ror":"https://ror.org/027s68j25"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W192919555","https://openalex.org/W1969622215","https://openalex.org/W2072195747","https://openalex.org/W2082585576","https://openalex.org/W2088604406","https://openalex.org/W2117211893","https://openalex.org/W2145339207","https://openalex.org/W2424778531","https://openalex.org/W2510353085","https://openalex.org/W2604216058","https://openalex.org/W2736601468","https://openalex.org/W2787938642","https://openalex.org/W2890001928","https://openalex.org/W2963001155","https://openalex.org/W2963809389","https://openalex.org/W2964319688","https://openalex.org/W2971426775","https://openalex.org/W3035096461","https://openalex.org/W3099342209","https://openalex.org/W3103340056","https://openalex.org/W3114484401","https://openalex.org/W3115017905","https://openalex.org/W3132959187","https://openalex.org/W3196760406","https://openalex.org/W3206650971","https://openalex.org/W6725558466","https://openalex.org/W6741002519","https://openalex.org/W6748839928","https://openalex.org/W6785613427","https://openalex.org/W6787712956","https://openalex.org/W6791018965"],"related_works":["https://openalex.org/W2742483371","https://openalex.org/W4381746183","https://openalex.org/W2930863966","https://openalex.org/W2157678966","https://openalex.org/W2126211886","https://openalex.org/W3153786280","https://openalex.org/W3127551068","https://openalex.org/W2165180011","https://openalex.org/W3165944253","https://openalex.org/W4220829754"],"abstract_inverted_index":{"For":[0],"the":[1,17,22,30,51,66,74,82,132,138,152],"scene":[2],"of":[3,68,92,110],"dense":[4,23,55],"crowd":[5,24],"flow":[6],"in":[7,41,54,99,141,162],"limited":[8],"space,":[9],"it":[10,45],"is":[11,62,114,127],"very":[12],"important":[13],"and":[14,27,94,135,143,158,164],"challenging":[15],"for":[16,50],"robot":[18,52,111,116],"to":[19,29,64],"walk":[20],"through":[21],"without":[25],"collision":[26],"move":[28],"destination":[31],"efficiently.":[32],"As":[33],"deep":[34],"reinforcement":[35,119],"learning":[36,84,120],"has":[37,155],"achieved":[38],"certain":[39],"results":[40,149],"human-aware":[42],"navigation":[43,53,97,139,160],"policies,":[44],"provides":[46],"a":[47,107],"feasible":[48],"solution":[49],"crowd.":[56],"But":[57],"current":[58],"environment":[59,124],"representation":[60,125],"method":[61,126],"difficult":[63],"represent":[65,89],"intention":[67],"human":[69,117],"movement,":[70],"which":[71,129],"causes":[72],"that":[73,113,151],"policy":[75],"network":[76],"cannot":[77],"make":[78],"forward-looking":[79],"decisions.":[80],"And":[81],"previous":[83],"model":[85,109,154],"could":[86],"not":[87],"effectively":[88,136],"any":[90],"number":[91],"pedestrians":[93],"maintain":[95],"stable":[96],"capability":[98],"unfamiliar":[100,142,165],"environment.":[101,146,166],"In":[102],"this":[103],"study,":[104],"we":[105],"propose":[106],"novel":[108],"navigation,":[112],"called":[115],"interaction":[118,134],"(RHIRL).":[121],"A":[122],"new":[123],"proposed":[128,153],"implicitly":[130],"includes":[131],"potential":[133],"improves":[137],"ability":[140],"dynamic":[144,163],"interactive":[145],"The":[147],"experiment":[148],"show":[150],"obvious":[156],"advantages":[157],"excellent":[159],"performance":[161]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
