{"id":"https://openalex.org/W4390099862","doi":"https://doi.org/10.1109/robio58561.2023.10355042","title":"Spatio-Temporal Transformer-Based Reinforcement Learning for Robot Crowd Navigation","display_name":"Spatio-Temporal Transformer-Based Reinforcement Learning for Robot Crowd Navigation","publication_year":2023,"publication_date":"2023-12-04","ids":{"openalex":"https://openalex.org/W4390099862","doi":"https://doi.org/10.1109/robio58561.2023.10355042"},"language":"en","primary_location":{"id":"doi:10.1109/robio58561.2023.10355042","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio58561.2023.10355042","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101311780","display_name":"Haodong He","orcid":"https://orcid.org/0000-0002-4837-4066"},"institutions":[{"id":"https://openalex.org/I43922553","display_name":"Wuhan University of Science and Technology","ror":"https://ror.org/00e4hrk88","country_code":"CN","type":"education","lineage":["https://openalex.org/I43922553"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haodong He","raw_affiliation_strings":["Wuhan University of Science and Technology,School of Computer Science and Technology","School of Computer Science and Technology, Wuhan University of Science and Technology","Hubei Province Key Laboratory of Intelligent Information Processing and Real-Time Industrial System, Wuhan, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Wuhan University of Science and Technology,School of Computer Science and Technology","institution_ids":["https://openalex.org/I43922553"]},{"raw_affiliation_string":"School of Computer Science and Technology, Wuhan University of Science and Technology","institution_ids":["https://openalex.org/I43922553"]},{"raw_affiliation_string":"Hubei Province Key Laboratory of Intelligent Information Processing and Real-Time Industrial System, Wuhan, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100604058","display_name":"Hao Fu","orcid":"https://orcid.org/0000-0002-9028-1728"},"institutions":[{"id":"https://openalex.org/I43922553","display_name":"Wuhan University of Science and Technology","ror":"https://ror.org/00e4hrk88","country_code":"CN","type":"education","lineage":["https://openalex.org/I43922553"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Fu","raw_affiliation_strings":["Wuhan University of Science and Technology,School of Computer Science and Technology","School of Computer Science and Technology, Wuhan University of Science and Technology","Hubei Province Key Laboratory of Intelligent Information Processing and Real-Time Industrial System, Wuhan, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Wuhan University of Science and Technology,School of Computer Science and Technology","institution_ids":["https://openalex.org/I43922553"]},{"raw_affiliation_string":"School of Computer Science and Technology, Wuhan University of Science and Technology","institution_ids":["https://openalex.org/I43922553"]},{"raw_affiliation_string":"Hubei Province Key Laboratory of Intelligent Information Processing and Real-Time Industrial System, Wuhan, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100766021","display_name":"Qiang Wang","orcid":"https://orcid.org/0000-0001-7420-8646"},"institutions":[{"id":"https://openalex.org/I43922553","display_name":"Wuhan University of Science and Technology","ror":"https://ror.org/00e4hrk88","country_code":"CN","type":"education","lineage":["https://openalex.org/I43922553"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiang Wang","raw_affiliation_strings":["Wuhan University of Science and Technology,School of Computer Science and Technology","Hubei Province Key Laboratory of Intelligent Information Processing and Real-Time Industrial System, Wuhan, China","School of Computer Science and Technology, Wuhan University of Science and Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Wuhan University of Science and Technology,School of Computer Science and Technology","institution_ids":["https://openalex.org/I43922553"]},{"raw_affiliation_string":"Hubei Province Key Laboratory of Intelligent Information Processing and Real-Time Industrial System, Wuhan, China","institution_ids":[]},{"raw_affiliation_string":"School of Computer Science and Technology, Wuhan University of Science and Technology","institution_ids":["https://openalex.org/I43922553"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100730526","display_name":"Shuai Zhou","orcid":"https://orcid.org/0000-0003-3450-076X"},"institutions":[{"id":"https://openalex.org/I43922553","display_name":"Wuhan University of Science and Technology","ror":"https://ror.org/00e4hrk88","country_code":"CN","type":"education","lineage":["https://openalex.org/I43922553"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuai Zhou","raw_affiliation_strings":["Wuhan University of Science and Technology,School of Computer Science and Technology","Hubei Province Key Laboratory of Intelligent Information Processing and Real-Time Industrial System, Wuhan, China","School of Computer Science and Technology, Wuhan University of Science and Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Wuhan University of Science and Technology,School of Computer Science and Technology","institution_ids":["https://openalex.org/I43922553"]},{"raw_affiliation_string":"Hubei Province Key Laboratory of Intelligent Information Processing and Real-Time Industrial System, Wuhan, China","institution_ids":[]},{"raw_affiliation_string":"School of Computer Science and Technology, Wuhan University of Science and Technology","institution_ids":["https://openalex.org/I43922553"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048396330","display_name":"Wei Liu","orcid":"https://orcid.org/0009-0007-2411-0852"},"institutions":[{"id":"https://openalex.org/I43922553","display_name":"Wuhan University of Science and Technology","ror":"https://ror.org/00e4hrk88","country_code":"CN","type":"education","lineage":["https://openalex.org/I43922553"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Liu","raw_affiliation_strings":["Wuhan University of Science and Technology,School of Computer Science and Technology","Hubei Province Key Laboratory of Intelligent Information Processing and Real-Time Industrial System, Wuhan, China","School of Computer Science and Technology, Wuhan University of Science and Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Wuhan University of Science and Technology,School of Computer Science and Technology","institution_ids":["https://openalex.org/I43922553"]},{"raw_affiliation_string":"Hubei Province Key Laboratory of Intelligent Information Processing and Real-Time Industrial System, Wuhan, China","institution_ids":[]},{"raw_affiliation_string":"School of Computer Science and Technology, Wuhan University of Science and Technology","institution_ids":["https://openalex.org/I43922553"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059256963","display_name":"Chen Yang","orcid":"https://orcid.org/0000-0002-3863-5832"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang Chen","raw_affiliation_strings":["Engineering Research Center for Metallurgical Automation and Measurement Technology of Ministry of Education,Wuhan,China,430081"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Engineering Research Center for Metallurgical Automation and Measurement Technology of Ministry of Education,Wuhan,China,430081","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.7363,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.71115603,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11500","display_name":"Evacuation and Crowd Dynamics","score":0.9843999743461609,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11500","display_name":"Evacuation and Crowd Dynamics","score":0.9843999743461609,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9552000164985657,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9434000253677368,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7017021179199219},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6578800082206726},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.643121600151062},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6125052571296692},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6118676662445068},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5911420583724976},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5729070901870728},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.5141122937202454},{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.47718989849090576},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.43887537717819214},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3862200677394867},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3371754288673401},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.16311734914779663}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7017021179199219},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6578800082206726},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.643121600151062},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6125052571296692},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6118676662445068},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5911420583724976},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5729070901870728},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.5141122937202454},{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.47718989849090576},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.43887537717819214},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3862200677394867},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3371754288673401},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.16311734914779663},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/robio58561.2023.10355042","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio58561.2023.10355042","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.7900000214576721}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320324116","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W192919555","https://openalex.org/W1963985276","https://openalex.org/W2072195747","https://openalex.org/W2142943472","https://openalex.org/W2558776914","https://openalex.org/W2565402511","https://openalex.org/W2612690371","https://openalex.org/W2748490912","https://openalex.org/W2890001928","https://openalex.org/W2904246096","https://openalex.org/W2963165299","https://openalex.org/W2963809389","https://openalex.org/W2964319688","https://openalex.org/W3005857605","https://openalex.org/W3152777725","https://openalex.org/W3174022889","https://openalex.org/W3205400264","https://openalex.org/W4220721274","https://openalex.org/W4221024508","https://openalex.org/W4226239849","https://openalex.org/W4292255390","https://openalex.org/W4313004671","https://openalex.org/W4313644253","https://openalex.org/W4315472473","https://openalex.org/W6739901393","https://openalex.org/W6757592117"],"related_works":["https://openalex.org/W2468279273","https://openalex.org/W2354198838","https://openalex.org/W1989130879","https://openalex.org/W2103419012","https://openalex.org/W2988126442","https://openalex.org/W1974414866","https://openalex.org/W2063982682","https://openalex.org/W2338543196","https://openalex.org/W1544691147","https://openalex.org/W2768698792"],"abstract_inverted_index":{"Ensuring":[0],"robots":[1],"can":[2],"move":[3],"safely":[4],"and":[5,35,53,92,128],"adhere":[6],"to":[7,32,43,73,87,107],"social":[8],"norms":[9],"in":[10,46],"dynamic":[11],"human":[12],"environments":[13],"is":[14,85,105],"a":[15,67,81,123],"crucial":[16],"step":[17],"towards":[18],"robot":[19],"autonomous":[20],"decision-making.":[21],"In":[22,60],"existing":[23],"work,":[24],"double":[25],"serial":[26],"separate":[27],"modules":[28],"are":[29],"generally":[30],"used":[31],"capture":[33],"spatial":[34,91],"temporal":[36,93],"interactions,":[37],"respectively.":[38],"However,":[39],"such":[40],"methods":[41],"lead":[42],"extra":[44],"difficulties":[45],"improving":[47],"the":[48,55,77,90,100,109,114,118,134,142,145,149],"utilization":[49],"of":[50,57,62,116,125,136,144],"spatio-temporal":[51,110,126],"features":[52],"reducing":[54],"conservatism":[56,135],"navigation":[58,120,137],"policy.":[59,121],"light":[61],"this,":[63],"this":[64],"paper":[65],"proposes":[66],"spatiotemporal":[68],"transformer-based":[69],"policy":[70,130],"optimization":[71],"algorithm":[72,147],"more":[74],"effectively":[75,88],"preserve":[76],"human-robot":[78],"interactions.":[79],"Specifically,":[80],"gated":[82],"embedding":[83],"mechanism":[84],"introduced":[86],"fuses":[89],"representations":[94],"by":[95],"integrating":[96],"both":[97],"modalities":[98],"at":[99],"feature":[101],"level.":[102],"Then":[103],"Transformer":[104,127],"leveraged":[106],"encode":[108],"semantic":[111],"information,":[112],"with":[113],"hope":[115],"finding":[117],"optimal":[119],"Finally,":[122],"combination":[124],"self-adjusting":[129],"entropy":[131],"significantly":[132],"reduce":[133],"policies.":[138],"Experimental":[139],"results":[140],"demonstrate":[141],"priority":[143],"proposed":[146],"over":[148],"state-of-the-art":[150],"methods.":[151]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
