{"id":"https://openalex.org/W4405786968","doi":"https://doi.org/10.1109/iros58592.2024.10802257","title":"Local Path Planning among Pushable Objects based on Reinforcement Learning","display_name":"Local Path Planning among Pushable Objects based on Reinforcement Learning","publication_year":2024,"publication_date":"2024-10-14","ids":{"openalex":"https://openalex.org/W4405786968","doi":"https://doi.org/10.1109/iros58592.2024.10802257"},"language":"en","primary_location":{"id":"doi:10.1109/iros58592.2024.10802257","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10802257","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://discovery.ucl.ac.uk/id/eprint/10203740/1/2303.02407v3.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070259803","display_name":"Linghong Yao","orcid":null},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Linghong Yao","raw_affiliation_strings":["University College London,Department of Computer Science and Mechanical Engineering,London,UK,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,Department of Computer Science and Mechanical Engineering,London,UK,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091705160","display_name":"Valerio Modugno","orcid":"https://orcid.org/0000-0002-5177-428X"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Valerio Modugno","raw_affiliation_strings":["University College London,Department of Computer Science and Mechanical Engineering,London,UK,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,Department of Computer Science and Mechanical Engineering,London,UK,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093900200","display_name":"Andromachi Maria Delfaki","orcid":null},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Andromachi Maria Delfaki","raw_affiliation_strings":["University College London,Department of Computer Science and Mechanical Engineering,London,UK,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,Department of Computer Science and Mechanical Engineering,London,UK,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079073545","display_name":"Yuanchang Liu","orcid":"https://orcid.org/0000-0001-9306-297X"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Yuanchang Liu","raw_affiliation_strings":["University College London,Department of Computer Science and Mechanical Engineering,London,UK,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,Department of Computer Science and Mechanical Engineering,London,UK,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077630267","display_name":"Danail Stoyanov","orcid":"https://orcid.org/0000-0002-0980-3227"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Danail Stoyanov","raw_affiliation_strings":["University College London,Department of Computer Science and Mechanical Engineering,London,UK,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,Department of Computer Science and Mechanical Engineering,London,UK,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048122691","display_name":"Dimitrios Kanoulas","orcid":"https://orcid.org/0000-0002-3684-1472"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Dimitrios Kanoulas","raw_affiliation_strings":["University College London,Department of Computer Science and Mechanical Engineering,London,UK,WC1E 6BT"],"affiliations":[{"raw_affiliation_string":"University College London,Department of Computer Science and Mechanical Engineering,London,UK,WC1E 6BT","institution_ids":["https://openalex.org/I45129253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5070259803"],"corresponding_institution_ids":["https://openalex.org/I45129253"],"apc_list":null,"apc_paid":null,"fwci":0.4935,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.67401231,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"3062","last_page":"3068"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9667999744415283,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.9247000217437744,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8237394690513611},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6661447882652283},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.6554544568061829},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.532896876335144},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4430188536643982},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4138278365135193},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3243967294692993},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.16320085525512695},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.15881285071372986},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.0869816243648529},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.08587083220481873}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8237394690513611},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6661447882652283},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.6554544568061829},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.532896876335144},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4430188536643982},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4138278365135193},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3243967294692993},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.16320085525512695},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.15881285071372986},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0869816243648529},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.08587083220481873}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/iros58592.2024.10802257","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros58592.2024.10802257","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10203740","is_oa":true,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10203740/","pdf_url":"https://discovery.ucl.ac.uk/id/eprint/10203740/1/2303.02407v3.pdf","source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"In:  2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS).  (pp. pp. 3062-3068).  IEEE: Abu Dhabi, United Arab Emirates. (2024)","raw_type":"Proceedings paper"}],"best_oa_location":{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10203740","is_oa":true,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10203740/","pdf_url":"https://discovery.ucl.ac.uk/id/eprint/10203740/1/2303.02407v3.pdf","source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"In:  2024 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS).  (pp. pp. 3062-3068).  IEEE: Abu Dhabi, United Arab Emirates. (2024)","raw_type":"Proceedings paper"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1737217355","display_name":null,"funder_award_id":"EP/P012841/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4405786968.pdf","grobid_xml":"https://content.openalex.org/works/W4405786968.grobid-xml"},"referenced_works_count":31,"referenced_works":["https://openalex.org/W1008966784","https://openalex.org/W1593316755","https://openalex.org/W1601397300","https://openalex.org/W1969483458","https://openalex.org/W1983855471","https://openalex.org/W2017146873","https://openalex.org/W2044725657","https://openalex.org/W2145339207","https://openalex.org/W2340238674","https://openalex.org/W2566555774","https://openalex.org/W2986717012","https://openalex.org/W2997051667","https://openalex.org/W2998903229","https://openalex.org/W3090386798","https://openalex.org/W4205160626","https://openalex.org/W4240202985","https://openalex.org/W4312770775","https://openalex.org/W4313478341","https://openalex.org/W4322730824","https://openalex.org/W4363649156","https://openalex.org/W4367839715","https://openalex.org/W4386066287","https://openalex.org/W4390906619","https://openalex.org/W6631190155","https://openalex.org/W6636831713","https://openalex.org/W6687681856","https://openalex.org/W6692846177","https://openalex.org/W6741002519","https://openalex.org/W6754629161","https://openalex.org/W6780127695","https://openalex.org/W6800004206"],"related_works":["https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W2920061524","https://openalex.org/W2359600231","https://openalex.org/W2380019117","https://openalex.org/W3138952546","https://openalex.org/W1987886368","https://openalex.org/W1660309994","https://openalex.org/W2369187583","https://openalex.org/W3197207153"],"abstract_inverted_index":{"In":[0,24],"this":[1,108],"paper,":[2],"we":[3,26,104],"introduce":[4],"a":[5,32,43],"method":[6,86],"to":[7,54,63,67,91,96,118],"tackle":[8,76],"the":[9,85,93,120,129],"problem":[10,21],"of":[11],"robot":[12],"local":[13,77],"path":[14,78],"planning":[15,79],"among":[16],"pushable":[17],"objects":[18],"\u2013an":[19],"open":[20],"in":[22,31,57,70,80,87,100,132],"robotics.":[23],"particular,":[25],"simultaneously":[27],"train":[28],"multiple":[29],"agents":[30,53],"physics-based":[33],"simulation":[34],"environment,":[35],"utilizing":[36],"an":[37,111],"Advantage":[38],"Actor-Critic":[39],"algorithm":[40],"coupled":[41],"with":[42,125],"deep":[44],"neural":[45],"network.":[46],"The":[47],"developed":[48],"online":[49],"policy":[50,109],"enables":[51],"these":[52],"push":[55],"obstacles":[56],"ways":[58],"that":[59],"are":[60],"not":[61],"limited":[62],"axial":[64],"alignments,":[65],"adapt":[66],"unforeseen":[68],"changes":[69],"obstacle":[71],"dynamics":[72],"instantaneously,":[73],"and":[74,122,128],"effectively":[75],"confined":[81],"areas.":[82],"We":[83],"tested":[84],"various":[88,97],"simulated":[89],"environments":[90],"prove":[92],"adaptation":[94],"effectiveness":[95],"unseen":[98],"scenarios":[99],"unfamiliar":[101],"settings.":[102],"Moreover,":[103],"have":[105],"successfully":[106],"applied":[107],"on":[110],"actual":[112],"quadruped":[113],"robot,":[114],"confirming":[115],"its":[116],"capability":[117],"handle":[119],"unpredictability":[121],"noise":[123],"associated":[124],"real-world":[126],"sensors":[127],"inherent":[130],"uncertainties":[131],"unexplored":[133],"object-pushing":[134],"tasks.":[135]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
