{"id":"https://openalex.org/W4360897660","doi":"https://doi.org/10.1109/lra.2023.3261708","title":"Synergistic Task and Motion Planning With Reinforcement Learning-Based Non-Prehensile Actions","display_name":"Synergistic Task and Motion Planning With Reinforcement Learning-Based Non-Prehensile Actions","publication_year":2023,"publication_date":"2023-03-24","ids":{"openalex":"https://openalex.org/W4360897660","doi":"https://doi.org/10.1109/lra.2023.3261708"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2023.3261708","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2023.3261708","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026703570","display_name":"Gaoyuan Liu","orcid":"https://orcid.org/0000-0002-9063-2751"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]},{"id":"https://openalex.org/I4210114974","display_name":"IMEC","ror":"https://ror.org/02kcbn207","country_code":"BE","type":"nonprofit","lineage":["https://openalex.org/I4210114974"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Gaoyuan Liu","raw_affiliation_strings":["Brubotics, Vrije Universiteit Brussel, Brussels, Belgium","imec, Leuven, Belgium"],"affiliations":[{"raw_affiliation_string":"Brubotics, Vrije Universiteit Brussel, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]},{"raw_affiliation_string":"imec, Leuven, Belgium","institution_ids":["https://openalex.org/I4210114974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091185289","display_name":"Joris De Winter","orcid":"https://orcid.org/0000-0002-5818-7539"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]},{"id":"https://openalex.org/I4210116480","display_name":"Flanders Make (Belgium)","ror":"https://ror.org/02ndjfz59","country_code":"BE","type":"company","lineage":["https://openalex.org/I4210116480"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Joris de Winter","raw_affiliation_strings":["Brubotics, Vrije Universiteit Brussel, Brussels, Belgium","Flanders Make, Lommel, Belgium"],"affiliations":[{"raw_affiliation_string":"Brubotics, Vrije Universiteit Brussel, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]},{"raw_affiliation_string":"Flanders Make, Lommel, Belgium","institution_ids":["https://openalex.org/I4210116480"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067283098","display_name":"Denis Steckelmacher","orcid":"https://orcid.org/0000-0003-1521-8494"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Denis Steckelmacher","raw_affiliation_strings":["Artificial Intelligence (AI) Lab, Vrije Universiteit Brussel, Brussels, Belgium"],"affiliations":[{"raw_affiliation_string":"Artificial Intelligence (AI) Lab, Vrije Universiteit Brussel, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051172866","display_name":"Roshan Kumar Hota","orcid":"https://orcid.org/0000-0002-4008-9551"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]},{"id":"https://openalex.org/I4210116480","display_name":"Flanders Make (Belgium)","ror":"https://ror.org/02ndjfz59","country_code":"BE","type":"company","lineage":["https://openalex.org/I4210116480"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Roshan Kumar Hota","raw_affiliation_strings":["Brubotics, Vrije Universiteit Brussel, Brussels, Belgium","Flanders Make, Lommel, Belgium"],"affiliations":[{"raw_affiliation_string":"Brubotics, Vrije Universiteit Brussel, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]},{"raw_affiliation_string":"Flanders Make, Lommel, Belgium","institution_ids":["https://openalex.org/I4210116480"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064553018","display_name":"Ann Now\u00e9","orcid":"https://orcid.org/0000-0001-6346-4564"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Ann Nowe","raw_affiliation_strings":["Artificial Intelligence (AI) Lab, Vrije Universiteit Brussel, Brussels, Belgium"],"affiliations":[{"raw_affiliation_string":"Artificial Intelligence (AI) Lab, Vrije Universiteit Brussel, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010914606","display_name":"Bram Vanderborght","orcid":"https://orcid.org/0000-0003-4881-9341"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]},{"id":"https://openalex.org/I4210114974","display_name":"IMEC","ror":"https://ror.org/02kcbn207","country_code":"BE","type":"nonprofit","lineage":["https://openalex.org/I4210114974"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Bram Vanderborght","raw_affiliation_strings":["Brubotics, Vrije Universiteit Brussel, Brussels, Belgium","imec, Leuven, Belgium"],"affiliations":[{"raw_affiliation_string":"Brubotics, Vrije Universiteit Brussel, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]},{"raw_affiliation_string":"imec, Leuven, Belgium","institution_ids":["https://openalex.org/I4210114974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5026703570"],"corresponding_institution_ids":["https://openalex.org/I13469542","https://openalex.org/I4210114974"],"apc_list":null,"apc_paid":null,"fwci":2.1849,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.87207569,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"8","issue":"5","first_page":"2764","last_page":"2771"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/prehensile-tail","display_name":"Prehensile tail","score":0.752269446849823},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6325041055679321},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.6099260449409485},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.609390914440155},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6079047918319702},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5818939208984375},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3517712950706482},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.26227235794067383},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.14123386144638062},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.06429508328437805}],"concepts":[{"id":"https://openalex.org/C136380597","wikidata":"https://www.wikidata.org/wiki/Q10508905","display_name":"Prehensile tail","level":2,"score":0.752269446849823},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6325041055679321},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.6099260449409485},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.609390914440155},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6079047918319702},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5818939208984375},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3517712950706482},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.26227235794067383},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.14123386144638062},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.06429508328437805},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/lra.2023.3261708","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2023.3261708","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},{"id":"pmh:oai:vubissmart:VUBISSMART:2000:166505","is_oa":false,"landing_page_url":"https://biblio.vub.ac.be/vubir/synergistic-task-and-motion-planning-with-reinforcement-learningbased-nonprehensile-actions(5f77e0ca-cdaf-4889-a077-7bbad12d6bac).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306402573","display_name":"VUBIR (Vrije Universiteit Brussel)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I13469542","host_organization_name":"Vrije Universiteit Brussel","host_organization_lineage":["https://openalex.org/I13469542"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"publishedVersion"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1462399522","display_name":null,"funder_award_id":"101070596","funder_id":"https://openalex.org/F4320322725","funder_display_name":"China Scholarship Council"},{"id":"https://openalex.org/G2300736770","display_name":null,"funder_award_id":"(CSC)","funder_id":"https://openalex.org/F4320322725","funder_display_name":"China Scholarship Council"},{"id":"https://openalex.org/G4132985236","display_name":null,"funder_award_id":"unknown","funder_id":"https://openalex.org/F4320322725","funder_display_name":"China Scholarship Council"},{"id":"https://openalex.org/G8589651859","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320322725","funder_display_name":"China Scholarship Council"}],"funders":[{"id":"https://openalex.org/F4320322725","display_name":"China Scholarship Council","ror":"https://ror.org/04atp4p48"},{"id":"https://openalex.org/F4320327336","display_name":"Vlaamse regering","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W2145339207","https://openalex.org/W2161414194","https://openalex.org/W2412154694","https://openalex.org/W2561918466","https://openalex.org/W2735300570","https://openalex.org/W2736601468","https://openalex.org/W2786893837","https://openalex.org/W2794663059","https://openalex.org/W2904207885","https://openalex.org/W2945600613","https://openalex.org/W2962793652","https://openalex.org/W2984756091","https://openalex.org/W3001865277","https://openalex.org/W3004011906","https://openalex.org/W3008535267","https://openalex.org/W3021544315","https://openalex.org/W3039141704","https://openalex.org/W3086207594","https://openalex.org/W3098499184","https://openalex.org/W3101103779","https://openalex.org/W3103940950","https://openalex.org/W3135445321","https://openalex.org/W3150384095","https://openalex.org/W3176770340","https://openalex.org/W3189699967","https://openalex.org/W3201307163","https://openalex.org/W3215761265","https://openalex.org/W4221138457","https://openalex.org/W4221152092","https://openalex.org/W6741002519","https://openalex.org/W6752429892","https://openalex.org/W6780755086","https://openalex.org/W6810099856"],"related_works":["https://openalex.org/W2552641899","https://openalex.org/W2768832826","https://openalex.org/W2028231052","https://openalex.org/W2465876097","https://openalex.org/W3166169123","https://openalex.org/W2010045274","https://openalex.org/W2105329304","https://openalex.org/W197901881","https://openalex.org/W1551001629","https://openalex.org/W2998125923"],"abstract_inverted_index":{"Robotic":[0],"manipulation":[1],"in":[2,40,103,135],"cluttered":[3,41,130],"environments":[4],"requires":[5],"synergistic":[6],"planning":[7,124],"among":[8],"prehensile":[9],"and":[10,18,28,86,133,138],"non-prehensile":[11,68],"actions.":[12],"Previous":[13],"works":[14],"on":[15,128],"sampling-based":[16,59,94,157,161],"Task":[17],"Motion":[19],"Planning":[20],"(TAMP)":[21],"algorithms,":[22,60],"e.g.":[23],"PDDLStream,":[24],"provide":[25],"a":[26,63,129],"fast":[27],"generalizable":[29],"solution":[30],"for":[31],"multi-modal":[32],"manipulation.":[33],"However,":[34],"they":[35],"are":[36],"likely":[37],"to":[38,114,118],"fail":[39],"scenarios":[42],"where":[43],"no":[44],"collision-free":[45],"grasping":[46,89],"approaches":[47],"can":[48,82,112,148,163],"be":[49],"sampled":[50],"without":[51],"preliminary":[52],"manipulations.":[53],"To":[54],"extend":[55],"the":[56,88,93,97,104,108,144,151,155,160,165],"ability":[57],"of":[58,154],"we":[61],"integrate":[62],"vision-based":[64],"Reinforcement":[65],"Learning":[66],"(RL)":[67],"procedure,":[69],"<italic":[70,79,109,145,166],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[71,80,110,146,167],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">pusher</i>":[72,81,111,147,168],".":[73],"The":[74,121],"pushing":[75,98,170],"actions":[76,99],"generated":[77],"by":[78,100],"eliminate":[83],"interlocked":[84],"situations":[85,116],"make":[87],"problem":[90,132],"solvable.":[91],"Also,":[92],"algorithm":[95,162],"evaluates":[96],"providing":[101],"rewards":[102],"training":[105],"process,":[106],"thus":[107],"learn":[113,169],"avoid":[115],"leading":[117],"irreversible":[119],"failures.":[120],"proposed":[122],"hybrid":[123],"method":[125],"is":[126],"validated":[127],"bin-picking":[131],"implemented":[134],"both":[136],"simulation":[137],"real":[139],"world.":[140],"Results":[141],"show":[142],"that":[143],"effectively":[149],"improve":[150],"success":[152],"ratio":[153],"previous":[156],"algorithm,":[158],"while":[159],"help":[164],"skills.":[171]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":2}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
