{"id":"https://openalex.org/W4391306093","doi":"https://doi.org/10.1109/rose60297.2023.10410776","title":"An Online Model-Free Reinforcement Learning Approach for 6-DOF Robot Manipulators","display_name":"An Online Model-Free Reinforcement Learning Approach for 6-DOF Robot Manipulators","publication_year":2023,"publication_date":"2023-11-06","ids":{"openalex":"https://openalex.org/W4391306093","doi":"https://doi.org/10.1109/rose60297.2023.10410776"},"language":"en","primary_location":{"id":"doi:10.1109/rose60297.2023.10410776","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/rose60297.2023.10410776","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Symposium on Robotic and Sensors Environments (ROSE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093809829","display_name":"Zeyad Hosny","orcid":null},"institutions":[{"id":"https://openalex.org/I153718931","display_name":"University of Ottawa","ror":"https://ror.org/03c4mmv16","country_code":"CA","type":"education","lineage":["https://openalex.org/I153718931"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Zeyad Hosny","raw_affiliation_strings":["University of Ottawa,School of Electrical Engineering and Computer Science,Ottawa,ON, K1N6N5,Canada","School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, K1N6N5, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Ottawa,School of Electrical Engineering and Computer Science,Ottawa,ON, K1N6N5,Canada","institution_ids":["https://openalex.org/I153718931"]},{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, K1N6N5, Canada","institution_ids":["https://openalex.org/I153718931"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059434364","display_name":"Abdullah Nassar","orcid":null},"institutions":[{"id":"https://openalex.org/I153718931","display_name":"University of Ottawa","ror":"https://ror.org/03c4mmv16","country_code":"CA","type":"education","lineage":["https://openalex.org/I153718931"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Abdullah Nassar","raw_affiliation_strings":["University of Ottawa,School of Electrical Engineering and Computer Science,Ottawa,ON, K1N6N5,Canada","School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, K1N6N5, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Ottawa,School of Electrical Engineering and Computer Science,Ottawa,ON, K1N6N5,Canada","institution_ids":["https://openalex.org/I153718931"]},{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, K1N6N5, Canada","institution_ids":["https://openalex.org/I153718931"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093809830","display_name":"Ahmed AboElyazeed","orcid":null},"institutions":[{"id":"https://openalex.org/I153718931","display_name":"University of Ottawa","ror":"https://ror.org/03c4mmv16","country_code":"CA","type":"education","lineage":["https://openalex.org/I153718931"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Ahmed AboElyazeed","raw_affiliation_strings":["University of Ottawa,School of Electrical Engineering and Computer Science,Ottawa,ON, K1N6N5,Canada","School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, K1N6N5, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Ottawa,School of Electrical Engineering and Computer Science,Ottawa,ON, K1N6N5,Canada","institution_ids":["https://openalex.org/I153718931"]},{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, K1N6N5, Canada","institution_ids":["https://openalex.org/I153718931"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109195846","display_name":"Mahmoud Mohamed","orcid":null},"institutions":[{"id":"https://openalex.org/I153718931","display_name":"University of Ottawa","ror":"https://ror.org/03c4mmv16","country_code":"CA","type":"education","lineage":["https://openalex.org/I153718931"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Mahmoud Mohamed","raw_affiliation_strings":["University of Ottawa,School of Electrical Engineering and Computer Science,Ottawa,ON, K1N6N5,Canada","School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, K1N6N5, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Ottawa,School of Electrical Engineering and Computer Science,Ottawa,ON, K1N6N5,Canada","institution_ids":["https://openalex.org/I153718931"]},{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, K1N6N5, Canada","institution_ids":["https://openalex.org/I153718931"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045456375","display_name":"Mohammed Abouheaf","orcid":"https://orcid.org/0000-0002-6130-9015"},"institutions":[{"id":"https://openalex.org/I157417397","display_name":"Bowling Green State University","ror":"https://ror.org/00ay7va13","country_code":"US","type":"education","lineage":["https://openalex.org/I157417397"]},{"id":"https://openalex.org/I153718931","display_name":"University of Ottawa","ror":"https://ror.org/03c4mmv16","country_code":"CA","type":"education","lineage":["https://openalex.org/I153718931"]}],"countries":["CA","US"],"is_corresponding":false,"raw_author_name":"Mohammed Abouheaf","raw_affiliation_strings":["University of Ottawa,School of Electrical Engineering and Computer Science,Ottawa,ON, K1N6N5,Canada","Robotics Engineering, Bowling Green State University, Bowling Green, 43402 OH, USA","School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, K1N6N5, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Ottawa,School of Electrical Engineering and Computer Science,Ottawa,ON, K1N6N5,Canada","institution_ids":["https://openalex.org/I153718931"]},{"raw_affiliation_string":"Robotics Engineering, Bowling Green State University, Bowling Green, 43402 OH, USA","institution_ids":["https://openalex.org/I157417397"]},{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, K1N6N5, Canada","institution_ids":["https://openalex.org/I153718931"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036560577","display_name":"Wail Gueaieb","orcid":"https://orcid.org/0000-0001-6490-4648"},"institutions":[{"id":"https://openalex.org/I153718931","display_name":"University of Ottawa","ror":"https://ror.org/03c4mmv16","country_code":"CA","type":"education","lineage":["https://openalex.org/I153718931"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Wail Gueaieb","raw_affiliation_strings":["University of Ottawa,School of Electrical Engineering and Computer Science,Ottawa,ON, K1N6N5,Canada","School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, K1N6N5, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Ottawa,School of Electrical Engineering and Computer Science,Ottawa,ON, K1N6N5,Canada","institution_ids":["https://openalex.org/I153718931"]},{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, University of Ottawa, Ottawa, ON, K1N6N5, Canada","institution_ids":["https://openalex.org/I153718931"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5093809829"],"corresponding_institution_ids":["https://openalex.org/I153718931"],"apc_list":null,"apc_paid":null,"fwci":0.3887,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.67913832,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"120","issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11372","display_name":"Hydraulic and Pneumatic Systems","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11749","display_name":"Iterative Learning Control Systems","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7556539177894592},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6975034475326538},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.6128890514373779},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.5667558312416077},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5661225318908691},{"id":"https://openalex.org/keywords/adaptive-control","display_name":"Adaptive control","score":0.4797435998916626},{"id":"https://openalex.org/keywords/matlab","display_name":"MATLAB","score":0.4702146351337433},{"id":"https://openalex.org/keywords/robot-manipulator","display_name":"Robot manipulator","score":0.4448433816432953},{"id":"https://openalex.org/keywords/tracking-error","display_name":"Tracking error","score":0.43781906366348267},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.42446672916412354},{"id":"https://openalex.org/keywords/degrees-of-freedom","display_name":"Degrees of freedom (physics and chemistry)","score":0.41797709465026855},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.39163723587989807},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.3867324888706207},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2927206754684448},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15164437890052795},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11120253801345825}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7556539177894592},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6975034475326538},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.6128890514373779},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.5667558312416077},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5661225318908691},{"id":"https://openalex.org/C107464732","wikidata":"https://www.wikidata.org/wiki/Q235781","display_name":"Adaptive control","level":3,"score":0.4797435998916626},{"id":"https://openalex.org/C2780365114","wikidata":"https://www.wikidata.org/wiki/Q169478","display_name":"MATLAB","level":2,"score":0.4702146351337433},{"id":"https://openalex.org/C2985527887","wikidata":"https://www.wikidata.org/wiki/Q1587588","display_name":"Robot manipulator","level":3,"score":0.4448433816432953},{"id":"https://openalex.org/C183356978","wikidata":"https://www.wikidata.org/wiki/Q1779213","display_name":"Tracking error","level":3,"score":0.43781906366348267},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.42446672916412354},{"id":"https://openalex.org/C208081375","wikidata":"https://www.wikidata.org/wiki/Q274502","display_name":"Degrees of freedom (physics and chemistry)","level":2,"score":0.41797709465026855},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.39163723587989807},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3867324888706207},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2927206754684448},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15164437890052795},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11120253801345825},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/rose60297.2023.10410776","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/rose60297.2023.10410776","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Symposium on Robotic and Sensors Environments (ROSE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W1487127700","https://openalex.org/W1583895361","https://openalex.org/W1986253301","https://openalex.org/W1987304268","https://openalex.org/W1997014929","https://openalex.org/W2036619160","https://openalex.org/W2039354440","https://openalex.org/W2048017417","https://openalex.org/W2075841074","https://openalex.org/W2079737074","https://openalex.org/W2086977346","https://openalex.org/W2093244306","https://openalex.org/W2124267516","https://openalex.org/W2141781870","https://openalex.org/W2166783325","https://openalex.org/W2216547738","https://openalex.org/W2318763906","https://openalex.org/W2366070612","https://openalex.org/W2585713293","https://openalex.org/W2862626627","https://openalex.org/W2897010625","https://openalex.org/W2899438223","https://openalex.org/W2967190068","https://openalex.org/W2967692091","https://openalex.org/W2979612126","https://openalex.org/W2980804356","https://openalex.org/W2999810890","https://openalex.org/W3150565301","https://openalex.org/W3156359084","https://openalex.org/W4200395703","https://openalex.org/W4213251304","https://openalex.org/W4214717370","https://openalex.org/W4225133385","https://openalex.org/W4242310606","https://openalex.org/W4250606304","https://openalex.org/W4324137886"],"related_works":["https://openalex.org/W2567520115","https://openalex.org/W1545539801","https://openalex.org/W2567391447","https://openalex.org/W2080408381","https://openalex.org/W1925083093","https://openalex.org/W2344226335","https://openalex.org/W4280596088","https://openalex.org/W2055801945","https://openalex.org/W2148178391","https://openalex.org/W2139526495"],"abstract_inverted_index":{"Controlling":[0],"6":[1,40],"Degrees-of-Freedom":[2],"(DoF)":[3],"robotic":[4,43,195],"manipulators":[5],"in":[6,119,212],"an":[7,61,164],"online,":[8],"model-free":[9,32,132],"manner":[10],"poses":[11],"significant":[12],"challenges":[13],"due":[14],"to":[15,23,80,88,129,142,158,189],"their":[16],"complex":[17],"coupling,":[18],"non-linearities,":[19],"and":[20,73],"the":[21,51,58,78,86,101,115,144,160,170,191,194,198,206,215,219,225],"need":[22,87],"account":[24],"for":[25,35,60],"unmodeled":[26],"dynamics.":[27,53],"This":[28,124],"paper":[29],"introduces":[30],"a":[31,39,109,120,131,136,154,177],"adaptive":[33,165],"approach":[34,139],"real-time":[36],"control":[37,63,75,133],"of":[38,50,95,104,193,214,218],"DoF":[41],"\u201cEPSON\u201d":[42],"manipulator,":[44],"without":[45,85],"requiring":[46],"any":[47],"prior":[48],"knowledge":[49],"manipulator\u2019s":[52],"Initially,":[54],"we":[55],"lay":[56],"out":[57],"framework":[59],"optimal":[62],"solution.":[64],"A":[65,181],"performance":[66,116],"index":[67],"is":[68,98,140,174,187],"introduced,":[69],"leveraging":[70],"error":[71,83,91,96,105],"dynamics":[72,84,97],"correction":[74],"signals,":[76],"offering":[77],"capability":[79],"incorporate":[81],"high-order":[82],"explicitly":[89],"derive":[90],"trajectories.":[92],"The":[93],"order":[94],"determined":[99],"by":[100,152],"chosen":[102],"number":[103],"samples.":[106],"We":[107],"assume":[108],"kernel-based":[110],"solution":[111],"structure":[112],"aligning":[113],"with":[114],"index,":[117],"resulting":[118],"temporal":[121],"difference":[122],"equation.":[123],"equation":[125],"can":[126],"be":[127],"optimized":[128],"formulate":[130],"strategy.":[134,146],"Subsequently,":[135],"reinforcement":[137],"learning":[138],"adopted":[141],"approximate":[143],"underlying":[145],"Infeasible":[147],"exact":[148],"solutions":[149],"are":[150],"overcome":[151],"employing":[153],"value":[155],"iteration":[156],"mechanism":[157],"adapt":[159],"actor-critic":[161],"structures":[162],"within":[163],"critics":[166],"framework.":[167],"To":[168],"validate":[169],"proposed":[171,207],"approach,":[172],"it":[173],"compared":[175],"against":[176],"conventional":[178,226],"proportional-integral":[179],"controller.":[180],"Unified":[182],"Robot":[183],"Description":[184],"Format":[185],"file":[186],"generated":[188],"facilitate":[190],"import":[192],"manipulator":[196],"into":[197],"MATLAB":[199],"Simulink":[200],"environment,":[201],"enabling":[202],"its":[203,222],"control.":[204],"Ultimately,":[205],"method":[208],"yields":[209],"superior":[210],"results":[211],"terms":[213],"dynamic":[216],"characteristics":[217],"response,":[220],"demonstrating":[221],"effectiveness":[223],"over":[224],"approach.":[227]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-29T09:16:38.111599","created_date":"2025-10-10T00:00:00"}
