{"id":"https://openalex.org/W4392981013","doi":"https://doi.org/10.1109/aics60730.2023.10470579","title":"Reinforcement Learning for Bio-Inspired Stochastic Robot Control","display_name":"Reinforcement Learning for Bio-Inspired Stochastic Robot Control","publication_year":2023,"publication_date":"2023-12-07","ids":{"openalex":"https://openalex.org/W4392981013","doi":"https://doi.org/10.1109/aics60730.2023.10470579"},"language":"en","primary_location":{"id":"doi:10.1109/aics60730.2023.10470579","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/aics60730.2023.10470579","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 31st Irish Conference on Artificial Intelligence and Cognitive Science (AICS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055838954","display_name":"James B. Gillespie","orcid":"https://orcid.org/0000-0003-2721-8854"},"institutions":[{"id":"https://openalex.org/I138801177","display_name":"University of Ulster","ror":"https://ror.org/01yp9g959","country_code":"GB","type":"education","lineage":["https://openalex.org/I138801177"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"James Gillespie","raw_affiliation_strings":["Intelligent Systems Research Centre, Ulster University,Northern Ireland, UK","Intelligent Systems Research Centre, Ulster University, Northern Ireland, UK"],"affiliations":[{"raw_affiliation_string":"Intelligent Systems Research Centre, Ulster University,Northern Ireland, UK","institution_ids":["https://openalex.org/I138801177"]},{"raw_affiliation_string":"Intelligent Systems Research Centre, Ulster University, Northern Ireland, UK","institution_ids":["https://openalex.org/I138801177"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074968710","display_name":"I\u00f1aki Ra\u00f1\u00f3","orcid":"https://orcid.org/0000-0002-0461-0258"},"institutions":[{"id":"https://openalex.org/I200284239","display_name":"Universidade de Santiago de Compostela","ror":"https://ror.org/030eybx10","country_code":"ES","type":"education","lineage":["https://openalex.org/I200284239"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"I\u00f1aki Ra\u00f1\u00f3","raw_affiliation_strings":["Intelligent Systems Group, University of Santiago de Compostela,Spain","Intelligent Systems Group, University of Santiago de Compostela, Spain"],"affiliations":[{"raw_affiliation_string":"Intelligent Systems Group, University of Santiago de Compostela,Spain","institution_ids":["https://openalex.org/I200284239"]},{"raw_affiliation_string":"Intelligent Systems Group, University of Santiago de Compostela, Spain","institution_ids":["https://openalex.org/I200284239"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037830755","display_name":"Jos\u00e9 Santos","orcid":"https://orcid.org/0000-0001-5604-1125"},"institutions":[{"id":"https://openalex.org/I138801177","display_name":"University of Ulster","ror":"https://ror.org/01yp9g959","country_code":"GB","type":"education","lineage":["https://openalex.org/I138801177"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Jos\u00e9 Santos","raw_affiliation_strings":["Pervasive Computing Research Centre, Ulster University,Northern Ireland, UK","Pervasive Computing Research Centre, Ulster University, Northern Ireland, UK"],"affiliations":[{"raw_affiliation_string":"Pervasive Computing Research Centre, Ulster University,Northern Ireland, UK","institution_ids":["https://openalex.org/I138801177"]},{"raw_affiliation_string":"Pervasive Computing Research Centre, Ulster University, Northern Ireland, UK","institution_ids":["https://openalex.org/I138801177"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012890130","display_name":"Nazmul Siddique","orcid":"https://orcid.org/0000-0002-0642-2357"},"institutions":[{"id":"https://openalex.org/I138801177","display_name":"University of Ulster","ror":"https://ror.org/01yp9g959","country_code":"GB","type":"education","lineage":["https://openalex.org/I138801177"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Nazmul Siddique","raw_affiliation_strings":["Intelligent Systems Research Centre, Ulster University,Northern Ireland, UK","Intelligent Systems Research Centre, Ulster University, Northern Ireland, UK"],"affiliations":[{"raw_affiliation_string":"Intelligent Systems Research Centre, Ulster University,Northern Ireland, UK","institution_ids":["https://openalex.org/I138801177"]},{"raw_affiliation_string":"Intelligent Systems Research Centre, Ulster University, Northern Ireland, UK","institution_ids":["https://openalex.org/I138801177"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5055838954"],"corresponding_institution_ids":["https://openalex.org/I138801177"],"apc_list":null,"apc_paid":null,"fwci":0.1748,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.60567742,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"abs/1412.6980","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.5498999953269958,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.5498999953269958,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7857065796852112},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6147544980049133},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5000979900360107},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4902983009815216}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7857065796852112},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6147544980049133},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5000979900360107},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4902983009815216}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/aics60730.2023.10470579","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/aics60730.2023.10470579","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 31st Irish Conference on Artificial Intelligence and Cognitive Science (AICS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1535977321","https://openalex.org/W1949804828","https://openalex.org/W1969019211","https://openalex.org/W1977655452","https://openalex.org/W1995837155","https://openalex.org/W2010818426","https://openalex.org/W2011777324","https://openalex.org/W2053211384","https://openalex.org/W2063282235","https://openalex.org/W2073360733","https://openalex.org/W2087751887","https://openalex.org/W2089496638","https://openalex.org/W2127107099","https://openalex.org/W2135376858","https://openalex.org/W2160239037","https://openalex.org/W2160638931","https://openalex.org/W2168945912","https://openalex.org/W2529601334","https://openalex.org/W2603249661","https://openalex.org/W2736558185","https://openalex.org/W3009018467","https://openalex.org/W4243206564","https://openalex.org/W6628861149","https://openalex.org/W6630825244","https://openalex.org/W6631190155"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4306904969","https://openalex.org/W2358668433","https://openalex.org/W2138720691","https://openalex.org/W2376932109","https://openalex.org/W4362501864","https://openalex.org/W2001405890","https://openalex.org/W4380318855","https://openalex.org/W2031695474"],"abstract_inverted_index":{"Braitenberg":[0,84,108],"vehicles":[1],"serve":[2],"as":[3,153],"bio-inspired":[4,88],"controllers":[5,24,82],"for":[6,83,107,130],"sensor-based":[7],"local":[8],"navigation":[9,49],"in":[10,15,93,128,176],"wheeled":[11],"robots,":[12],"finding":[13,26],"applications":[14],"various":[16],"real-world":[17,113],"scenarios.":[18],"Tuning":[19],"the":[20,42,46,67,103,122,125,138,150,163,168],"parameters":[21],"of":[22,90,105,124,162],"these":[23],"involves":[25],"nonlinear":[27],"functions":[28],"typically":[29],"implemented":[30],"through":[31,142,160],"neural":[32,62,81,139,170],"networks":[33],"that":[34],"link":[35],"sensing":[36],"to":[37,44,79,111,180],"motor":[38],"actions.":[39],"However,":[40],"tuning":[41],"weights":[43,68],"achieve":[45],"desired":[47],"closed-loop":[48],"behaviours":[50],"poses":[51],"significant":[52],"challenges.":[53],"Some":[54],"approaches":[55],"use":[56],"hand":[57],"tuned":[58],"spiking":[59],"or":[60],"recurrent":[61],"networks,":[63],"while":[64],"others":[65],"learn":[66,80],"using":[69,149],"evolutionary":[70],"approaches.":[71],"Recently,":[72],"Reinforcement":[73],"Learning":[74],"has":[75],"been":[76],"successfully":[77],"used":[78],"vehicle":[85],"3a,":[86],"a":[87,112,145,173],"model":[89],"target":[91],"seeking":[92],"simulated":[94],"scenarios":[95],"with":[96],"high":[97],"noise":[98,119],"levels.":[99],"This":[100],"paper":[101],"extends":[102],"application":[104],"RL":[106,126,143],"Vehicle":[109],"control":[110],"robot":[114,165],"platform,":[115],"introducing":[116],"real":[117,164],"sensor":[118],"and":[120,144],"testing":[121],"adaptability":[123],"framework":[127],"attenuating":[129],"this":[131],"uncertainty.":[132],"Comparative":[133],"analyses":[134],"are":[135,158],"drawn":[136],"between":[137],"controller":[140,171],"acquired":[141],"simplistic":[146],"hand-tuned":[147,183],"counterpart":[148],"Colias":[151],"micro-robot":[152],"an":[154,181],"evaluation":[155],"tool.":[156],"Results":[157],"illustrated":[159],"analysis":[161],"trajectories,":[166],"where":[167],"RL-based":[169],"exhibits":[172],"32.5%":[174],"increase":[175],"successful":[177],"trajectories":[178],"compared":[179],"empirical":[182],"controller.":[184]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-25T23:11:45.687758","created_date":"2025-10-10T00:00:00"}
