{"id":"https://openalex.org/W2151473317","doi":"https://doi.org/10.1109/robio.2010.5723346","title":"Fuzzy rule based neuro-dynamic programming for mobile robot skill acquisition on the basis of a nested multi-agent architecture","display_name":"Fuzzy rule based neuro-dynamic programming for mobile robot skill acquisition on the basis of a nested multi-agent architecture","publication_year":2010,"publication_date":"2010-12-01","ids":{"openalex":"https://openalex.org/W2151473317","doi":"https://doi.org/10.1109/robio.2010.5723346","mag":"2151473317"},"language":"en","primary_location":{"id":"doi:10.1109/robio.2010.5723346","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio.2010.5723346","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE International Conference on Robotics and Biomimetics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://doi.org/10.1109/ROBIO.2010.5723346","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5005907108","display_name":"John Karigiannis","orcid":"https://orcid.org/0009-0009-8921-1915"},"institutions":[{"id":"https://openalex.org/I174458059","display_name":"National Technical University of Athens","ror":"https://ror.org/03cx6bg69","country_code":"GR","type":"education","lineage":["https://openalex.org/I174458059"]}],"countries":["GR"],"is_corresponding":true,"raw_author_name":"John N. Karigiannis","raw_affiliation_strings":["School of Electrical & Computer Engineering, Division of Signals, Control & Robotics, National and Technical University of Athens, Athens, Greece"],"affiliations":[{"raw_affiliation_string":"School of Electrical & Computer Engineering, Division of Signals, Control & Robotics, National and Technical University of Athens, Athens, Greece","institution_ids":["https://openalex.org/I174458059"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002060759","display_name":"Theodoros Rekatsinas","orcid":"https://orcid.org/0000-0001-6148-1854"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Theodoros I. Rekatsinas","raw_affiliation_strings":["School of Computer Science, University of Maryland, College Park, MD, USA"],"affiliations":[{"raw_affiliation_string":"School of Computer Science, University of Maryland, College Park, MD, USA","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075518884","display_name":"Costas S. Tzafestas","orcid":"https://orcid.org/0000-0003-1545-9191"},"institutions":[{"id":"https://openalex.org/I174458059","display_name":"National Technical University of Athens","ror":"https://ror.org/03cx6bg69","country_code":"GR","type":"education","lineage":["https://openalex.org/I174458059"]}],"countries":["GR"],"is_corresponding":false,"raw_author_name":"Costas S. Tzafestas","raw_affiliation_strings":["School of Electrical & Computer Engineering, Division of Signals, Control & Robotics, National and Technical University of Athens, Athens, Greece"],"affiliations":[{"raw_affiliation_string":"School of Electrical & Computer Engineering, Division of Signals, Control & Robotics, National and Technical University of Athens, Athens, Greece","institution_ids":["https://openalex.org/I174458059"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5005907108"],"corresponding_institution_ids":["https://openalex.org/I174458059"],"apc_list":null,"apc_paid":null,"fwci":1.4562,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.86622526,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"8","issue":null,"first_page":"312","last_page":"319"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9857000112533569,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9846000075340271,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7297171354293823},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5752419829368591},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5619335174560547},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5390097498893738},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5284538269042969},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5067811608314514},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5064736604690552},{"id":"https://openalex.org/keywords/state-space","display_name":"State space","score":0.48016753792762756},{"id":"https://openalex.org/keywords/fuzzy-logic","display_name":"Fuzzy logic","score":0.4733550548553467},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.46127888560295105},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.4452117681503296},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.42336535453796387},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.41697168350219727},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.37362849712371826},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.10560867190361023}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7297171354293823},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5752419829368591},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5619335174560547},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5390097498893738},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5284538269042969},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5067811608314514},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5064736604690552},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.48016753792762756},{"id":"https://openalex.org/C58166","wikidata":"https://www.wikidata.org/wiki/Q224821","display_name":"Fuzzy logic","level":2,"score":0.4733550548553467},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.46127888560295105},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.4452117681503296},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.42336535453796387},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.41697168350219727},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.37362849712371826},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.10560867190361023},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/robio.2010.5723346","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio.2010.5723346","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE International Conference on Robotics and Biomimetics","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.401.3835","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.401.3835","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://www.cs.umd.edu/~thodrek/Hier_NDP_Arch.pdf","raw_type":"text"},{"id":"pmh:oai:dspace.lib.ntua.gr:123456789/32864","is_oa":true,"landing_page_url":"http://doi.org/10.1109/ROBIO.2010.5723346","pdf_url":null,"source":{"id":"https://openalex.org/S4377196837","display_name":"DSpace - NTUA (National Technical University of Athens)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I174458059","host_organization_name":"National Technical University of Athens","host_organization_lineage":["https://openalex.org/I174458059"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2010 IEEE International Conference on Robotics and Biomimetics, ROBIO 2010","raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":{"id":"pmh:oai:dspace.lib.ntua.gr:123456789/32864","is_oa":true,"landing_page_url":"http://doi.org/10.1109/ROBIO.2010.5723346","pdf_url":null,"source":{"id":"https://openalex.org/S4377196837","display_name":"DSpace - NTUA (National Technical University of Athens)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I174458059","host_organization_name":"National Technical University of Athens","host_organization_lineage":["https://openalex.org/I174458059"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2010 IEEE International Conference on Robotics and Biomimetics, ROBIO 2010","raw_type":"info:eu-repo/semantics/conferenceObject"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W60031785","https://openalex.org/W69147663","https://openalex.org/W1510918013","https://openalex.org/W1510931001","https://openalex.org/W1512746852","https://openalex.org/W1523677668","https://openalex.org/W1576452626","https://openalex.org/W1591461724","https://openalex.org/W1602614133","https://openalex.org/W1985348117","https://openalex.org/W1987864653","https://openalex.org/W2030248743","https://openalex.org/W2042106485","https://openalex.org/W2045463255","https://openalex.org/W2075268401","https://openalex.org/W2086519765","https://openalex.org/W2097856935","https://openalex.org/W2100644648","https://openalex.org/W2104602264","https://openalex.org/W2115536129","https://openalex.org/W2118318536","https://openalex.org/W2121863487","https://openalex.org/W2134269720","https://openalex.org/W2146698718","https://openalex.org/W2154144276","https://openalex.org/W2160113664","https://openalex.org/W2162850206","https://openalex.org/W2544716473","https://openalex.org/W3011120880","https://openalex.org/W4205326910","https://openalex.org/W4214717370","https://openalex.org/W6602467702","https://openalex.org/W6631449650","https://openalex.org/W6637971370","https://openalex.org/W6674885835","https://openalex.org/W6675811377","https://openalex.org/W6677834374","https://openalex.org/W6775686901","https://openalex.org/W7028697565"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W4225571923","https://openalex.org/W3212257828","https://openalex.org/W4297873223","https://openalex.org/W2350784623","https://openalex.org/W2126211886"],"abstract_inverted_index":{"Biologically":[0],"inspired":[1,295],"architectures":[2],"that":[3,15,141,204,238],"mimic":[4],"the":[5,18,27,44,93,103,132,139,155,159,166,184,213,218,221,229,235,250,266,274,290],"organizational":[6],"structure":[7],"of":[8,20,46,61,111,117,168,220,228,292],"living":[9],"organisms":[10],"and":[11,39,148,216],"in":[12,43,80,97,120,165,186,247,258],"general":[13],"frameworks":[14],"will":[16],"improve":[17],"design":[19],"intelligent":[21,254],"robots":[22,172,185,231],"attract":[23],"significant":[24],"attention":[25],"from":[26],"research":[28],"community.":[29],"Self-organization":[30],"problems,":[31],"intrinsic":[32],"behaviors":[33],"as":[34,36,234,271,273],"well":[35,272],"effective":[37],"learning":[38,64,75],"skill":[40,63],"transfer":[41],"processes":[42],"context":[45],"robotic":[47],"systems":[48],"have":[49,239],"been":[50],"significantly":[51],"investigated":[52],"by":[53,66,145],"researchers.":[54],"Our":[55,256],"work":[56],"presents":[57],"a":[58,68,81,88,98,109,121,174,194,197,279],"new":[59],"framework":[60,162],"developmental":[62],"process":[65],"introducing":[67],"hierarchical":[69,268,280],"nested":[70],"multi-agent":[71,104,269,281],"architecture.":[72],"A":[73],"neuro-dynamic":[74],"mechanism":[76],"employing":[77],"function":[78],"approximators":[79],"fuzzified":[82],"state-space":[83],"is":[84,163,223,262,283],"utilized,":[85],"leading":[86],"to":[87,106,114,135,188,196,240,252,263,285],"collaborative":[89,175],"control":[90,276,291],"scheme":[91],"among":[92],"distributed":[94],"agents":[95,130,237],"engaged":[96],"continuous":[99,118],"space,":[100],"which":[101],"enables":[102],"system":[105,133],"learn,":[107],"over":[108,138,245],"period":[110],"time,":[112,246],"how":[113],"perform":[115,144],"sequences":[116],"actions":[119],"cooperative":[122,243],"manner":[123],"without":[124],"any":[125],"prior":[126],"task":[127,140,179],"model.":[128],"The":[129,225],"comprising":[131],"manage":[134],"gain":[136],"experience":[137],"they":[142],"collaboratively":[143],"continuously":[146],"exploring":[147],"exploiting":[149],"their":[150],"state-to-action":[151],"mapping":[152],"space.":[153],"For":[154],"specific":[156],"problem":[157],"setting,":[158],"proposed":[160,267],"theoretical":[161],"employed":[164],"case":[167],"two":[169,214],"simulated":[170],"e-Puck":[171],"performing":[173],"box-pushing":[176],"task.":[177],"This":[178],"involves":[180],"active":[181],"cooperation":[182],"between":[183],"order":[187,248],"jointly":[189],"push":[190],"an":[191],"object":[192,222],"on":[193],"plane":[195],"specified":[198,211],"goal":[199,257],"location.":[200],"We":[201],"should":[202],"note":[203],"1)":[205],"there":[206],"are":[207,232],"no":[208],"contact":[209],"points":[210],"for":[212,249,289],"e-Pucks":[215],"2)":[217],"shape":[219],"indifferent.":[224],"actuated":[226],"wheels":[227],"mobile":[230],"considered":[233],"independent":[236],"build":[241],"up":[242],"skills":[244],"robot":[251,296],"demonstrate":[253],"behavior.":[255],"this":[259],"experimental":[260],"study":[261],"evaluate":[264],"both":[265],"architecture,":[270],"methodological":[275],"framework.":[277],"Such":[278],"approach":[282],"envisioned":[284],"be":[286],"highly":[287],"scalable":[288],"complex":[293],"biologically":[294],"locomotion":[297],"systems.":[298]},"counts_by_year":[{"year":2015,"cited_by_count":1},{"year":2012,"cited_by_count":2}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
