{"id":"https://openalex.org/W2950125763","doi":"https://doi.org/10.1109/icarsc.2019.8733632","title":"Learning low level skills from scratch for humanoid robot soccer using deep reinforcement learning","display_name":"Learning low level skills from scratch for humanoid robot soccer using deep reinforcement learning","publication_year":2019,"publication_date":"2019-04-01","ids":{"openalex":"https://openalex.org/W2950125763","doi":"https://doi.org/10.1109/icarsc.2019.8733632","mag":"2950125763"},"language":"en","primary_location":{"id":"doi:10.1109/icarsc.2019.8733632","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icarsc.2019.8733632","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Autonomous Robot Systems and Competitions (ICARSC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057161810","display_name":"Miguel Abreu","orcid":"https://orcid.org/0000-0002-6342-2054"},"institutions":[{"id":"https://openalex.org/I182534213","display_name":"Universidade do Porto","ror":"https://ror.org/043pwc612","country_code":"PT","type":"education","lineage":["https://openalex.org/I182534213"]}],"countries":["PT"],"is_corresponding":true,"raw_author_name":"Miguel Abreu","raw_affiliation_strings":["Faculty of Engineering, University of Porto, Portugal"],"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, University of Porto, Portugal","institution_ids":["https://openalex.org/I182534213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055569781","display_name":"Nuno Lau","orcid":"https://orcid.org/0000-0003-0513-158X"},"institutions":[{"id":"https://openalex.org/I60858718","display_name":"University of Aveiro","ror":"https://ror.org/00nt41z93","country_code":"PT","type":"education","lineage":["https://openalex.org/I60858718"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Nuno Lau","raw_affiliation_strings":["DETI, University of Aveiro, Portugal"],"affiliations":[{"raw_affiliation_string":"DETI, University of Aveiro, Portugal","institution_ids":["https://openalex.org/I60858718"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057871059","display_name":"Armando Sousa","orcid":"https://orcid.org/0000-0002-0317-4714"},"institutions":[{"id":"https://openalex.org/I4210166615","display_name":"INESC TEC","ror":"https://ror.org/05fa8ka61","country_code":"PT","type":"nonprofit","lineage":["https://openalex.org/I4210125590","https://openalex.org/I4210166615"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Armando Sousa","raw_affiliation_strings":["Technology and Science, INESC TEC - Institute for Systems and Computer Engineering, Porto, Portugal"],"affiliations":[{"raw_affiliation_string":"Technology and Science, INESC TEC - Institute for Systems and Computer Engineering, Porto, Portugal","institution_ids":["https://openalex.org/I4210166615"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5089812166","display_name":"Lu\u00eds Paulo Reis","orcid":"https://orcid.org/0000-0002-4709-1718"},"institutions":[{"id":"https://openalex.org/I182534213","display_name":"Universidade do Porto","ror":"https://ror.org/043pwc612","country_code":"PT","type":"education","lineage":["https://openalex.org/I182534213"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Luis Paulo Reis","raw_affiliation_strings":["Faculty of Engineering, University of Porto, Portugal"],"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, University of Porto, Portugal","institution_ids":["https://openalex.org/I182534213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5057161810"],"corresponding_institution_ids":["https://openalex.org/I182534213"],"apc_list":null,"apc_paid":null,"fwci":1.9562,"has_fulltext":false,"cited_by_count":31,"citation_normalized_percentile":{"value":0.85335222,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11023","display_name":"Prosthetics and Rehabilitation Robotics","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7969545125961304},{"id":"https://openalex.org/keywords/humanoid-robot","display_name":"Humanoid robot","score":0.7644473314285278},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7620229125022888},{"id":"https://openalex.org/keywords/scratch","display_name":"Scratch","score":0.6147443652153015},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5876038670539856},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5127130746841431},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.5092929601669312},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3230500817298889}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7969545125961304},{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.7644473314285278},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7620229125022888},{"id":"https://openalex.org/C2781235140","wikidata":"https://www.wikidata.org/wiki/Q275131","display_name":"Scratch","level":2,"score":0.6147443652153015},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5876038670539856},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5127130746841431},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5092929601669312},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3230500817298889},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icarsc.2019.8733632","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icarsc.2019.8733632","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Conference on Autonomous Robot Systems and Competitions (ICARSC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W576027973","https://openalex.org/W1548782413","https://openalex.org/W1651888519","https://openalex.org/W2405827006","https://openalex.org/W2736601468","https://openalex.org/W2755575625","https://openalex.org/W2791877265","https://openalex.org/W2799745602","https://openalex.org/W2963637944","https://openalex.org/W4242923666","https://openalex.org/W4297810554","https://openalex.org/W6616434037","https://openalex.org/W6632815668","https://openalex.org/W6741002519","https://openalex.org/W6745190604"],"related_works":["https://openalex.org/W2475116013","https://openalex.org/W2066741154","https://openalex.org/W2770018148","https://openalex.org/W2358308169","https://openalex.org/W2385135707","https://openalex.org/W2140315382","https://openalex.org/W2059109728","https://openalex.org/W2082556335","https://openalex.org/W322691623","https://openalex.org/W1569471492"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,30],"algorithms":[2],"are":[3,23,154],"now":[4],"more":[5],"appealing":[6],"than":[7,146],"ever.":[8],"Recent":[9],"approaches":[10],"bring":[11],"power":[12],"and":[13,25,75,108,125,133,175],"tuning":[14],"simplicity":[15],"to":[16,56,68,82,87,100,111,129,157,165],"the":[17,26,46,77,84,147,171],"everyday":[18],"work":[19,168],"machine.":[20],"The":[21,136],"possibilities":[22],"endless,":[24],"idea":[27],"of":[28,173],"automating":[29],"without":[31,94],"domain":[32],"knowledge":[33],"is":[34,53,139],"quite":[35],"tempting":[36],"for":[37],"many":[38,65],"researchers.":[39],"However,":[40,151],"in":[41,140,160],"competitive":[42,161],"environments":[43,162],"such":[44,72],"as":[45,73],"RoboCup":[47,149,174],"3D":[48],"Soccer":[49],"Simulation":[50],"League,":[51],"there":[52],"a":[54,102],"lot":[55],"be":[57,158],"done":[58],"regarding":[59],"humanlike":[60],"behaviors.":[61,135],"Current":[62],"teams":[63],"use":[64,83,98],"mechanical":[66],"movements":[67],"perform":[69],"basic":[70],"skills,":[71,90],"running":[74,132],"dribbling":[76,134],"ball.":[78],"This":[79,167],"paper":[80],"aims":[81],"PPO":[85],"algorithm":[86],"optimize":[88],"those":[89],"achieving":[91],"natural":[92,131],"gaits":[93],"sacrificing":[95],"performance.":[96],"We":[97],"Simspark":[99],"simulate":[101],"NAO":[103],"humanoid":[104],"robot,":[105],"using":[106],"visual":[107],"body":[109],"sensors":[110],"control":[112,123],"its":[113],"actuators.":[114],"Based":[115],"on":[116],"our":[117],"results,":[118],"we":[119],"propose":[120],"an":[121],"indirect":[122],"approach":[124],"detailed":[126],"parameter":[127],"setups":[128],"obtain":[130],"obtained":[137],"performance":[138],"some":[141,152,176],"cases":[142],"comparable":[143],"or":[144],"better":[145],"top":[148],"teams.":[150],"skills":[153],"not":[155],"ready":[156],"applied":[159],"yet,":[163],"due":[164],"instability.":[166],"contributes":[169],"towards":[170],"improvement":[172],"related":[177],"technical":[178],"challenges.":[179]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":5},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
