{"id":"https://openalex.org/W2963177351","doi":"https://doi.org/10.1109/inista.2019.8778209","title":"An Implementation of Vision Based Deep Reinforcement Learning for Humanoid Robot Locomotion","display_name":"An Implementation of Vision Based Deep Reinforcement Learning for Humanoid Robot Locomotion","publication_year":2019,"publication_date":"2019-07-01","ids":{"openalex":"https://openalex.org/W2963177351","doi":"https://doi.org/10.1109/inista.2019.8778209","mag":"2963177351"},"language":"en","primary_location":{"id":"doi:10.1109/inista.2019.8778209","is_oa":false,"landing_page_url":"https://doi.org/10.1109/inista.2019.8778209","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Symposium on INnovations in Intelligent SysTems and Applications (INISTA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069238876","display_name":"Recen Ozaln","orcid":null},"institutions":[{"id":"https://openalex.org/I143396566","display_name":"F\u0131rat University","ror":"https://ror.org/05teb7b63","country_code":"TR","type":"education","lineage":["https://openalex.org/I143396566"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Recen Ozaln","raw_affiliation_strings":["Department of Mechatronics Engineering, Firat University, Elazig, Turkey"],"affiliations":[{"raw_affiliation_string":"Department of Mechatronics Engineering, Firat University, Elazig, Turkey","institution_ids":["https://openalex.org/I143396566"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025953014","display_name":"\u00c7a\u011fr\u0131 Kaymak","orcid":"https://orcid.org/0000-0001-5343-226X"},"institutions":[{"id":"https://openalex.org/I143396566","display_name":"F\u0131rat University","ror":"https://ror.org/05teb7b63","country_code":"TR","type":"education","lineage":["https://openalex.org/I143396566"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Cagri Kaymak","raw_affiliation_strings":["Department of Mechatronics Engineering, Firat University, Elazig, Turkey"],"affiliations":[{"raw_affiliation_string":"Department of Mechatronics Engineering, Firat University, Elazig, Turkey","institution_ids":["https://openalex.org/I143396566"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052630551","display_name":"Ozal Yildirum","orcid":null},"institutions":[{"id":"https://openalex.org/I64925351","display_name":"Munzur University","ror":"https://ror.org/05v0p1f11","country_code":"TR","type":"education","lineage":["https://openalex.org/I64925351"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Ozal Yildirum","raw_affiliation_strings":["Department of Computer Engineering, Muznur University, Tunceli, Turkey"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Muznur University, Tunceli, Turkey","institution_ids":["https://openalex.org/I64925351"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109431489","display_name":"Ayscgul Ucar","orcid":null},"institutions":[{"id":"https://openalex.org/I143396566","display_name":"F\u0131rat University","ror":"https://ror.org/05teb7b63","country_code":"TR","type":"education","lineage":["https://openalex.org/I143396566"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Ayscgul Ucar","raw_affiliation_strings":["Department of Mechatronics Engineering, Firat University, Elazig, Turkey"],"affiliations":[{"raw_affiliation_string":"Department of Mechatronics Engineering, Firat University, Elazig, Turkey","institution_ids":["https://openalex.org/I143396566"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102706549","display_name":"Yakup Demir","orcid":"https://orcid.org/0000-0001-9530-5824"},"institutions":[{"id":"https://openalex.org/I143396566","display_name":"F\u0131rat University","ror":"https://ror.org/05teb7b63","country_code":"TR","type":"education","lineage":["https://openalex.org/I143396566"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Yakup Demir","raw_affiliation_strings":["Department of Electrical and Electronics Engineering, Firat University, Elazig, Turkey"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Electronics Engineering, Firat University, Elazig, Turkey","institution_ids":["https://openalex.org/I143396566"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5063349801","display_name":"C\u00fcneyt G\u00fczel\u0456\u0219","orcid":"https://orcid.org/0000-0001-5416-368X"},"institutions":[{"id":"https://openalex.org/I59944920","display_name":"Ya\u015far University","ror":"https://ror.org/00dz1eb96","country_code":"TR","type":"education","lineage":["https://openalex.org/I59944920"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Cuneyt Guzelis","raw_affiliation_strings":["Department of Electrical and Electronics Engineering, Yasar University, Izmir, Turkey"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Electronics Engineering, Yasar University, Izmir, Turkey","institution_ids":["https://openalex.org/I59944920"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5069238876"],"corresponding_institution_ids":["https://openalex.org/I143396566"],"apc_list":null,"apc_paid":null,"fwci":0.6847,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.67363045,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10879","display_name":"Robotic Locomotion and Control","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9839000105857849,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/humanoid-robot","display_name":"Humanoid robot","score":0.8712553977966309},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8370212316513062},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.668088972568512},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6335005760192871},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5502500534057617},{"id":"https://openalex.org/keywords/gyroscope","display_name":"Gyroscope","score":0.4968312084674835},{"id":"https://openalex.org/keywords/robot-locomotion","display_name":"Robot locomotion","score":0.4817773997783661},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.46259230375289917},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3956920802593231},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.3248950242996216},{"id":"https://openalex.org/keywords/robot-control","display_name":"Robot control","score":0.29072320461273193},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.18156445026397705}],"concepts":[{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.8712553977966309},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8370212316513062},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.668088972568512},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6335005760192871},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5502500534057617},{"id":"https://openalex.org/C158488048","wikidata":"https://www.wikidata.org/wiki/Q483400","display_name":"Gyroscope","level":2,"score":0.4968312084674835},{"id":"https://openalex.org/C6101204","wikidata":"https://www.wikidata.org/wiki/Q7353391","display_name":"Robot locomotion","level":5,"score":0.4817773997783661},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.46259230375289917},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3956920802593231},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.3248950242996216},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.29072320461273193},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.18156445026397705},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/inista.2019.8778209","is_oa":false,"landing_page_url":"https://doi.org/10.1109/inista.2019.8778209","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE International Symposium on INnovations in Intelligent SysTems and Applications (INISTA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"},{"id":"https://openalex.org/F4320322626","display_name":"T\u00fcrkiye Bilimsel ve Teknolojik Ara\u015ft\u0131rma Kurumu","ror":"https://ror.org/04w9kkr77"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W1974610117","https://openalex.org/W2002554707","https://openalex.org/W2010363098","https://openalex.org/W2014824949","https://openalex.org/W2037729465","https://openalex.org/W2121615981","https://openalex.org/W2121863487","https://openalex.org/W2145339207","https://openalex.org/W2155007355","https://openalex.org/W2155968351","https://openalex.org/W2173564293","https://openalex.org/W2257979135","https://openalex.org/W2342662072","https://openalex.org/W2460299708","https://openalex.org/W2522025381","https://openalex.org/W2527027039","https://openalex.org/W2546975091","https://openalex.org/W2604216058","https://openalex.org/W2726187156","https://openalex.org/W2732319713","https://openalex.org/W2739330054","https://openalex.org/W2746553466","https://openalex.org/W2800843584","https://openalex.org/W2810565864","https://openalex.org/W2811406095","https://openalex.org/W2884400617","https://openalex.org/W2888235455","https://openalex.org/W2891051118","https://openalex.org/W2913346307","https://openalex.org/W2924656332","https://openalex.org/W2951799221","https://openalex.org/W2951941324","https://openalex.org/W2962759351","https://openalex.org/W2963184939","https://openalex.org/W2963544079","https://openalex.org/W2963641140","https://openalex.org/W2963780790","https://openalex.org/W2963841023","https://openalex.org/W2964161785","https://openalex.org/W2982564889","https://openalex.org/W4214717370","https://openalex.org/W4247290769","https://openalex.org/W4300892751","https://openalex.org/W6682849425","https://openalex.org/W6704571135","https://openalex.org/W6740402285","https://openalex.org/W6752922040"],"related_works":["https://openalex.org/W1889129279","https://openalex.org/W4387451989","https://openalex.org/W2532412374","https://openalex.org/W2745063183","https://openalex.org/W2063137106","https://openalex.org/W2358715846","https://openalex.org/W3180160681","https://openalex.org/W1567230752","https://openalex.org/W1600238263","https://openalex.org/W2805865429"],"abstract_inverted_index":{"Deep":[0,94],"reinforcement":[1,53,103],"learning":[2,54,104],"(DRL)":[3],"exhibits":[4],"a":[5,48,79,100,116],"promising":[6],"approach":[7],"for":[8,56,64],"controlling":[9],"humanoid":[10,62,76],"robot":[11,63,77],"locomotion.":[12],"However,":[13],"only":[14],"values":[15],"relating":[16],"sensors":[17],"such":[18],"as":[19],"IMU,":[20],"gyroscope,":[21],"and":[22,93,133,136,153],"GPS":[23],"are":[24,99],"not":[25],"sufficient":[26],"robots":[27],"to":[28,38,146],"learn":[29],"their":[30],"locomotion":[31,58,74,117,132],"skills.":[32],"In":[33,68],"this":[34],"article,":[35],"we":[36,71],"aim":[37],"show":[39,122],"the":[40,57,60,65,73,83,108,137,149],"success":[41],"of":[42,59,75,102,110],"vision":[43,50,111,138],"based":[44,51,112,139],"DRL.":[45],"We":[46,86,106],"propose":[47],"new":[49],"deep":[52],"algorithm":[55,114],"Robotis-op2":[61],"first":[66],"time.":[67],"experimental":[69,120],"setup,":[70],"construct":[72],"in":[78,82,129],"specific":[80],"environment":[81],"Webots":[84],"software.":[85],"use":[87,147],"Double":[88],"Dueling":[89],"Q":[90,95],"Networks":[91,96],"(D3QN)":[92],"(DQN)":[97],"that":[98,123,130],"kind":[101],"algorithm.":[105],"present":[107],"performance":[109],"DRL":[113,140],"on":[115],"experiment.":[118],"The":[119],"results":[121],"D3QN":[124],"is":[125],"better":[126],"than":[127],"DQN":[128],"stable":[131],"fast":[134],"training":[135],"algorithms":[141],"will":[142],"be":[143],"successfully":[144],"able":[145],"at":[148],"other":[150],"complex":[151],"environments":[152],"applications.":[154]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2023,"cited_by_count":3},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":6}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
