{"id":"https://openalex.org/W2914170332","doi":"https://doi.org/10.1109/humanoids.2018.8624972","title":"User Feedback in Latent Space Robotic Skill Learning","display_name":"User Feedback in Latent Space Robotic Skill Learning","publication_year":2018,"publication_date":"2018-11-01","ids":{"openalex":"https://openalex.org/W2914170332","doi":"https://doi.org/10.1109/humanoids.2018.8624972","mag":"2914170332"},"language":"en","primary_location":{"id":"doi:10.1109/humanoids.2018.8624972","is_oa":false,"landing_page_url":"https://doi.org/10.1109/humanoids.2018.8624972","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE-RAS 18th International Conference on Humanoid Robots (Humanoids)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006565540","display_name":"Rok Pahi\u010d","orcid":"https://orcid.org/0000-0003-0985-9439"},"institutions":[{"id":"https://openalex.org/I4210113529","display_name":"Jo\u017eef Stefan International Postgraduate School","ror":"https://ror.org/01hdkb925","country_code":"SI","type":"education","lineage":["https://openalex.org/I4210113529"]}],"countries":["SI"],"is_corresponding":true,"raw_author_name":"Rok Pahic","raw_affiliation_strings":["Department of Automatics, Biocybernetics and Robotics, Jozef Stefan International Postgraduate School, jubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Department of Automatics, Biocybernetics and Robotics, Jozef Stefan International Postgraduate School, jubljana, Slovenia","institution_ids":["https://openalex.org/I4210113529"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083969934","display_name":"Zvezdan Lon\u010darevi\u0107","orcid":"https://orcid.org/0000-0002-1233-6949"},"institutions":[{"id":"https://openalex.org/I4210113529","display_name":"Jo\u017eef Stefan International Postgraduate School","ror":"https://ror.org/01hdkb925","country_code":"SI","type":"education","lineage":["https://openalex.org/I4210113529"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Zvezdan Loncarevic","raw_affiliation_strings":["Department of Automatics, Biocybernetics and Robotics, Jozef Stefan International Postgraduate School, jubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Department of Automatics, Biocybernetics and Robotics, Jozef Stefan International Postgraduate School, jubljana, Slovenia","institution_ids":["https://openalex.org/I4210113529"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019399129","display_name":"Ale\u0161 Ude","orcid":"https://orcid.org/0000-0003-3677-3972"},"institutions":[{"id":"https://openalex.org/I4210113529","display_name":"Jo\u017eef Stefan International Postgraduate School","ror":"https://ror.org/01hdkb925","country_code":"SI","type":"education","lineage":["https://openalex.org/I4210113529"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Ales Ude","raw_affiliation_strings":["Department of Automatics, Biocybernetics and Robotics, Jozef Stefan International Postgraduate School, jubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Department of Automatics, Biocybernetics and Robotics, Jozef Stefan International Postgraduate School, jubljana, Slovenia","institution_ids":["https://openalex.org/I4210113529"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020114289","display_name":"Bojan Nemec","orcid":"https://orcid.org/0000-0002-8728-7731"},"institutions":[{"id":"https://openalex.org/I4210113529","display_name":"Jo\u017eef Stefan International Postgraduate School","ror":"https://ror.org/01hdkb925","country_code":"SI","type":"education","lineage":["https://openalex.org/I4210113529"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Bojan Nemec","raw_affiliation_strings":["Department of Automatics, Biocybernetics and Robotics, Jozef Stefan International Postgraduate School, jubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Department of Automatics, Biocybernetics and Robotics, Jozef Stefan International Postgraduate School, jubljana, Slovenia","institution_ids":["https://openalex.org/I4210113529"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5028393702","display_name":"Andrej Gams","orcid":"https://orcid.org/0000-0002-9803-3593"},"institutions":[{"id":"https://openalex.org/I4210113529","display_name":"Jo\u017eef Stefan International Postgraduate School","ror":"https://ror.org/01hdkb925","country_code":"SI","type":"education","lineage":["https://openalex.org/I4210113529"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Andrej Gams","raw_affiliation_strings":["Department of Automatics, Biocybernetics and Robotics, Jozef Stefan International Postgraduate School, jubljana, Slovenia"],"affiliations":[{"raw_affiliation_string":"Department of Automatics, Biocybernetics and Robotics, Jozef Stefan International Postgraduate School, jubljana, Slovenia","institution_ids":["https://openalex.org/I4210113529"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5006565540"],"corresponding_institution_ids":["https://openalex.org/I4210113529"],"apc_list":null,"apc_paid":null,"fwci":0.7357,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.74037546,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"270","last_page":"276"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9779999852180481,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.7665795683860779},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7587025165557861},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7134407758712769},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6122207045555115},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.5609193444252014},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4942381680011749},{"id":"https://openalex.org/keywords/throwing","display_name":"Throwing","score":0.46782153844833374},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4537326693534851},{"id":"https://openalex.org/keywords/humanoid-robot","display_name":"Humanoid robot","score":0.43703216314315796},{"id":"https://openalex.org/keywords/human\u2013robot-interaction","display_name":"Human\u2013robot interaction","score":0.4140235483646393},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.4100792407989502},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.3264716863632202},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.13436630368232727}],"concepts":[{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.7665795683860779},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7587025165557861},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7134407758712769},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6122207045555115},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5609193444252014},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4942381680011749},{"id":"https://openalex.org/C207451115","wikidata":"https://www.wikidata.org/wiki/Q12898216","display_name":"Throwing","level":2,"score":0.46782153844833374},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4537326693534851},{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.43703216314315796},{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.4140235483646393},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.4100792407989502},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3264716863632202},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.13436630368232727},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/humanoids.2018.8624972","is_oa":false,"landing_page_url":"https://doi.org/10.1109/humanoids.2018.8624972","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 IEEE-RAS 18th International Conference on Humanoid Robots (Humanoids)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7300000190734863,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1130790960","https://openalex.org/W1506540549","https://openalex.org/W1566123042","https://openalex.org/W1579640618","https://openalex.org/W1894373409","https://openalex.org/W1964985369","https://openalex.org/W1977655452","https://openalex.org/W2012392077","https://openalex.org/W2012587148","https://openalex.org/W2016773334","https://openalex.org/W2022638737","https://openalex.org/W2061562262","https://openalex.org/W2085627234","https://openalex.org/W2104171826","https://openalex.org/W2120772693","https://openalex.org/W2136719407","https://openalex.org/W2156869222","https://openalex.org/W2166302491","https://openalex.org/W2213467466","https://openalex.org/W2545521674","https://openalex.org/W2567455162","https://openalex.org/W2569181534","https://openalex.org/W2626804490","https://openalex.org/W2735318784","https://openalex.org/W2766610320","https://openalex.org/W2807366678","https://openalex.org/W2963508354","https://openalex.org/W4321392130","https://openalex.org/W6630344866","https://openalex.org/W6634574864","https://openalex.org/W6653548176","https://openalex.org/W6729512192","https://openalex.org/W6739585900","https://openalex.org/W6843699536"],"related_works":["https://openalex.org/W4213225422","https://openalex.org/W3044458868","https://openalex.org/W1932558918","https://openalex.org/W1804325819","https://openalex.org/W2169547041","https://openalex.org/W2031129854","https://openalex.org/W4289656111","https://openalex.org/W2567271240","https://openalex.org/W4250304930","https://openalex.org/W2922457425"],"abstract_inverted_index":{"In":[0,102],"order":[1],"to":[2,12],"operate":[3],"in":[4,29,78,124],"everyday":[5,79],"human":[6,48],"environment,":[7],"humanoids":[8],"robots":[9],"will":[10],"need":[11],"autonomously":[13],"learn":[14],"and":[15],"adapt":[16],"their":[17,83],"actions,":[18],"using":[19,110],"among":[20],"other":[21],"reinforcement":[22],"learning":[23,56,123],"methods":[24],"(RL).":[25],"A":[26,40],"common":[27],"challenge":[28],"robotic":[30,76,117,150],"RL":[31,70,115,158],"is":[32],"also":[33,81],"the":[34,69,94,103,107,125],"generation":[35],"of":[36,43,75,90,109,116,132,139],"appropriate":[37],"reward":[38,113],"functions.":[39],"vast":[41],"body":[42],"literature":[44],"investigates":[45],"how":[46],"active":[47],"feedback":[49,64,92,148,162],"can":[50,65,86,163],"be":[51,66,164],"introduced":[52],"into":[53],"an":[54,120],"interactive":[55],"loop,":[57],"with":[58,119,143,159],"recent":[59],"publications":[60],"showing":[61],"that":[62,154],"user":[63,91,141,161],"used":[67],"for":[68,93,114,149,155,167],"reward.":[71],"However,":[72],"increased":[73],"complexity":[74],"skills":[77],"environment":[80],"increases":[82],"dimensionality,":[84],"which":[85],"practically":[87],"prevent":[88],"use":[89],"reward,":[95],"because":[96],"too":[97],"many":[98],"trials":[99],"are":[100],"needed.":[101],"paper":[104],"we":[105],"present":[106],"results":[108],"discretized,":[111],"user-assigned":[112],"throwing,":[118],"emphasis":[121],"on":[122],"feature":[126],"space,":[127],"i.":[128],"e.,":[129],"latent":[130],"space":[131],"a":[133,140],"deep":[134],"autoencoder":[135],"network.":[136],"Statistical":[137],"evaluation":[138],"study":[142],"15":[144],"participants,":[145],"who":[146],"provided":[147],"throwing":[151],"experiments,":[152],"show":[153],"certain":[156],"tasks,":[157],"discrete":[160],"effectively":[165],"applied":[166],"robot":[168],"learning.":[169]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
