{"id":"https://openalex.org/W2999889331","doi":"https://doi.org/10.1109/ro-man46459.2019.8956364","title":"Extending Policy from One-Shot Learning through Coaching","display_name":"Extending Policy from One-Shot Learning through Coaching","publication_year":2019,"publication_date":"2019-10-01","ids":{"openalex":"https://openalex.org/W2999889331","doi":"https://doi.org/10.1109/ro-man46459.2019.8956364","mag":"2999889331"},"language":"en","primary_location":{"id":"doi:10.1109/ro-man46459.2019.8956364","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ro-man46459.2019.8956364","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 28th IEEE International Conference on Robot and Human Interactive Communication (RO-MAN)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002799619","display_name":"Mythra V. Balakuntala","orcid":"https://orcid.org/0000-0003-2551-4780"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mythra V. Balakuntala","raw_affiliation_strings":["Purdue University,School of Engineering Technology,IN,USA,47907","School of Engineering Technology, Purdue University, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University,School of Engineering Technology,IN,USA,47907","institution_ids":["https://openalex.org/I219193219"]},{"raw_affiliation_string":"School of Engineering Technology, Purdue University, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029213933","display_name":"Vishnunandan L. N. Venkatesh","orcid":null},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vishnunandan L. N. Venkatesh","raw_affiliation_strings":["Purdue University,School of Engineering Technology,IN,USA,47907","School of Engineering Technology, Purdue University, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University,School of Engineering Technology,IN,USA,47907","institution_ids":["https://openalex.org/I219193219"]},{"raw_affiliation_string":"School of Engineering Technology, Purdue University, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083898330","display_name":"Jyothsna Padmakumar Bindu","orcid":null},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jyothsna Padmakumar Bindu","raw_affiliation_strings":["Purdue University,School of Engineering Technology,IN,USA,47907","School of Engineering Technology, Purdue University, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University,School of Engineering Technology,IN,USA,47907","institution_ids":["https://openalex.org/I219193219"]},{"raw_affiliation_string":"School of Engineering Technology, Purdue University, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013960389","display_name":"Richard M. Voyles","orcid":"https://orcid.org/0000-0002-1871-9887"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Richard M. Voyles","raw_affiliation_strings":["Purdue University,School of Engineering Technology,IN,USA,47907","School of Engineering Technology, Purdue University, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University,School of Engineering Technology,IN,USA,47907","institution_ids":["https://openalex.org/I219193219"]},{"raw_affiliation_string":"School of Engineering Technology, Purdue University, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5072528523","display_name":"Juan Wachs","orcid":"https://orcid.org/0000-0002-6425-5745"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Juan Wachs","raw_affiliation_strings":["Purdue University,School of Industrial Engineering,IN,USA,47907","School of Industrial Engineering, Purdue University, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University,School of Industrial Engineering,IN,USA,47907","institution_ids":["https://openalex.org/I219193219"]},{"raw_affiliation_string":"School of Industrial Engineering, Purdue University, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5002799619"],"corresponding_institution_ids":["https://openalex.org/I219193219"],"apc_list":null,"apc_paid":null,"fwci":0.3305305,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.61300422,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9671000242233276,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9671000242233276,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11299","display_name":"Problem and Project Based Learning","score":0.948199987411499,"subfield":{"id":"https://openalex.org/subfields/3304","display_name":"Education"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9473000168800354,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/coaching","display_name":"Coaching","score":0.8140037059783936},{"id":"https://openalex.org/keywords/shot","display_name":"Shot (pellet)","score":0.7390539646148682},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6052532196044922},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.24888202548027039},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.07140931487083435},{"id":"https://openalex.org/keywords/psychotherapist","display_name":"Psychotherapist","score":0.05294346809387207}],"concepts":[{"id":"https://openalex.org/C2779363792","wikidata":"https://www.wikidata.org/wiki/Q1104185","display_name":"Coaching","level":2,"score":0.8140037059783936},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.7390539646148682},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6052532196044922},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.24888202548027039},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.07140931487083435},{"id":"https://openalex.org/C542102704","wikidata":"https://www.wikidata.org/wiki/Q183257","display_name":"Psychotherapist","level":1,"score":0.05294346809387207},{"id":"https://openalex.org/C191897082","wikidata":"https://www.wikidata.org/wiki/Q11467","display_name":"Metallurgy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ro-man46459.2019.8956364","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ro-man46459.2019.8956364","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 28th IEEE International Conference on Robot and Human Interactive Communication (RO-MAN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W197704362","https://openalex.org/W1140834175","https://openalex.org/W1851340573","https://openalex.org/W1966197275","https://openalex.org/W1975491757","https://openalex.org/W1986014385","https://openalex.org/W1999874108","https://openalex.org/W2100235553","https://openalex.org/W2103254706","https://openalex.org/W2104171826","https://openalex.org/W2111781320","https://openalex.org/W2345221990","https://openalex.org/W2500624988","https://openalex.org/W2558161936","https://openalex.org/W2601322194","https://openalex.org/W2728976678","https://openalex.org/W2755546070","https://openalex.org/W2962732055","https://openalex.org/W2963094133","https://openalex.org/W4300110528","https://openalex.org/W6607978175","https://openalex.org/W6729985011","https://openalex.org/W6732417791","https://openalex.org/W6735944222","https://openalex.org/W6744181227"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W4214877189","https://openalex.org/W2074502265","https://openalex.org/W4249854088","https://openalex.org/W2746413784","https://openalex.org/W603502240","https://openalex.org/W2773965352","https://openalex.org/W656132696","https://openalex.org/W4232010708","https://openalex.org/W2748672977"],"abstract_inverted_index":{"Humans":[0],"generally":[1],"teach":[2],"their":[3,118],"fellow":[4],"collaborators":[5],"to":[6,67,83,90,108,125,138,187,192,200,208,210],"perform":[7],"tasks":[8,40,49,222],"through":[9,36,50,232],"a":[10,30,69,73,98,101,218,235],"small":[11],"number":[12],"of":[13,19,47,100,166,174,202,238],"demonstrations,":[14],"often":[15],"followed":[16],"by":[17,81],"episodes":[18],"coaching":[20,51,132,150,233],"that":[21],"tune":[22],"and":[23,43,120,140,149,168,183,226],"refine":[24,121],"the":[25,45,53,85,114,122,135,143,147,164,175,179,203,214],"execution":[26],"during":[27],"practice.":[28],"Adopting":[29],"similar":[31,191],"framework":[32,219],"for":[33,220],"teaching":[34,39],"robots":[35],"demonstrations":[37,66],"makes":[38],"highly":[41],"intuitive":[42],"imitating":[44],"refinement":[46],"complex":[48],"improves":[52],"efficacy.":[54],"Unlike":[55],"traditional":[56],"Learning":[57],"from":[58,77,87,223],"Demonstration":[59],"(LfD)":[60],"approaches":[61],"which":[62],"rely":[63],"on":[64],"multiple":[65],"train":[68],"task,":[70],"we":[71],"present":[72],"novel":[74],"one-shot":[75],"learning":[76,155,221],"demonstration":[78,93,225],"approach,":[79],"augmented":[80],"coaching,":[82],"transfer":[84],"task":[86,88,105,110,123,136,165],"expert":[89],"robot.":[91],"The":[92,158,172],"is":[94,161],"automatically":[95],"segmented":[96],"into":[97],"sequence":[99],"priori":[102],"skills":[103,116],"(the":[104],"policy)":[106],"parametrized":[107],"match":[109],"goals.":[111],"During":[112],"practice,":[113],"robotic":[115],"self-evaluate":[117],"performances":[119],"policy":[124,137],"locally":[126],"optimize":[127,142],"cumulative":[128],"performance.":[129,145,212],"Then,":[130],"human":[131,230],"further":[133],"refines":[134],"explore":[139],"globally":[141],"net":[144],"Both":[146],"self-evaluation":[148],"are":[151],"implemented":[152],"using":[153,163,206,229],"reinforcement":[154],"(RL)":[156],"methods.":[157],"proposed":[159,215],"approach":[160],"evaluated":[162],"scooping":[167,176,189],"unscooping":[169],"granular":[170],"media.":[171],"self-evaluator":[173],"skill":[177],"uses":[178],"realtime":[180],"force":[181,185],"signature":[182],"resistive":[184],"theory":[186],"minimize":[188],"resistance":[190],"how":[193],"humans":[194],"scoop.":[195],"Coaching":[196],"feedback":[197,231],"focuses":[198],"modifications":[199],"sub-domains":[201],"action":[204],"space,":[205],"RL":[207],"converge":[209],"desired":[211],"Thus,":[213],"method":[216],"provides":[217],"one":[224],"generalizing":[227],"it":[228],"achieving":[234],"success":[236],"rate":[237],"\u224890%.":[239]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
