{"id":"https://openalex.org/W2169481237","doi":"https://doi.org/10.1109/adprl.2009.4927544","title":"Integrating sporadic imitation in Reinforcement Learning robots","display_name":"Integrating sporadic imitation in Reinforcement Learning robots","publication_year":2009,"publication_date":"2009-03-01","ids":{"openalex":"https://openalex.org/W2169481237","doi":"https://doi.org/10.1109/adprl.2009.4927544","mag":"2169481237"},"language":"en","primary_location":{"id":"doi:10.1109/adprl.2009.4927544","is_oa":false,"landing_page_url":"https://doi.org/10.1109/adprl.2009.4927544","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE Symposium on Adaptive Dynamic Programming and Reinforcement Learning","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028877800","display_name":"Willi Richert","orcid":null},"institutions":[{"id":"https://openalex.org/I206945453","display_name":"Paderborn University","ror":"https://ror.org/058kzsd48","country_code":"DE","type":"education","lineage":["https://openalex.org/I206945453"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Willi Richert","raw_affiliation_strings":["Faculty of of Computer Science, Electrical Engineering and Mathematics, University of Paderborn, Paderborn, Germany"],"affiliations":[{"raw_affiliation_string":"Faculty of of Computer Science, Electrical Engineering and Mathematics, University of Paderborn, Paderborn, Germany","institution_ids":["https://openalex.org/I206945453"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046448027","display_name":"Ulrich Scheller","orcid":null},"institutions":[{"id":"https://openalex.org/I206945453","display_name":"Paderborn University","ror":"https://ror.org/058kzsd48","country_code":"DE","type":"education","lineage":["https://openalex.org/I206945453"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Ulrich Scheller","raw_affiliation_strings":["Faculty of of Computer Science, Electrical Engineering and Mathematics, University of Paderborn, Paderborn, Germany"],"affiliations":[{"raw_affiliation_string":"Faculty of of Computer Science, Electrical Engineering and Mathematics, University of Paderborn, Paderborn, Germany","institution_ids":["https://openalex.org/I206945453"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013130494","display_name":"Markus Koch","orcid":"https://orcid.org/0000-0003-3247-2988"},"institutions":[{"id":"https://openalex.org/I206945453","display_name":"Paderborn University","ror":"https://ror.org/058kzsd48","country_code":"DE","type":"education","lineage":["https://openalex.org/I206945453"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Markus Koch","raw_affiliation_strings":["Faculty of of Computer Science, Electrical Engineering and Mathematics, University of Paderborn, Paderborn, Germany"],"affiliations":[{"raw_affiliation_string":"Faculty of of Computer Science, Electrical Engineering and Mathematics, University of Paderborn, Paderborn, Germany","institution_ids":["https://openalex.org/I206945453"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026131063","display_name":"Bernd Kleinjohann","orcid":null},"institutions":[{"id":"https://openalex.org/I206945453","display_name":"Paderborn University","ror":"https://ror.org/058kzsd48","country_code":"DE","type":"education","lineage":["https://openalex.org/I206945453"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Bernd Kleinjohann","raw_affiliation_strings":["Faculty of of Computer Science, Electrical Engineering and Mathematics, University of Paderborn, Paderborn, Germany"],"affiliations":[{"raw_affiliation_string":"Faculty of of Computer Science, Electrical Engineering and Mathematics, University of Paderborn, Paderborn, Germany","institution_ids":["https://openalex.org/I206945453"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103284605","display_name":"Claudius Stern","orcid":"https://orcid.org/0000-0002-7187-8991"},"institutions":[{"id":"https://openalex.org/I206945453","display_name":"Paderborn University","ror":"https://ror.org/058kzsd48","country_code":"DE","type":"education","lineage":["https://openalex.org/I206945453"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Claudius Stern","raw_affiliation_strings":["Faculty of of Computer Science, Electrical Engineering and Mathematics, University of Paderborn, Paderborn, Germany"],"affiliations":[{"raw_affiliation_string":"Faculty of of Computer Science, Electrical Engineering and Mathematics, University of Paderborn, Paderborn, Germany","institution_ids":["https://openalex.org/I206945453"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5028877800"],"corresponding_institution_ids":["https://openalex.org/I206945453"],"apc_list":null,"apc_paid":null,"fwci":0.8724,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.81655467,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"2","issue":null,"first_page":"193","last_page":"198"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11431","display_name":"Action Observation and Synchronization","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interrupt","display_name":"Interrupt","score":0.86273193359375},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.8568310141563416},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.7854598760604858},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7404620051383972},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6724972128868103},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6531301736831665},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49069488048553467},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.4403395354747772},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.43575870990753174},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.143220454454422}],"concepts":[{"id":"https://openalex.org/C41661131","wikidata":"https://www.wikidata.org/wiki/Q220764","display_name":"Interrupt","level":3,"score":0.86273193359375},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.8568310141563416},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.7854598760604858},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7404620051383972},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6724972128868103},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6531301736831665},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49069488048553467},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.4403395354747772},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.43575870990753174},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.143220454454422},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C761482","wikidata":"https://www.wikidata.org/wiki/Q118093","display_name":"Transmission (telecommunications)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/adprl.2009.4927544","is_oa":false,"landing_page_url":"https://doi.org/10.1109/adprl.2009.4927544","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE Symposium on Adaptive Dynamic Programming and Reinforcement Learning","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1542537254","https://openalex.org/W1593741171","https://openalex.org/W1991133427","https://openalex.org/W1994193347","https://openalex.org/W2032603916","https://openalex.org/W2096169321","https://openalex.org/W2097883698","https://openalex.org/W2110178871","https://openalex.org/W2110304639","https://openalex.org/W2110631042","https://openalex.org/W2116165953","https://openalex.org/W2120387014","https://openalex.org/W2125113001","https://openalex.org/W2128103053","https://openalex.org/W2131220995","https://openalex.org/W2153264310","https://openalex.org/W2207662037","https://openalex.org/W2341171179","https://openalex.org/W3022532439","https://openalex.org/W4253694374","https://openalex.org/W6632300202","https://openalex.org/W6676388466","https://openalex.org/W6678045943"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2935909890","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W1531601525","https://openalex.org/W4288898221"],"abstract_inverted_index":{"Although":[0],"the":[1,28,41],"combination":[2],"of":[3,35,43],"reinforcement":[4],"learning":[5],"and":[6,23,27,82,100],"imitation":[7,29,51],"has":[8],"been":[9],"already":[10],"considered":[11],"in":[12,48,59,98],"recent":[13],"research,":[14],"it":[15],"always":[16],"revolved":[17],"around":[18],"fixed":[19,26],"settings":[20],"where":[21,50],"demonstrator":[22],"imitator":[24],"are":[25],"process":[30],"is":[31,38,40,52,65],"a":[32,60,63],"well-defined":[33],"period":[34],"time.":[36],"What":[37],"missing":[39],"investigation":[42],"approaches":[44],"that":[45,58,94],"also":[46],"work":[47],"scenarios":[49],"only":[53,80],"sporadically":[54],"possible.":[55],"This":[56],"means":[57],"multi-robot":[61],"scenario":[62],"robot":[64,71],"now":[66],"allowed":[67],"to":[68,74],"interrupt":[69],"another":[70],"by":[72],"asking":[73],"repeat":[75],"certain":[76],"actions,":[77],"but":[78],"can":[79,95],"observe":[81],"integrate":[83],"information":[84],"bits":[85],"delivered":[86],"occasionally.":[87],"In":[88],"this":[89],"paper":[90],"we":[91],"present":[92],"how":[93],"be":[96],"done":[97],"continuous":[99],"noisy":[101],"environment":[102],"within":[103],"an":[104],"SMDP":[105],"context.":[106]},"counts_by_year":[{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
