{"id":"https://openalex.org/W4312509396","doi":"https://doi.org/10.1109/iros47612.2022.9982205","title":"Learning High Speed Precision Table Tennis on a Physical Robot","display_name":"Learning High Speed Precision Table Tennis on a Physical Robot","publication_year":2022,"publication_date":"2022-10-23","ids":{"openalex":"https://openalex.org/W4312509396","doi":"https://doi.org/10.1109/iros47612.2022.9982205"},"language":"en","primary_location":{"id":"doi:10.1109/iros47612.2022.9982205","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9982205","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001795595","display_name":"Tianli Ding","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Tianli Ding","raw_affiliation_strings":["Robotics at Google, Google Research,Mountain View,United States","Robotics at Google, Google Research, Mountain View, United States"],"affiliations":[{"raw_affiliation_string":"Robotics at Google, Google Research,Mountain View,United States","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Robotics at Google, Google Research, Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002723909","display_name":"Laura Graesser","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Laura Graesser","raw_affiliation_strings":["Robotics at Google, Google Research,Mountain View,United States","Robotics at Google, Google Research, Mountain View, United States"],"affiliations":[{"raw_affiliation_string":"Robotics at Google, Google Research,Mountain View,United States","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Robotics at Google, Google Research, Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011850830","display_name":"Saminda Abeyruwan","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Saminda Abeyruwan","raw_affiliation_strings":["Robotics at Google, Google Research,Mountain View,United States","Robotics at Google, Google Research, Mountain View, United States"],"affiliations":[{"raw_affiliation_string":"Robotics at Google, Google Research,Mountain View,United States","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Robotics at Google, Google Research, Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078539163","display_name":"David B. D\u2019Ambrosio","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David B. D'Ambrosio","raw_affiliation_strings":["Robotics at Google, Google Research,Mountain View,United States","Robotics at Google, Google Research, Mountain View, United States"],"affiliations":[{"raw_affiliation_string":"Robotics at Google, Google Research,Mountain View,United States","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Robotics at Google, Google Research, Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039532136","display_name":"Anish Shankar","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anish Shankar","raw_affiliation_strings":["Robotics at Google, Google Research,Mountain View,United States","Robotics at Google, Google Research, Mountain View, United States"],"affiliations":[{"raw_affiliation_string":"Robotics at Google, Google Research,Mountain View,United States","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Robotics at Google, Google Research, Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066544075","display_name":"Pierre Sermanet","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pierre Sermanet","raw_affiliation_strings":["Robotics at Google, Google Research,Mountain View,United States","Robotics at Google, Google Research, Mountain View, United States"],"affiliations":[{"raw_affiliation_string":"Robotics at Google, Google Research,Mountain View,United States","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Robotics at Google, Google Research, Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064611781","display_name":"Pannag Sanketi","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pannag R. Sanketi","raw_affiliation_strings":["Robotics at Google, Google Research,Mountain View,United States","Robotics at Google, Google Research, Mountain View, United States"],"affiliations":[{"raw_affiliation_string":"Robotics at Google, Google Research,Mountain View,United States","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Robotics at Google, Google Research, Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021773088","display_name":"Corey Lynch","orcid":"https://orcid.org/0000-0002-2092-6690"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Corey Lynch","raw_affiliation_strings":["Robotics at Google, Google Research,Mountain View,United States","Robotics at Google, Google Research, Mountain View, United States"],"affiliations":[{"raw_affiliation_string":"Robotics at Google, Google Research,Mountain View,United States","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"Robotics at Google, Google Research, Mountain View, United States","institution_ids":["https://openalex.org/I1291425158"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5001795595"],"corresponding_institution_ids":["https://openalex.org/I1291425158"],"apc_list":null,"apc_paid":null,"fwci":1.6631,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.86236802,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"10780","last_page":"10787"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10982","display_name":"Motor Control and Adaptation","score":0.9514999985694885,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7348262667655945},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6415454149246216},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6334802508354187},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5751704573631287},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5571611523628235},{"id":"https://openalex.org/keywords/iterative-learning-control","display_name":"Iterative learning control","score":0.5386720895767212},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.45902591943740845},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.4424835741519928},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3286876678466797},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.2960612177848816}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7348262667655945},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6415454149246216},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6334802508354187},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5751704573631287},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5571611523628235},{"id":"https://openalex.org/C117619785","wikidata":"https://www.wikidata.org/wiki/Q6094414","display_name":"Iterative learning control","level":3,"score":0.5386720895767212},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45902591943740845},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.4424835741519928},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3286876678466797},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2960612177848816},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros47612.2022.9982205","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros47612.2022.9982205","pdf_url":null,"source":{"id":"https://openalex.org/S4363607704","display_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":75,"referenced_works":["https://openalex.org/W151866386","https://openalex.org/W1556151214","https://openalex.org/W1559566475","https://openalex.org/W2010849482","https://openalex.org/W2012204020","https://openalex.org/W2054707543","https://openalex.org/W2083071253","https://openalex.org/W2111978237","https://openalex.org/W2112963000","https://openalex.org/W2142300342","https://openalex.org/W2144576818","https://openalex.org/W2149479912","https://openalex.org/W2166160300","https://openalex.org/W2218183533","https://openalex.org/W2571450712","https://openalex.org/W2596367596","https://openalex.org/W2604382266","https://openalex.org/W2613462707","https://openalex.org/W2736601468","https://openalex.org/W2781726626","https://openalex.org/W2797121477","https://openalex.org/W2810785043","https://openalex.org/W2823112946","https://openalex.org/W2902551807","https://openalex.org/W2904246096","https://openalex.org/W2910474428","https://openalex.org/W2912622940","https://openalex.org/W2914987759","https://openalex.org/W2927128490","https://openalex.org/W2950422748","https://openalex.org/W2958416396","https://openalex.org/W2963669336","https://openalex.org/W2963864421","https://openalex.org/W2970377754","https://openalex.org/W2979211489","https://openalex.org/W2981030070","https://openalex.org/W3015415344","https://openalex.org/W3020712699","https://openalex.org/W3035700320","https://openalex.org/W3037785630","https://openalex.org/W3039737909","https://openalex.org/W3093784762","https://openalex.org/W3120327542","https://openalex.org/W3126321819","https://openalex.org/W3129853634","https://openalex.org/W3131531515","https://openalex.org/W3171176697","https://openalex.org/W3206394619","https://openalex.org/W3207061160","https://openalex.org/W4240186043","https://openalex.org/W4287824211","https://openalex.org/W4289236734","https://openalex.org/W4295113716","https://openalex.org/W4300799055","https://openalex.org/W6740801417","https://openalex.org/W6741002519","https://openalex.org/W6748929038","https://openalex.org/W6750322874","https://openalex.org/W6752736450","https://openalex.org/W6753060773","https://openalex.org/W6753243525","https://openalex.org/W6756687206","https://openalex.org/W6757592117","https://openalex.org/W6760439459","https://openalex.org/W6765008394","https://openalex.org/W6768617876","https://openalex.org/W6769596995","https://openalex.org/W6771179988","https://openalex.org/W6771666257","https://openalex.org/W6775276923","https://openalex.org/W6779282036","https://openalex.org/W6779463497","https://openalex.org/W6785034342","https://openalex.org/W6785555649","https://openalex.org/W6799150178"],"related_works":["https://openalex.org/W2761624296","https://openalex.org/W4386994694","https://openalex.org/W4388738109","https://openalex.org/W2362901947","https://openalex.org/W2362086884","https://openalex.org/W1606071314","https://openalex.org/W2350210972","https://openalex.org/W2369126164","https://openalex.org/W1482785882","https://openalex.org/W2376218423"],"abstract_inverted_index":{"Learning":[0],"goal":[1,97,109],"conditioned":[2],"control":[3,62,99],"in":[4,13,27,63,147,206],"the":[5,19,29,53,64,130,158,219,240,244,250,255,280,294],"real":[6,46,65,145,212],"world":[7,47,213],"is":[8,196],"a":[9,57,76,144,148,170,203,208,236,268,283,297],"challenging":[10],"open":[11],"problem":[12],"robotics.":[14],"Reinforcement":[15],"learning":[16,50,96,137],"systems":[17],"have":[18,85,114],"potential":[20],"to":[21,44,60,88,119,140,173,200,246],"learn":[22,61],"autonomously":[23],"via":[24,107],"trial-and-error,":[25],"but":[26,67],"practice":[28],"costs":[30],"of":[31,242,257,271,282,293],"manual":[32],"reward":[33,182],"design,":[34,183],"ensuring":[35],"safe":[36],"exploration,":[37],"and":[38,74,104],"hyperparameter":[39],"tuning":[40],"are":[41],"often":[42],"enough":[43,199],"preclude":[45],"deployment.":[48],"Imitation":[49],"approaches,":[51,112],"on":[52,143,160,202,224,249,264,296],"other":[54],"hand,":[55],"offer":[56],"simple":[58,122,134],"way":[59,172],"world,":[66],"typically":[68],"require":[69],"costly":[70],"cu-rated":[71],"demonstration":[72,102,273],"data":[73,274],"lack":[75],"mechanism":[77],"for":[78,291],"continuous":[79,175],"improvement.":[80],"Recently,":[81],"iterative":[82,135],"imitation":[83,136],"methods":[84],"been":[86,117],"shown":[87,118],"be":[89],"effective":[90],"at":[91,239],"relaxing":[92],"both":[93],"these":[94],"constraints,":[95],"directed":[98],"from":[100,235],"undirected":[101,260],"data,":[103],"improving":[105],"continuously":[106],"self-supervised":[108],"reaching.":[110],"These":[111],"however,":[113],"not":[115],"yet":[116],"scale":[120,139],"beyond":[121],"simulated":[123],"environments.":[124],"In":[125,211],"this":[126,161,167,194],"work,":[127],"we":[128,215,253],"present":[129],"first":[131],"evidence":[132],"that":[133,166,193,217,218,267],"can":[138,222],"goal-directed":[141],"behavior":[142],"robot":[146,205],"dynamic":[149],"setting:":[150],"high":[151],"speed,":[152],"precision":[153],"table":[154],"tennis":[155],"(e.g.":[156],"\u201cland":[157],"ball":[159,245],"particular":[162],"target\u201d).":[163],"We":[164,190],"find":[165,192,216],"approach":[168,195],"offers":[169],"straightforward":[171],"do":[174],"on-robot":[176],"learning,":[177,186],"without":[178],"complexities":[179],"such":[180],"as":[181],"value":[184],"function":[185],"or":[187,226],"sim-to-real":[188],"transfer.":[189],"also":[191],"scalable-sample":[197],"efficient":[198],"train":[201],"physical":[204,298],"just":[207],"few":[209],"hours.":[210],"evaluations,":[214],"resulting":[220],"policy":[221,295],"perform":[223],"par":[225],"better":[227],"than":[228],"amateur":[229],"humans":[230],"(with":[231],"players":[232],"sampled":[233],"randomly":[234],"robotics":[237],"lab)":[238],"task":[241],"returning":[243],"specific":[247],"targets":[248],"table.":[251],"Finally,":[252],"analyze":[254],"effect":[256],"an":[258],"initial":[259],"bootstrap":[261],"dataset":[262],"size":[263],"performance,":[265],"finding":[266],"modest":[269],"amount":[270],"unstructured":[272],"provided":[275],"up-front":[276],"drastically":[277],"speeds":[278],"up":[279],"convergence":[281],"general":[284],"purpose":[285],"goal-reaching":[286],"policy.":[287],"See":[288],"supplementary":[289],"video":[290],"examples":[292],"robot.":[299]},"counts_by_year":[{"year":2025,"cited_by_count":10},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
