{"id":"https://openalex.org/W4391142622","doi":"https://doi.org/10.1177/02783649241227559","title":"Learning dexterity from human hand motion in internet videos","display_name":"Learning dexterity from human hand motion in internet videos","publication_year":2024,"publication_date":"2024-01-22","ids":{"openalex":"https://openalex.org/W4391142622","doi":"https://doi.org/10.1177/02783649241227559"},"language":"en","primary_location":{"id":"doi:10.1177/02783649241227559","is_oa":false,"landing_page_url":"https://doi.org/10.1177/02783649241227559","pdf_url":null,"source":{"id":"https://openalex.org/S73484101","display_name":"The International Journal of Robotics Research","issn_l":"0278-3649","issn":["0278-3649","1741-3176"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of Robotics Research","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074662871","display_name":"Kenneth Shaw","orcid":"https://orcid.org/0009-0002-8571-2922"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Kenneth Shaw","raw_affiliation_strings":["Carnegie Mellon University, Pittsburgh, PA, USA"],"raw_orcid":"https://orcid.org/0009-0002-8571-2922","affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090307838","display_name":"Shikhar Bahl","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shikhar Bahl","raw_affiliation_strings":["Carnegie Mellon University, Pittsburgh, PA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022753223","display_name":"Aravind Sivakumar","orcid":"https://orcid.org/0000-0002-1477-677X"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aravind Sivakumar","raw_affiliation_strings":["Carnegie Mellon University, Pittsburgh, PA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048724992","display_name":"Aditya Kannan","orcid":"https://orcid.org/0000-0002-3104-7560"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aditya Kannan","raw_affiliation_strings":["Carnegie Mellon University, Pittsburgh, PA, USA"],"raw_orcid":"https://orcid.org/0000-0002-3104-7560","affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101851026","display_name":"Deepak Pathak","orcid":"https://orcid.org/0000-0003-2496-0690"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Deepak Pathak","raw_affiliation_strings":["Carnegie Mellon University, Pittsburgh, PA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5074662871","https://openalex.org/A5101851026"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":2.6701,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.90745097,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"43","issue":"4","first_page":"513","last_page":"532"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5702539682388306},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5541384816169739},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5416321158409119},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.49424269795417786},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.47510895133018494},{"id":"https://openalex.org/keywords/human-motion","display_name":"Human motion","score":0.4324694573879242},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.42610472440719604},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.1740441918373108}],"concepts":[{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5702539682388306},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5541384816169739},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5416321158409119},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.49424269795417786},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.47510895133018494},{"id":"https://openalex.org/C2986578859","wikidata":"https://www.wikidata.org/wiki/Q657632","display_name":"Human motion","level":3,"score":0.4324694573879242},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.42610472440719604},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.1740441918373108}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1177/02783649241227559","is_oa":false,"landing_page_url":"https://doi.org/10.1177/02783649241227559","pdf_url":null,"source":{"id":"https://openalex.org/S73484101","display_name":"The International Journal of Robotics Research","issn_l":"0278-3649","issn":["0278-3649","1741-3176"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The International Journal of Robotics Research","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":69,"referenced_works":["https://openalex.org/W1686810756","https://openalex.org/W1927052826","https://openalex.org/W1967554269","https://openalex.org/W1994530392","https://openalex.org/W1995820507","https://openalex.org/W2003329174","https://openalex.org/W2037841262","https://openalex.org/W2085261163","https://openalex.org/W2101032778","https://openalex.org/W2108598243","https://openalex.org/W2128019145","https://openalex.org/W2155007355","https://openalex.org/W2158782408","https://openalex.org/W2194775991","https://openalex.org/W2213758982","https://openalex.org/W2342840547","https://openalex.org/W2519683295","https://openalex.org/W2558807622","https://openalex.org/W2597261100","https://openalex.org/W2768683308","https://openalex.org/W2769112066","https://openalex.org/W2810785043","https://openalex.org/W2894714230","https://openalex.org/W2896457183","https://openalex.org/W2948426124","https://openalex.org/W2962730651","https://openalex.org/W2963150697","https://openalex.org/W2963202339","https://openalex.org/W2963826370","https://openalex.org/W2963995996","https://openalex.org/W2967695057","https://openalex.org/W2973857456","https://openalex.org/W2978956737","https://openalex.org/W2997581345","https://openalex.org/W3023742835","https://openalex.org/W3034891989","https://openalex.org/W3038298277","https://openalex.org/W3039737909","https://openalex.org/W3043971245","https://openalex.org/W3048833305","https://openalex.org/W3091133300","https://openalex.org/W3108529044","https://openalex.org/W3175995235","https://openalex.org/W3176935502","https://openalex.org/W3180172155","https://openalex.org/W3205786327","https://openalex.org/W3207832698","https://openalex.org/W3213974477","https://openalex.org/W3214952050","https://openalex.org/W3215052027","https://openalex.org/W4212774754","https://openalex.org/W4221145926","https://openalex.org/W4221159977","https://openalex.org/W4226167593","https://openalex.org/W4283786747","https://openalex.org/W4283788863","https://openalex.org/W4287599290","https://openalex.org/W4288020136","https://openalex.org/W4292779060","https://openalex.org/W4303940393","https://openalex.org/W4312424618","https://openalex.org/W4313156423","https://openalex.org/W4321147108","https://openalex.org/W4321153853","https://openalex.org/W4323640751","https://openalex.org/W4385430451","https://openalex.org/W4386065350","https://openalex.org/W4388110459","https://openalex.org/W4390481062"],"related_works":["https://openalex.org/W2804584315","https://openalex.org/W2035558540","https://openalex.org/W2332110715","https://openalex.org/W2167757589","https://openalex.org/W2988011613","https://openalex.org/W2806036343","https://openalex.org/W142482926","https://openalex.org/W2121113403","https://openalex.org/W1550399236","https://openalex.org/W2079653927"],"abstract_inverted_index":{"To":[0,57],"build":[1,119],"general":[2],"robotic":[3],"agents":[4],"that":[5,65,122,225],"can":[6],"operate":[7],"in":[8,20,114,156],"many":[9,239],"environments,":[10],"it":[11],"is":[12,28,88,95],"often":[13,29],"useful":[14],"for":[15,218],"robots":[16],"to":[17,33,96,104,111,126,162,186,213,238],"collect":[18,163],"experience":[19,26,165],"the":[21,43,80,144,160,205],"real":[22,48],"world.":[23],"However,":[24],"unguided":[25],"collection":[27],"not":[30],"feasible":[31],"due":[32],"safety,":[34],"time,":[35],"and":[36,77,83,131,152,207],"hardware":[37],"restrictions.":[38],"We":[39,107,223],"thus":[40],"propose":[41],"leveraging":[42,227],"next":[44],"best":[45],"thing":[46],"as":[47,188],"world":[49],"experience:":[50],"videos":[51],"of":[52,74],"humans":[53],"using":[54,167],"their":[55,138,154],"hands.":[56],"utilize":[58],"these":[59,170,243],"videos,":[60],"we":[61,118,176,232],"develop":[62],"a":[63,89,120,128,148,219],"method":[64,110],"retargets":[66],"any":[67,124],"1st":[68],"person":[69,72],"or":[70],"3rd":[71],"video":[73,103,181],"human":[75,101,125,145,179,199,216,229],"hands":[76],"arms":[78],"into":[79,182],"robot":[81,129,142,161,190,221,235],"hand":[82,102,130,200,230],"arm":[84],"trajectories.":[85],"While":[86],"retargeting":[87],"difficult":[90],"problem,":[91],"our":[92],"key":[93],"insight":[94],"rely":[97],"on":[98],"only":[99],"internet":[100,180,228],"train":[105],"it.":[106],"use":[108,187],"this":[109],"present":[112],"results":[113,171,244],"two":[115],"areas:":[116],"First,":[117],"system":[121],"enables":[123,159],"control":[127],"arm,":[132],"simply":[133],"by":[134,226],"demonstrating":[135],"motions":[136],"with":[137],"own":[139],"hand.":[140],"The":[141],"observes":[143],"operator":[146],"via":[147],"single":[149],"RGB":[150],"camera":[151],"imitates":[153],"actions":[155],"real-time.":[157],"This":[158,192],"real-world":[164],"safely":[166],"supervision.":[168],"See":[169,242],"at":[172,245],"https://robotic-telekinesis.github.io":[173],".":[174],"Second,":[175],"retarget":[177],"in-the-wild":[178],"task-conditioned":[183],"pseudo-robot":[184],"trajectories":[185],"artificial":[189],"experience.":[191],"learning":[193],"algorithm":[194],"leverages":[195],"action":[196],"priors":[197,209],"from":[198,204,210],"actions,":[201],"visual":[202],"features":[203],"images,":[206],"physical":[208],"dynamical":[211],"systems":[212],"pretrain":[214],"typical":[215],"behavior":[217],"particular":[220],"task.":[222],"show":[224],"experience,":[231],"need":[233],"fewer":[234],"demonstrations":[236],"compared":[237],"other":[240],"methods.":[241],"https://video-dex.github.io":[246]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":7}],"updated_date":"2026-05-29T09:21:14.243279","created_date":"2025-10-10T00:00:00"}
