{"id":"https://openalex.org/W4415482504","doi":"https://doi.org/10.1109/access.2025.3624723","title":"Learning by Watching: A Review of Video-Based Learning Approaches for Robot Manipulation","display_name":"Learning by Watching: A Review of Video-Based Learning Approaches for Robot Manipulation","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4415482504","doi":"https://doi.org/10.1109/access.2025.3624723"},"language":"en","primary_location":{"id":"doi:10.1109/access.2025.3624723","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3624723","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2025.3624723","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018559398","display_name":"Chrisantus Eze","orcid":"https://orcid.org/0000-0001-5440-4316"},"institutions":[{"id":"https://openalex.org/I115475287","display_name":"Oklahoma State University","ror":"https://ror.org/01g9vbr38","country_code":"US","type":"education","lineage":["https://openalex.org/I115475287"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Chrisantus Eze","raw_affiliation_strings":["Computer Science Department, Oklahoma State University, Stillwater, OK, USA","Computer Science Department, Oklahoma State University, Stillwater, Oklahoma, USA"],"raw_orcid":"https://orcid.org/0000-0001-5440-4316","affiliations":[{"raw_affiliation_string":"Computer Science Department, Oklahoma State University, Stillwater, OK, USA","institution_ids":["https://openalex.org/I115475287"]},{"raw_affiliation_string":"Computer Science Department, Oklahoma State University, Stillwater, Oklahoma, USA","institution_ids":["https://openalex.org/I115475287"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014357711","display_name":"Christopher Crick","orcid":"https://orcid.org/0000-0002-1635-823X"},"institutions":[{"id":"https://openalex.org/I115475287","display_name":"Oklahoma State University","ror":"https://ror.org/01g9vbr38","country_code":"US","type":"education","lineage":["https://openalex.org/I115475287"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christopher Crick","raw_affiliation_strings":["Computer Science Department, Oklahoma State University, Stillwater, OK, USA","Computer Science Department, Oklahoma State University, Stillwater, Oklahoma, USA"],"raw_orcid":"https://orcid.org/0000-0002-1635-823X","affiliations":[{"raw_affiliation_string":"Computer Science Department, Oklahoma State University, Stillwater, OK, USA","institution_ids":["https://openalex.org/I115475287"]},{"raw_affiliation_string":"Computer Science Department, Oklahoma State University, Stillwater, Oklahoma, USA","institution_ids":["https://openalex.org/I115475287"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5018559398"],"corresponding_institution_ids":["https://openalex.org/I115475287"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":2.1091,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.89181179,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":"13","issue":null,"first_page":"184071","last_page":"184109"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9017999768257141,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9017999768257141,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/affordance","display_name":"Affordance","score":0.571399986743927},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5562000274658203},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.505299985408783},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.4066999852657318},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.3905999958515167},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.385699987411499},{"id":"https://openalex.org/keywords/active-learning","display_name":"Active learning (machine learning)","score":0.3797999918460846},{"id":"https://openalex.org/keywords/generalizability-theory","display_name":"Generalizability theory","score":0.37869998812675476},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.36410000920295715}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.788100004196167},{"id":"https://openalex.org/C194995250","wikidata":"https://www.wikidata.org/wiki/Q531136","display_name":"Affordance","level":2,"score":0.571399986743927},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5573999881744385},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5562000274658203},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5544999837875366},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.505299985408783},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.4066999852657318},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.3905999958515167},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.385699987411499},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.3797999918460846},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.37869998812675476},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.36410000920295715},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.36000001430511475},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.359499990940094},{"id":"https://openalex.org/C2779542340","wikidata":"https://www.wikidata.org/wiki/Q1062461","display_name":"Learning object","level":2,"score":0.35569998621940613},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.3476000130176544},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.33340001106262207},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33160001039505005},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.32850000262260437},{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.3273000121116638},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.3138999938964844},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.31060001254081726},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.31040000915527344},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2953000068664551},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.2766000032424927},{"id":"https://openalex.org/C162947575","wikidata":"https://www.wikidata.org/wiki/Q2005645","display_name":"Social robot","level":5,"score":0.2597000002861023},{"id":"https://openalex.org/C2779038628","wikidata":"https://www.wikidata.org/wiki/Q7248497","display_name":"Programming by demonstration","level":3,"score":0.25459998846054077},{"id":"https://openalex.org/C16443162","wikidata":"https://www.wikidata.org/wiki/Q1068473","display_name":"Educational technology","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2025.3624723","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3624723","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:01ef0cfd6b0743f4a90ecafa21c25080","is_oa":true,"landing_page_url":"https://doaj.org/article/01ef0cfd6b0743f4a90ecafa21c25080","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 184071-184109 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2025.3624723","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2025.3624723","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Robot":[0],"learning":[1,48,62,80,108,128],"of":[2,10,154],"manipulation":[3,49,100],"skills":[4,50,101],"is":[5],"hindered":[6],"by":[7],"the":[8,152],"scarcity":[9],"diverse,":[11],"unbiased":[12],"datasets.":[13],"While":[14],"curated":[15],"datasets":[16,30],"can":[17,115],"help,":[18],"challenges":[19,143],"remain":[20],"in":[21,34,147],"generalizability":[22],"and":[23,88,118,138,140,144,160],"real-world":[24],"transfer.":[25],"Meanwhile,":[26],"large-scale":[27,89,112],"\u2019in-the-wild\u2019":[28],"video":[29,77,104],"have":[31,46],"driven":[32],"progress":[33],"computer":[35,155],"vision":[36],"using":[37,51],"self-supervised":[38],"techniques.":[39],"Translating":[40],"this":[41,148],"to":[42],"robotics,":[43],"recent":[44],"works":[45],"explored":[47],"abundant":[52],"passive":[53],"videos":[54,114],"sourced":[55],"online.":[56],"Showing":[57],"promising":[58],"results,":[59],"such":[60,75],"video-based":[61,127],"paradigms":[63],"provide":[64],"scalable":[65],"supervision":[66],"while":[67],"reducing":[68],"dataset":[69],"bias.":[70],"This":[71],"survey":[72,125,136],"reviews":[73],"foundations":[74],"as":[76,92,94],"feature":[78],"representation":[79],"techniques,":[81],"object":[82],"affordance":[83],"understanding,":[84],"3D":[85],"hand/body":[86],"modeling,":[87],"robot":[90,99,161],"resources,":[91],"well":[93],"emerging":[95],"techniques":[96],"for":[97,121],"acquiring":[98],"from":[102,109],"uncontrolled":[103],"demonstrations.We":[105],"discuss":[106],"how":[107],"only":[110],"observing":[111],"human":[113],"enhance":[116],"generalization":[117],"sample":[119],"efficiency":[120],"robotic":[122],"manipulation.":[123],"The":[124],"summarizes":[126],"approaches,":[129],"analyzes":[130],"their":[131],"benefits":[132],"over":[133],"standard":[134],"datasets,":[135],"metrics,":[137],"benchmarks,":[139],"discusses":[141],"open":[142],"future":[145],"directions":[146],"nascent":[149],"domain":[150],"at":[151],"intersection":[153],"vision,":[156],"natural":[157],"language":[158],"processing,":[159],"learning.":[162]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-24T00:00:00"}
