{"id":"https://openalex.org/W7138092452","doi":"https://doi.org/10.1609/aaai.v40i13.38086","title":"Human2Robot: Learning Robot Actions from Paired Human-Robot Videos","display_name":"Human2Robot: Learning Robot Actions from Paired Human-Robot Videos","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138092452","doi":"https://doi.org/10.1609/aaai.v40i13.38086"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i13.38086","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i13.38086","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38086/42048","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38086/42048","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007869275","display_name":"Sicheng Xie","orcid":"https://orcid.org/0000-0001-9806-3920"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Sicheng Xie","raw_affiliation_strings":["Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University\nShanghai Innovation Institute"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University\nShanghai Innovation Institute","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101961477","display_name":"Han Cao","orcid":"https://orcid.org/0000-0003-3985-0267"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haidong Cao","raw_affiliation_strings":["Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075142476","display_name":"Zejia Weng","orcid":"https://orcid.org/0000-0001-9706-6484"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zejia Weng","raw_affiliation_strings":["Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129664063","display_name":"Zhen Xing","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhen Xing","raw_affiliation_strings":["Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129689894","display_name":"Haoran Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoran Chen","raw_affiliation_strings":["Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015972325","display_name":"Shiwei Shen","orcid":"https://orcid.org/0009-0009-7463-5782"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiwei Shen","raw_affiliation_strings":["Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033054582","display_name":"Jiaqi Leng","orcid":"https://orcid.org/0000-0003-4600-1263"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaqi Leng","raw_affiliation_strings":["Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129713328","display_name":"Zuxuan Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zuxuan Wu","raw_affiliation_strings":["Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University\nShanghai Innovation Institute"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University\nShanghai Innovation Institute","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129669423","display_name":"Yu-Gang Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu-Gang Jiang","raw_affiliation_strings":["Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University"],"affiliations":[{"raw_affiliation_string":"Shanghai Key Lab of Intell. Info. Processing, School of CS, Fudan University","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5007869275"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.39701493,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"13","first_page":"11078","last_page":"11086"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.4020000100135803,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.4020000100135803,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.17649999260902405,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.11309999972581863,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6718000173568726},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6424000263214111},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5945000052452087},{"id":"https://openalex.org/keywords/teleoperation","display_name":"Teleoperation","score":0.5302000045776367},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5012999773025513},{"id":"https://openalex.org/keywords/human\u2013robot-interaction","display_name":"Human\u2013robot interaction","score":0.47600001096725464},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.4756999909877777},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4214000105857849},{"id":"https://openalex.org/keywords/icub","display_name":"iCub","score":0.36880001425743103}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.746399998664856},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6942999958992004},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6718000173568726},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6424000263214111},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5945000052452087},{"id":"https://openalex.org/C161759796","wikidata":"https://www.wikidata.org/wiki/Q3982902","display_name":"Teleoperation","level":3,"score":0.5302000045776367},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5012999773025513},{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.47600001096725464},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.4756999909877777},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.454800009727478},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4214000105857849},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.38609999418258667},{"id":"https://openalex.org/C111151474","wikidata":"https://www.wikidata.org/wiki/Q1653368","display_name":"iCub","level":4,"score":0.36880001425743103},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.3675999939441681},{"id":"https://openalex.org/C2779038628","wikidata":"https://www.wikidata.org/wiki/Q7248497","display_name":"Programming by demonstration","level":3,"score":0.3529999852180481},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.34540000557899475},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.3375000059604645},{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.33379998803138733},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.3025999963283539},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.2937000095844269},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.2892000079154968},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.28859999775886536},{"id":"https://openalex.org/C162947575","wikidata":"https://www.wikidata.org/wiki/Q2005645","display_name":"Social robot","level":5,"score":0.28200000524520874},{"id":"https://openalex.org/C74222875","wikidata":"https://www.wikidata.org/wiki/Q16000312","display_name":"Robot kinematics","level":4,"score":0.2685000002384186},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C2776544517","wikidata":"https://www.wikidata.org/wiki/Q189447","display_name":"Unexpected events","level":2,"score":0.2644999921321869},{"id":"https://openalex.org/C150415221","wikidata":"https://www.wikidata.org/wiki/Q40687","display_name":"Robotic arm","level":2,"score":0.25699999928474426}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i13.38086","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i13.38086","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38086/42048","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i13.38086","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i13.38086","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38086/42048","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth","score":0.4213047921657562}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7138092452.pdf","grobid_xml":"https://content.openalex.org/works/W7138092452.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Distilling":[0],"knowledge":[1],"from":[2,59,149],"human":[3,108,150],"demonstrations":[4],"is":[5],"a":[6,34,60,77,86,98,114,122,131,137,156],"promising":[7],"way":[8],"for":[9,45],"robots":[10],"to":[11,27,38,50,125,135,181],"learn":[12,136],"and":[13,48,66,109,139,186],"act.":[14],"Existing":[15],"methods,":[16],"which":[17,152],"often":[18],"rely":[19],"on":[20,172],"coarsely-aligned":[21],"video":[22,88],"pairs,":[23],"are":[24],"typically":[25],"constrained":[26],"learning":[28],"global":[29],"or":[30],"task-level":[31],"features.":[32],"As":[33],"result,":[35],"they":[36,69],"tend":[37],"neglect":[39],"the":[40,67],"fine-grained":[41,82],"frame-level":[42],"dynamics":[43,144],"required":[44],"complex":[46],"manipulation":[47],"generalization":[49,180],"novel":[51,99,182],"tasks.":[52],"We":[53,118],"posit":[54],"that":[55,80,164],"this":[56,73,92,127,165],"limitation":[57],"stems":[58],"vicious":[61],"circle":[62],"of":[63,105,142],"inadequate":[64],"datasets":[65],"methods":[68],"inspire.":[70],"To":[71,91],"break":[72],"cycle,":[74],"we":[75,94],"propose":[76],"paradigm":[78],"shift":[79],"treats":[81],"human-robot":[83],"alignment":[84],"as":[85],"conditional":[87],"generation":[89],"problem.":[90],"end,":[93],"first":[95],"introduce":[96],"H&amp;R,":[97],"third-person":[100],"dataset":[101],"containing":[102],"2,600":[103],"episodes":[104],"precisely":[106],"synchronized":[107],"robot":[110,143,147],"motions,":[111],"collected":[112],"using":[113],"VR":[115],"teleoperation":[116],"system.":[117],"then":[119],"present":[120],"Human2Robot,":[121],"framework":[123],"designed":[124],"leverage":[126],"data.":[128],"Human2Robot":[129],"employs":[130],"Video":[132],"Prediction":[133],"Model":[134],"rich":[138],"implicit":[140],"representation":[141],"by":[145],"generating":[146],"videos":[148],"input,":[151],"in":[153],"turn":[154],"guides":[155],"decoupled":[157],"action":[158],"decoder.":[159],"Our":[160],"real-world":[161],"experiments":[162],"demonstrate":[163],"approach":[166],"not":[167],"only":[168],"achieves":[169],"high":[170],"performance":[171],"seen":[173],"tasks":[174],"but":[175],"also":[176],"exhibits":[177],"significant":[178],"one-shot":[179],"positions,":[183],"objects,":[184],"instances,":[185],"even":[187],"new":[188],"task":[189],"categories.":[190]},"counts_by_year":[],"updated_date":"2026-03-20T20:47:17.329874","created_date":"2026-03-18T00:00:00"}
