{"id":"https://openalex.org/W7154483605","doi":"https://doi.org/10.48550/arxiv.2604.13015","title":"Learning Versatile Humanoid Manipulation with Touch Dreaming","display_name":"Learning Versatile Humanoid Manipulation with Touch Dreaming","publication_year":2026,"publication_date":"2026-04-14","ids":{"openalex":"https://openalex.org/W7154483605","doi":"https://doi.org/10.48550/arxiv.2604.13015"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.13015","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.13015","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.13015","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133644284","display_name":"Yaru Niu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Niu, Yaru","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130224054","display_name":"Zhenlong Fang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fang, Zhenlong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133676061","display_name":"Binghong Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Binghong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123909462","display_name":"Shuai Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Shuai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133722918","display_name":"Revanth Senthilkumaran","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Senthilkumaran, Revanth Krishna","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100396916","display_name":"Hao Zhang","orcid":"https://orcid.org/0000-0003-4276-5477"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133707111","display_name":"Bingqing Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Bingqing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100729546","display_name":"Chen Qiu","orcid":"https://orcid.org/0000-0002-1668-8773"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qiu, Chen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128215626","display_name":"H. Eric Tseng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tseng, H. Eric","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133726952","display_name":"Jonathan Francis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Francis, Jonathan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133715232","display_name":"Ding Zhao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Ding","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5133644284"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.2872999906539917,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.2872999906539917,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10784","display_name":"Muscle activation and electromyography studies","score":0.10750000178813934,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.06750000268220901,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/humanoid-robot","display_name":"Humanoid robot","score":0.8784999847412109},{"id":"https://openalex.org/keywords/teleoperation","display_name":"Teleoperation","score":0.5595999956130981},{"id":"https://openalex.org/keywords/torso","display_name":"Torso","score":0.49869999289512634},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.42489999532699585},{"id":"https://openalex.org/keywords/kinesthetic-learning","display_name":"Kinesthetic learning","score":0.38839998841285706},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.3774000108242035},{"id":"https://openalex.org/keywords/active-perception","display_name":"Active perception","score":0.3515999913215637}],"concepts":[{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.8784999847412109},{"id":"https://openalex.org/C161759796","wikidata":"https://www.wikidata.org/wiki/Q3982902","display_name":"Teleoperation","level":3,"score":0.5595999956130981},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5356000065803528},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5224999785423279},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5151000022888184},{"id":"https://openalex.org/C523889960","wikidata":"https://www.wikidata.org/wiki/Q160695","display_name":"Torso","level":2,"score":0.49869999289512634},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.42489999532699585},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.41819998621940613},{"id":"https://openalex.org/C55457006","wikidata":"https://www.wikidata.org/wiki/Q3647098","display_name":"Kinesthetic learning","level":2,"score":0.38839998841285706},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.3774000108242035},{"id":"https://openalex.org/C2776010242","wikidata":"https://www.wikidata.org/wiki/Q4677575","display_name":"Active perception","level":3,"score":0.3515999913215637},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3370000123977661},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.33250001072883606},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.31279999017715454},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.3034999966621399},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2818000018596649},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.26089999079704285},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.2605000138282776},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.25870001316070557}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.13015","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.13015","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.13015","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.13015","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Humanoid":[0,79],"robots":[1],"promise":[2],"general-purpose":[3],"assistance,":[4],"yet":[5],"real-world":[6,162],"humanoid":[7,32,62,213],"loco-manipulation":[8],"remains":[9],"challenging":[10],"because":[11],"it":[12],"requires":[13],"whole-body":[14,48,61],"stability,":[15],"end-effector":[16],"dexterity,":[17],"and":[18,70,99,127,221],"contact-aware":[19,155],"interaction":[20],"under":[21],"frequent":[22],"contact":[23],"changes.":[24],"In":[25],"this":[26,55],"work,":[27],"we":[28,57],"study":[29],"dexterous,":[30],"contact-rich":[31,74,163],"loco-manipulation.":[33],"We":[34,76],"first":[35],"develop":[36,58],"an":[37,136],"RL-based":[38],"lower-body":[39],"controller":[40],"that":[41,66,89,183,205],"serves":[42],"as":[43,92],"the":[44,121,151,176,216],"stability":[45],"backbone":[46],"for":[47,73,157],"execution":[49],"during":[50],"complex":[51],"manipulation.":[52,75,159],"Built":[53],"on":[54],"controller,":[56],"a":[59,85,93,105,144,167,195],"VR-based":[60],"data":[63],"collection":[64],"system":[65,209],"integrates":[67],"dexterous":[68,158],"hands":[69],"tactile":[71,129,146,185,192],"sensing":[72],"then":[77],"propose":[78],"Transformer":[80,88],"with":[81,108,131],"Touch":[82],"Dreaming":[83],"(HTD),":[84],"multimodal":[86],"encoder--decoder":[87],"models":[90],"touch":[91,113],"core":[94],"modality":[95],"alongside":[96],"multi-view":[97],"vision":[98],"proprioception.":[100],"HTD":[101,165],"is":[102,187],"trained":[103],"in":[104,115,171,199,215],"single":[106],"stage":[107],"behavioral":[109],"cloning":[110],"augmented":[111],"by":[112,135],"dreaming:":[114],"addition":[116],"to":[117,153],"predicting":[118],"action":[119],"chunks,":[120],"policy":[122,152],"predicts":[123],"future":[124,128],"hand-joint":[125],"forces":[126],"latents,":[130],"tactile-latent":[132],"targets":[133],"provided":[134],"exponential":[137],"moving":[138],"average":[139,172],"target":[140],"encoder":[141],"without":[142],"requiring":[143],"separate":[145],"pretraining":[147],"stage.":[148],"This":[149],"encourages":[150],"learn":[154],"representations":[156],"Across":[160],"five":[161],"tasks,":[164],"achieves":[166],"90.9%":[168],"relative":[169,197],"improvement":[170],"success":[173,200],"rate":[174],"over":[175],"stronger":[177],"baseline.":[178],"Ablation":[179],"results":[180,203],"further":[181],"show":[182],"latent-space":[184],"prediction":[186],"more":[188],"effective":[189],"than":[190],"raw":[191],"prediction,":[193],"yielding":[194],"30%":[196],"gain":[198],"rate.":[201],"These":[202],"demonstrate":[204],"our":[206],"touch-dreaming-enhanced":[207],"learning":[208],"enables":[210],"versatile,":[211],"high-dexterity":[212],"manipulation":[214],"real":[217],"world.":[218],"More":[219],"information":[220],"open-source":[222],"materials":[223],"are":[224],"available":[225],"at:":[226],"humanoid-touch-dream.github.io.":[227]},"counts_by_year":[],"updated_date":"2026-04-29T06:10:49.150238","created_date":"2026-04-16T00:00:00"}
