{"id":"https://openalex.org/W7157118346","doi":"https://doi.org/10.48550/arxiv.2604.23609","title":"Tube Diffusion Policy: Reactive Visual-Tactile Policy Learning for Contact-rich Manipulation","display_name":"Tube Diffusion Policy: Reactive Visual-Tactile Policy Learning for Contact-rich Manipulation","publication_year":2026,"publication_date":"2026-04-26","ids":{"openalex":"https://openalex.org/W7157118346","doi":"https://doi.org/10.48550/arxiv.2604.23609"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.23609","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.23609","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.23609","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134813882","display_name":"Teng Xue","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xue, Teng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032432096","display_name":"Alberto Rigo","orcid":"https://orcid.org/0000-0002-0428-2290"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rigo, Alberto","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033629550","display_name":"Bingjian Huang","orcid":"https://orcid.org/0000-0002-9347-674X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Bingjian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100568352","display_name":"Jiayi Shen","orcid":"https://orcid.org/0000-0001-5604-7973"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shen, Jiayi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100583938","display_name":"Zhengtong Xu","orcid":"https://orcid.org/0000-0002-2789-1910"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Zhengtong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071166006","display_name":"Nick Colonnese","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Colonnese, Nick","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5055316477","display_name":"Amirhossein H. Memar","orcid":"https://orcid.org/0000-0002-6152-2406"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Memar, Amirhossein H.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.4327000081539154,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.4327000081539154,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10914","display_name":"Tactile and Sensory Interactions","score":0.2054000049829483,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10982","display_name":"Motor Control and Adaptation","score":0.05590000003576279,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.6518999934196472},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5824999809265137},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5134000182151794},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.4251999855041504},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.4156999886035919},{"id":"https://openalex.org/keywords/adaptive-learning","display_name":"Adaptive learning","score":0.39100000262260437},{"id":"https://openalex.org/keywords/adaptive-control","display_name":"Adaptive control","score":0.3634999990463257},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.3544999957084656}],"concepts":[{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.6518999934196472},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6065000295639038},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5824999809265137},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5134000182151794},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47110000252723694},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4251999855041504},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4156999886035919},{"id":"https://openalex.org/C125014702","wikidata":"https://www.wikidata.org/wiki/Q4680749","display_name":"Adaptive learning","level":2,"score":0.39100000262260437},{"id":"https://openalex.org/C107464732","wikidata":"https://www.wikidata.org/wiki/Q235781","display_name":"Adaptive control","level":3,"score":0.3634999990463257},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3544999957084656},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.3199999928474426},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3149999976158142},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.3149999976158142},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.304500013589859},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.29739999771118164},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.2851000130176544},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2720000147819519},{"id":"https://openalex.org/C108755667","wikidata":"https://www.wikidata.org/wiki/Q1930258","display_name":"AC power","level":3,"score":0.2703999876976013},{"id":"https://openalex.org/C2781002164","wikidata":"https://www.wikidata.org/wiki/Q6822311","display_name":"Meta learning (computer science)","level":3,"score":0.2615000009536743},{"id":"https://openalex.org/C34585555","wikidata":"https://www.wikidata.org/wiki/Q1368723","display_name":"Learning curve","level":2,"score":0.2587999999523163},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2587999999523163},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.25529998540878296},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.2506999969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.23609","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.23609","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.23609","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.23609","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.616789698600769}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Contact-rich":[0],"manipulation":[1,36,147],"is":[2],"central":[3],"to":[4,12,50,52],"many":[5],"everyday":[6],"human":[7],"activities,":[8],"requiring":[9],"continuous":[10],"adaptation":[11],"contact":[13,168],"uncertainty":[14,67,169],"and":[15,23,68,127,141,170],"external":[16,171],"disturbances":[17],"through":[18],"multi-modal":[19],"perception,":[20],"particularly":[21],"vision":[22],"tactile":[24,70],"feedback.":[25],"While":[26],"imitation":[27,96,156],"learning":[28,34,91,97,157],"has":[29],"shown":[30],"strong":[31],"potential":[32],"for":[33,192],"complex":[35],"behaviors,":[37],"most":[38],"existing":[39],"approaches":[40],"rely":[41],"on":[42,135],"action":[43,118,122,180],"chunking,":[44],"which":[45],"fundamentally":[46],"limits":[47],"their":[48],"ability":[49],"react":[51],"unforeseen":[53],"observations":[54],"during":[55,130],"execution.":[56,131],"This":[57],"limitation":[58],"becomes":[59],"especially":[60],"critical":[61],"in":[62,197],"contact-rich":[63,198],"scenarios,":[64],"where":[65],"physical":[66],"high-frequency":[69,194],"feedback":[71,100,114,195],"demand":[72],"rapid,":[73],"reactive":[74,88],"control.":[75,101],"To":[76],"address":[77],"this":[78],"challenge,":[79],"we":[80],"propose":[81],"Tube":[82],"Diffusion":[83],"Policy":[84],"(TDP),":[85],"a":[86],"novel":[87],"visual-tactile":[89,145],"policy":[90],"framework":[92],"that":[93,124],"bridges":[94],"diffusion-based":[95],"with":[98],"tube-based":[99],"By":[102],"leveraging":[103],"the":[104,136,174,184],"expressive":[105],"power":[106],"of":[107],"generative":[108],"models,":[109],"TDP":[110,134,152,189],"learns":[111],"an":[112,121],"observation-conditioned":[113],"flow":[115],"around":[116],"nominal":[117],"chunks,":[119],"forming":[120],"tube":[123,181],"enables":[125],"fast":[126],"adaptive":[128],"reactions":[129],"We":[132],"evaluate":[133],"widely":[137],"used":[138],"Push-T":[139],"benchmark":[140],"three":[142],"additional":[143],"challenging":[144],"dexterous":[146],"tasks.":[148],"Across":[149],"all":[150],"benchmarks,":[151],"consistently":[153],"outperforms":[154],"state-of-the-art":[155],"baselines.":[158],"Two":[159],"real-world":[160],"experiments":[161],"further":[162],"validate":[163],"its":[164],"robust":[165],"reactivity":[166],"under":[167],"disturbances.":[172],"Moreover,":[173],"step-wise":[175],"correction":[176],"mechanism":[177],"enabled":[178],"by":[179],"significantly":[182],"reduces":[183],"required":[185],"denoising":[186],"steps,":[187],"making":[188],"well":[190],"suited":[191],"real-time,":[193],"control":[196],"manipulation.":[199]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-29T00:00:00"}
