{"id":"https://openalex.org/W7128520237","doi":"https://doi.org/10.48550/arxiv.2602.08602","title":"Mimic Intent, Not Just Trajectories","display_name":"Mimic Intent, Not Just Trajectories","publication_year":2026,"publication_date":"2026-02-09","ids":{"openalex":"https://openalex.org/W7128520237","doi":"https://doi.org/10.48550/arxiv.2602.08602"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.08602","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125574905","display_name":"Renming Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Renming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063555214","display_name":"Chen-dong Zeng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zeng, Chendong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125588517","display_name":"Wenjing Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Wenjing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125590655","display_name":"Jingtian Cai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cai, Jintian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107334651","display_name":"CeWu Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Cewu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5077008575","display_name":"Panpan Cai","orcid":"https://orcid.org/0000-0003-1926-4842"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cai, Panpan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.6991999745368958,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.6991999745368958,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.06750000268220901,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.06340000033378601,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.6348999738693237},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5824999809265137},{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.5769000053405762},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5472999811172485},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5252000093460083},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.48410001397132874},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.4496000111103058},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4189000129699707}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7347999811172485},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.6348999738693237},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6103000044822693},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5824999809265137},{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.5769000053405762},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5472999811172485},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5252000093460083},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.48410001397132874},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.4496000111103058},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4189000129699707},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.40299999713897705},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.4016999900341034},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.39329999685287476},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.3605000078678131},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.33709999918937683},{"id":"https://openalex.org/C132964779","wikidata":"https://www.wikidata.org/wiki/Q2110223","display_name":"Raw data","level":2,"score":0.33219999074935913},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.3296000063419342},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.32739999890327454},{"id":"https://openalex.org/C13687954","wikidata":"https://www.wikidata.org/wiki/Q4826847","display_name":"Autonomous agent","level":2,"score":0.3160000145435333},{"id":"https://openalex.org/C189645446","wikidata":"https://www.wikidata.org/wiki/Q350865","display_name":"Mirroring","level":2,"score":0.2935999929904938},{"id":"https://openalex.org/C2776240099","wikidata":"https://www.wikidata.org/wiki/Q327018","display_name":"Interrogation","level":2,"score":0.275299996137619},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.26829999685287476},{"id":"https://openalex.org/C2780440489","wikidata":"https://www.wikidata.org/wiki/Q5227278","display_name":"Data-driven","level":2,"score":0.2614000141620636},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.25619998574256897}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.08602","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.08602","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.08602","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.08602","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"While":[0],"imitation":[1],"learning":[2,146],"(IL)":[3],"has":[4],"achieved":[5],"impressive":[6],"success":[7,184],"in":[8,57],"dexterous":[9],"manipulation":[10,175],"through":[11,137],"generative":[12],"modeling":[13],"and":[14,29,90,100,116,118,148,177,193],"pretraining,":[15],"state-of-the-art":[16,183],"approaches":[17],"like":[18],"Vision-Language-Action":[19],"(VLA)":[20],"models":[21],"still":[22],"struggle":[23],"with":[24,85],"adaptation":[25,125],"to":[26,95,103,126],"environmental":[27,127],"changes":[28],"skill":[30],"transfer.":[31,196],"We":[32,65,81],"argue":[33],"this":[34,67,131,151],"stems":[35],"from":[36,54,164],"mimicking":[37],"raw":[38],"trajectories":[39,136],"without":[40],"understanding":[41],"the":[42,92,161,168],"underlying":[43],"intent.":[44],"To":[45],"address":[46],"this,":[47],"we":[48],"propose":[49],"explicitly":[50],"disentangling":[51],"behavior":[52],"intent":[53],"execution":[55],"details":[56],"end-2-end":[58],"IL:":[59],"Mimic":[60],"Intent,":[61],"Not":[62],"just":[63],"Trajectories(MINT).":[64],"achieve":[66],"via":[68],"multi-scale":[69,87,119],"frequency-space":[70],"tokenization,":[71],"which":[72],"enforces":[73],"a":[74,86,165,179],"spectral":[75],"decomposition":[76],"of":[77,156],"action":[78,83],"chunk":[79],"representation.":[80],"learn":[82],"tokens":[84,102,121],"coarse-to-fine":[88],"structure,":[89],"force":[91],"coarsest":[93],"token":[94,112,163],"capture":[96],"low-frequency":[97],"global":[98],"structure":[99],"finer":[101],"encode":[104],"high-frequency":[105],"details.":[106],"This":[107],"yields":[108],"an":[109],"abstract":[110],"Intent":[111,162],"that":[113,122],"facilitates":[114],"planning":[115],"transfer,":[117],"Execution":[120],"enable":[123],"precise":[124],"dynamics.":[128],"Building":[129],"on":[130,173,178],"hierarchy,":[132],"our":[133],"policy":[134],"generates":[135],"next-scale":[138],"autoregression,":[139],"performing":[140],"progressive":[141],"intent-to-execution":[142],"reasoning,":[143],"thus":[144],"boosting":[145],"efficiency":[147],"generalization.":[149],"Crucially,":[150],"disentanglement":[152],"enables":[153],"one-shot":[154,195],"transfer":[155],"skills,":[157],"by":[158],"simply":[159],"injecting":[160],"demonstration":[166],"into":[167],"autoregressive":[169],"generation":[170],"process.":[171],"Experiments":[172],"several":[174],"benchmarks":[176],"real":[180],"robot":[181],"demonstrate":[182],"rates,":[185],"superior":[186],"inference":[187],"efficiency,":[188],"robust":[189],"generalization":[190],"against":[191],"disturbances,":[192],"effective":[194]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-02-11T00:00:00"}
