{"id":"https://openalex.org/W7162795630","doi":"https://doi.org/10.48550/arxiv.2605.29766","title":"MARS Policy: Multimodality Only When It Matters","display_name":"MARS Policy: Multimodality Only When It Matters","publication_year":2026,"publication_date":"2026-05-28","ids":{"openalex":"https://openalex.org/W7162795630","doi":"https://doi.org/10.48550/arxiv.2605.29766"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.29766","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.29766","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.29766","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004534196","display_name":"Jindou Jia","orcid":"https://orcid.org/0000-0002-1866-6180"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jia, Jindou","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137400555","display_name":"Tuo An","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"An, Tuo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137383047","display_name":"Yuxuan Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Yuxuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137340516","display_name":"Gen Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Gen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137365556","display_name":"Jingliang Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jingliang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137390906","display_name":"Bohan Hou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hou, Bohan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137388672","display_name":"Xiangyu Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Xiangyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137364804","display_name":"Jiaqi Bai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bai, Jiaqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101307843","display_name":"Bofan Lyu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lyu, Bofan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137332650","display_name":"Jianfei Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Jianfei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.450300008058548,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.450300008058548,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.44040000438690186,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.02019999921321869,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5789999961853027},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5350000262260437},{"id":"https://openalex.org/keywords/multimodality","display_name":"Multimodality","score":0.46619999408721924},{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.3862999975681305},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.36410000920295715},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.3626999855041504},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.35569998621940613},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.3447999954223633}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6500999927520752},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6254000067710876},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5789999961853027},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5350000262260437},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5159000158309937},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.46619999408721924},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.3862999975681305},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.36410000920295715},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.3626999855041504},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.35569998621940613},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.350600004196167},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.3447999954223633},{"id":"https://openalex.org/C83260615","wikidata":"https://www.wikidata.org/wiki/Q6773121","display_name":"Mars Exploration Program","level":2,"score":0.3222000002861023},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.3199999928474426},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.29319998621940613},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.28760001063346863},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.287200003862381},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.287200003862381},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.28360000252723694},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.2685999870300293},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.25679999589920044}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.29766","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.29766","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.29766","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.29766","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Imitation":[0],"learning":[1,104],"has":[2,25],"become":[3],"a":[4,34,68,170],"cornerstone":[5],"for":[6],"solving":[7],"complex":[8],"robotic":[9,69],"manipulation":[10],"tasks.":[11],"In":[12,108],"particular,":[13],"multimodality,":[14],"which":[15,87],"enables":[16],"robots":[17],"to":[18,100],"capture":[19],"diverse":[20],"yet":[21],"valid":[22],"behavioral":[23,73],"patterns,":[24],"driven":[26],"the":[27,81,111,120,131,134,141],"rapid":[28],"emergence":[29],"of":[30,67,114,137,147],"generative":[31,138],"policies":[32,139,189],"as":[33],"dominant":[35],"paradigm":[36],"in":[37,55,181,190],"robot":[38],"learning.":[39],"However,":[40],"achieving":[41],"such":[42],"multimodality":[43],"typically":[44],"relies":[45],"on":[46,193],"stochastic":[47],"noise":[48,115],"initialization":[49],"and":[50,59,140,144,155,166,175],"iterative":[51],"denoising":[52],"procedures,":[53],"resulting":[54],"substantial":[56],"training":[57,143,191],"complexity":[58],"low":[60],"inference":[61,145,178],"efficiency.":[62],"Meanwhile,":[63],"not":[64],"all":[65],"phases":[66],"task":[70],"inherently":[71],"require":[72],"diversity.":[74,202],"Motivated":[75],"by":[76,196],"this":[77],"insight,":[78],"we":[79],"propose":[80],"Modality-Adaptive":[82],"Robot":[83],"Sampling":[84],"(MARS)":[85],"policy,":[86],"adaptively":[88],"invokes":[89],"tailored":[90],"stochasticity":[91],"only":[92,118],"when":[93],"it":[94],"is":[95,116],"truly":[96],"beneficial,":[97],"while":[98],"reverting":[99],"an":[101,176],"efficient":[102],"deterministic":[103,148,188],"during":[105],"single-modal":[106],"phases.":[107],"other":[109],"words,":[110],"proper":[112,121],"amount":[113],"injected":[117],"at":[119],"time.":[122],"By":[123],"selectively":[124],"activating":[125],"multimodal":[126,135,164],"generation,":[127],"MARS":[128,161,185],"policy":[129],"bridges":[130],"gap":[132],"between":[133],"capability":[136],"superior":[142],"efficiency":[146,192],"models.":[149],"Empirical":[150],"studies":[151],"across":[152],"8":[153],"simulated":[154],"4":[156],"real-world":[157,182],"tasks":[158,195],"demonstrate":[159],"that":[160],"exhibits":[162],"robust":[163],"expressivity":[165],"high":[167],"efficiency,":[168],"with":[169],"16.67%":[171],"success":[172],"rate":[173],"improvement":[174],"83.20%":[177],"latency":[179],"reduction":[180],"tests.":[183],"Counterintuitively,":[184],"also":[186],"outpaces":[187],"near-deterministic":[194],"more":[197],"effectively":[198],"modeling":[199],"nuanced":[200],"action":[201]},"counts_by_year":[],"updated_date":"2026-07-01T08:55:40.977307","created_date":"2026-05-30T00:00:00"}
