{"id":"https://openalex.org/W7160243228","doi":"https://doi.org/10.48550/arxiv.2605.01191","title":"Sentinel-VLA: A Metacognitive VLA Model with Active Status Monitoring for Dynamic Reasoning and Error Recovery","display_name":"Sentinel-VLA: A Metacognitive VLA Model with Active Status Monitoring for Dynamic Reasoning and Error Recovery","publication_year":2026,"publication_date":"2026-05-02","ids":{"openalex":"https://openalex.org/W7160243228","doi":"https://doi.org/10.48550/arxiv.2605.01191"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.01191","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.01191","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.01191","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135335496","display_name":"Wenhao Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Wenhao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135403641","display_name":"Xiu Su","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Xiu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135297145","display_name":"Yichao Cao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Niu, Dan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135371616","display_name":"Hongyan Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Yichao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135284364","display_name":"Xiaobo Xia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Hongyan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135373697","display_name":"Shan You","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qu, Zhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135400969","display_name":"Yi Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fan, Lei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135300920","display_name":"Chang Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"You, Shan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Xu, Chang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Chang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9480000138282776,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9480000138282776,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.013199999928474426,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.00559999980032444,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6644999980926514},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.5142999887466431},{"id":"https://openalex.org/keywords/metacognition","display_name":"Metacognition","score":0.47510001063346863},{"id":"https://openalex.org/keywords/embodied-cognition","display_name":"Embodied cognition","score":0.4641999900341034},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4422999918460846},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4198000133037567},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.37209999561309814},{"id":"https://openalex.org/keywords/multi-task-learning","display_name":"Multi-task learning","score":0.35749998688697815},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.3555999994277954}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7347000241279602},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6644999980926514},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5821999907493591},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.5142999887466431},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.49000000953674316},{"id":"https://openalex.org/C118147538","wikidata":"https://www.wikidata.org/wiki/Q1126970","display_name":"Metacognition","level":3,"score":0.47510001063346863},{"id":"https://openalex.org/C100609095","wikidata":"https://www.wikidata.org/wiki/Q1335050","display_name":"Embodied cognition","level":2,"score":0.4641999900341034},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4422999918460846},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4198000133037567},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.37209999561309814},{"id":"https://openalex.org/C28006648","wikidata":"https://www.wikidata.org/wiki/Q6934509","display_name":"Multi-task learning","level":3,"score":0.35749998688697815},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.3555999994277954},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.3353999853134155},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.3246000111103058},{"id":"https://openalex.org/C197298091","wikidata":"https://www.wikidata.org/wiki/Q5318963","display_name":"Dynamic data","level":2,"score":0.3230000138282776},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.31520000100135803},{"id":"https://openalex.org/C177284502","wikidata":"https://www.wikidata.org/wiki/Q1005390","display_name":"Adapter (computing)","level":2,"score":0.3109999895095825},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.28850001096725464},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.2840999960899353},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.26930001378059387},{"id":"https://openalex.org/C193611912","wikidata":"https://www.wikidata.org/wiki/Q4677596","display_name":"Active vision","level":2,"score":0.26820001006126404},{"id":"https://openalex.org/C115086926","wikidata":"https://www.wikidata.org/wiki/Q17004651","display_name":"Causal reasoning","level":3,"score":0.2653999924659729},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.25540000200271606},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.2513999938964844}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.01191","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.01191","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.01191","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.01191","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7875229716300964,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Vision-language-action":[0],"(VLA)":[1],"models":[2,21],"have":[3],"advanced":[4],"the":[5,73,119,163,172,180],"field":[6],"of":[7,32],"embodied":[8],"manipulation":[9],"by":[10,167],"harnessing":[11],"broad":[12],"world":[13],"knowledge":[14],"and":[15,35,102,110,133,183],"strong":[16],"generalization.":[17],"However,":[18],"current":[19],"VLA":[20,47],"still":[22],"face":[23],"several":[24],"key":[25],"challenges,":[26],"including":[27],"limited":[28],"reasoning":[29,78,86],"capability,":[30],"lack":[31],"status":[33],"monitoring,":[34],"difficulty":[36],"in":[37],"self-correction.":[38],"In":[39],"this":[40],"paper,":[41],"we":[42],"introduce":[43],"\\textbf{Sentinel-VLA},":[44],"a":[45,76],"metacognitive":[46],"model":[48,74],"equipped":[49],"with":[50,140],"an":[51,71,150],"active":[52],"``sentinel''":[53],"module":[54],"to":[55,128,145,149,171],"monitor":[56],"real-time":[57],"execution":[58],"status.":[59],"Only":[60],"when":[61],"necessary,":[62],"such":[63],"as":[64],"during":[65],"initial":[66],"planning":[67],"or":[68,79],"upon":[69],"detecting":[70],"error,":[72],"triggers":[75],"dynamic":[77],"formulate":[80],"error":[81],"recovery":[82],"solutions.":[83],"This":[84],"on-demand":[85],"mechanism":[87],"ensures":[88],"robust":[89],"decision-making":[90],"while":[91],"minimizing":[92],"computational":[93],"overhead.":[94],"Notably,":[95],"all":[96,179],"training":[97],"data":[98,136,184],"(spanning":[99],"44":[100],"tasks":[101],"over":[103,168],"2.6":[104],"million":[105],"transitions)":[106],"is":[107],"automatically":[108,134],"generated":[109],"annotated":[111],"through":[112],"our":[113],"designed":[114],"pipeline.":[115,186],"We":[116,176],"also":[117],"propose":[118],"Self-Evolving":[120],"Continual":[121,142],"Learning":[122],"(SECL)":[123],"algorithm,":[124],"which":[125],"allows":[126],"Sentinel-VLA":[127,161],"identify":[129],"its":[130],"capability":[131],"boundaries":[132],"collect":[135],"for":[137],"expansion,":[138],"paired":[139],"Orthogonal":[141],"Adapter":[143],"(OC-Adapter)":[144],"constrain":[146],"parameter":[147],"updates":[148],"orthogonal":[151],"space,":[152],"thereby":[153],"preventing":[154],"catastrophic":[155],"forgetting.":[156],"Real-world":[157],"experiments":[158],"demonstrate":[159],"that":[160],"boosts":[162],"task":[164],"success":[165],"rate":[166],"30\\%":[169],"compared":[170],"SOTA":[173],"model,":[174],"PI0.":[175],"will":[177],"open-source":[178],"code,":[181],"weights,":[182],"generation":[185]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-06T00:00:00"}
