{"id":"https://openalex.org/W7123339755","doi":"https://doi.org/10.1109/tro.2026.3651678","title":"Safe MPC Alignment With Human Directional Feedback","display_name":"Safe MPC Alignment With Human Directional Feedback","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7123339755","doi":"https://doi.org/10.1109/tro.2026.3651678"},"language":null,"primary_location":{"id":"doi:10.1109/tro.2026.3651678","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tro.2026.3651678","pdf_url":null,"source":{"id":"https://openalex.org/S144620930","display_name":"IEEE Transactions on Robotics","issn_l":"1552-3098","issn":["1552-3098","1941-0468"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102702858","display_name":"Zhixian Xie","orcid":null},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"education","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zhixian Xie","raw_affiliation_strings":["Intelligent Robotics and Interactive Systems (IRIS) Lab, School for Engineering of Matter, Transport and Energy, Arizona State University, Tempe, AZ, USA"],"affiliations":[{"raw_affiliation_string":"Intelligent Robotics and Interactive Systems (IRIS) Lab, School for Engineering of Matter, Transport and Energy, Arizona State University, Tempe, AZ, USA","institution_ids":["https://openalex.org/I55732556"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122876197","display_name":"Wenlong Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"education","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wenlong Zhang","raw_affiliation_strings":["Polytechnic School, Arizona State University, Tempe, AZ, USA"],"affiliations":[{"raw_affiliation_string":"Polytechnic School, Arizona State University, Tempe, AZ, USA","institution_ids":["https://openalex.org/I55732556"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122884711","display_name":"Yi Ren","orcid":null},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"education","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yi Ren","raw_affiliation_strings":["School for Engineering of Matter, Transport and Energy, Arizona State University, Tempe, AZ, USA"],"affiliations":[{"raw_affiliation_string":"School for Engineering of Matter, Transport and Energy, Arizona State University, Tempe, AZ, USA","institution_ids":["https://openalex.org/I55732556"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zhaoran Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I111979921","display_name":"Northwestern University","ror":"https://ror.org/000e0be47","country_code":"US","type":"education","lineage":["https://openalex.org/I111979921"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhaoran Wang","raw_affiliation_strings":["Departments of Industrial Engineering and Management Sciences, Northwestern University, Evanston, IL, USA"],"affiliations":[{"raw_affiliation_string":"Departments of Industrial Engineering and Management Sciences, Northwestern University, Evanston, IL, USA","institution_ids":["https://openalex.org/I111979921"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122876024","display_name":"George J. Pappas","orcid":null},"institutions":[{"id":"https://openalex.org/I79576946","display_name":"University of Pennsylvania","ror":"https://ror.org/00b30xv10","country_code":"US","type":"education","lineage":["https://openalex.org/I79576946"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"George J. Pappas","raw_affiliation_strings":["Department of Electrical and Systems Engineering, University of Pennsylvania, Philadelphia, PA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Systems Engineering, University of Pennsylvania, Philadelphia, PA, USA","institution_ids":["https://openalex.org/I79576946"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111136880","display_name":"Wanxin Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I55732556","display_name":"Arizona State University","ror":"https://ror.org/03efmqc40","country_code":"US","type":"education","lineage":["https://openalex.org/I55732556"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wanxin Jin","raw_affiliation_strings":["Intelligent Robotics and Interactive Systems (IRIS) Lab, School for Engineering of Matter, Transport and Energy, Arizona State University, Tempe, AZ, USA"],"affiliations":[{"raw_affiliation_string":"Intelligent Robotics and Interactive Systems (IRIS) Lab, School for Engineering of Matter, Transport and Energy, Arizona State University, Tempe, AZ, USA","institution_ids":["https://openalex.org/I55732556"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5102702858"],"corresponding_institution_ids":["https://openalex.org/I55732556"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.09153895,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"42","issue":null,"first_page":"750","last_page":"769"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.4855000078678131,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.4855000078678131,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.24469999969005585,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.049400001764297485,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/safer","display_name":"SAFER","score":0.7394999861717224},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.6912000179290771},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6503999829292297},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.5960999727249146},{"id":"https://openalex.org/keywords/human\u2013robot-interaction","display_name":"Human\u2013robot interaction","score":0.5586000084877014},{"id":"https://openalex.org/keywords/robot-control","display_name":"Robot control","score":0.4131999909877777},{"id":"https://openalex.org/keywords/robot-kinematics","display_name":"Robot kinematics","score":0.3982999920845032},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.3785000145435333}],"concepts":[{"id":"https://openalex.org/C2776654903","wikidata":"https://www.wikidata.org/wiki/Q2601463","display_name":"SAFER","level":2,"score":0.7394999861717224},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.6912000179290771},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6503999829292297},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6450999975204468},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.5960999727249146},{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.5586000084877014},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.414900004863739},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.4131999909877777},{"id":"https://openalex.org/C74222875","wikidata":"https://www.wikidata.org/wiki/Q16000312","display_name":"Robot kinematics","level":4,"score":0.3982999920845032},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.385699987411499},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3785000145435333},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.37389999628067017},{"id":"https://openalex.org/C77553402","wikidata":"https://www.wikidata.org/wiki/Q13222579","display_name":"Upper and lower bounds","level":2,"score":0.3472999930381775},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.32170000672340393},{"id":"https://openalex.org/C60692881","wikidata":"https://www.wikidata.org/wiki/Q584529","display_name":"Humanoid robot","level":3,"score":0.31619998812675476},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.31299999356269836},{"id":"https://openalex.org/C150415221","wikidata":"https://www.wikidata.org/wiki/Q40687","display_name":"Robotic arm","level":2,"score":0.301800012588501},{"id":"https://openalex.org/C2986087404","wikidata":"https://www.wikidata.org/wiki/Q15946010","display_name":"Online learning","level":2,"score":0.2996000051498413},{"id":"https://openalex.org/C196467688","wikidata":"https://www.wikidata.org/wiki/Q1851985","display_name":"Telerobotics","level":4,"score":0.29820001125335693},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.2687000036239624},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.267300009727478},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.25839999318122864}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tro.2026.3651678","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tro.2026.3651678","pdf_url":null,"source":{"id":"https://openalex.org/S144620930","display_name":"IEEE Transactions on Robotics","issn_l":"1552-3098","issn":["1552-3098","1941-0468"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Robotics","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W1837766154","https://openalex.org/W1999874108","https://openalex.org/W2005900349","https://openalex.org/W2037997802","https://openalex.org/W2158782408","https://openalex.org/W2169498096","https://openalex.org/W2735318784","https://openalex.org/W2737702598","https://openalex.org/W2763110165","https://openalex.org/W2963627347","https://openalex.org/W2969050806","https://openalex.org/W2994446013","https://openalex.org/W3003858867","https://openalex.org/W3008128154","https://openalex.org/W3023096123","https://openalex.org/W3088135243","https://openalex.org/W3092948749","https://openalex.org/W3130163632","https://openalex.org/W3196191018","https://openalex.org/W3205292576","https://openalex.org/W3208223622","https://openalex.org/W3216784117","https://openalex.org/W4200632446","https://openalex.org/W4250589301","https://openalex.org/W4283785867","https://openalex.org/W4285018727","https://openalex.org/W4313952519","https://openalex.org/W4382239602","https://openalex.org/W4383108621","https://openalex.org/W4386981938","https://openalex.org/W4387123822","https://openalex.org/W4401417251","https://openalex.org/W4402354098","https://openalex.org/W4402402057","https://openalex.org/W4407831732","https://openalex.org/W7124354995"],"related_works":[],"abstract_inverted_index":{"In":[0,18],"safety-critical":[1],"robot":[2,29,80,165,186],"planning":[3],"or":[4,10,119],"control,":[5],"manually":[6],"specifying":[7],"safety":[8,33,57,128,190],"constraints":[9,58,191],"learning":[11,96],"them":[12],"from":[13,59],"demonstrations":[14],"can":[15],"be":[16,131],"challenging.":[17],"this":[19],"article,":[20],"we":[21,154],"propose":[22],"a":[23,28,32,162,185,193],"certifiable":[24],"alignment":[25],"method":[26,54,64,85,142,160],"for":[27],"to":[30,55,77,93,187],"learn":[31,56,189],"constraint":[34,129],"in":[35,113,149],"its":[36],"model":[37],"predictive":[38],"control":[39],"(MPC)":[40],"policy":[41],"with":[42,192],"human":[43,60,71,91,111,198],"online":[44],"directional":[45,72,199],"feedback.":[46,61],"To":[47],"our":[48,179],"knowledge,":[49],"it":[50,183],"is":[51,65,100],"the":[52,79,88,95,107,114,121,125,134,140,158,174],"first":[53],"The":[62,84,171],"proposed":[63,141,159],"based":[66],"on":[67,106,161],"an":[68,103],"empirical":[69],"observation:":[70],"feedback,":[73],"when":[74],"available,":[75],"tends":[76],"guide":[78],"toward":[81],"safer":[82],"regions.":[83],"only":[86],"requires":[87],"direction":[89],"of":[90,110,116,178,197],"feedback":[92,112],"update":[94],"hypothesis":[97,122,136],"space.":[98,137],"It":[99],"certifiable,":[101],"providing":[102],"upper":[104],"bound":[105],"total":[108],"number":[109],"case":[115],"successful":[117],"learning,":[118],"declaring":[120],"misspecification,":[123],"i.e.,":[124],"true":[126],"implicit":[127],"cannot":[130],"found":[132],"within":[133],"specified":[135],"We":[138],"evaluated":[139],"using":[143],"numerical":[144],"examples":[145],"and":[146,156,176],"user":[147],"studies":[148],"two":[150],"simulation":[151],"games.":[152],"Additionally,":[153],"implemented":[155],"tested":[157],"real-world":[163],"Franka":[164],"arm":[166],"performing":[167],"mobile":[168],"water-pouring":[169],"tasks.":[170],"results":[172],"demonstrate":[173],"efficacy":[175],"efficiency":[177],"method,":[180],"showing":[181],"that":[182],"enables":[184],"successfully":[188],"small":[194],"handful":[195],"(tens)":[196],"corrections.":[200]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2026-01-14T00:00:00"}
