{"id":"https://openalex.org/W3164043830","doi":"https://doi.org/10.2514/1.i010921","title":"Human-Aware Reinforcement Learning for Fault Recovery Using Contextual Gaussian Processes","display_name":"Human-Aware Reinforcement Learning for Fault Recovery Using Contextual Gaussian Processes","publication_year":2021,"publication_date":"2021-05-21","ids":{"openalex":"https://openalex.org/W3164043830","doi":"https://doi.org/10.2514/1.i010921","mag":"3164043830"},"language":"en","primary_location":{"id":"doi:10.2514/1.i010921","is_oa":false,"landing_page_url":"https://doi.org/10.2514/1.i010921","pdf_url":null,"source":{"id":"https://openalex.org/S4210240151","display_name":"Journal of Aerospace Information Systems","issn_l":"2327-3097","issn":["2327-3097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315709","host_organization_name":"American Institute of Aeronautics and Astronautics","host_organization_lineage":["https://openalex.org/P4310315709"],"host_organization_lineage_names":["American Institute of Aeronautics and Astronautics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Aerospace Information Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072438726","display_name":"Steve McGuire","orcid":"https://orcid.org/0000-0003-4650-7950"},"institutions":[{"id":"https://openalex.org/I185103710","display_name":"University of California, Santa Cruz","ror":"https://ror.org/03s65by71","country_code":"US","type":"education","lineage":["https://openalex.org/I185103710"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Steve McGuire","raw_affiliation_strings":["University of California Santa Cruz, Santa Cruz, California 95064"],"raw_orcid":"https://orcid.org/0000-0003-4650-7950","affiliations":[{"raw_affiliation_string":"University of California Santa Cruz, Santa Cruz, California 95064","institution_ids":["https://openalex.org/I185103710"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060580206","display_name":"P. Michael Furlong","orcid":"https://orcid.org/0000-0001-9503-8498"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"P. Michael Furlong","raw_affiliation_strings":["University of Waterloo, Waterloo, Ontario N2L 3G1, Canada"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Waterloo, Waterloo, Ontario N2L 3G1, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009328815","display_name":"Christoffer Heckman","orcid":"https://orcid.org/0000-0002-9651-6866"},"institutions":[{"id":"https://openalex.org/I188538660","display_name":"University of Colorado Boulder","ror":"https://ror.org/02ttsq026","country_code":"US","type":"education","lineage":["https://openalex.org/I188538660"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christoffer Heckman","raw_affiliation_strings":["University of Colorado at Boulder, Boulder, Colorado 80309"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Colorado at Boulder, Boulder, Colorado 80309","institution_ids":["https://openalex.org/I188538660"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049634973","display_name":"Simon Julier","orcid":"https://orcid.org/0000-0003-4380-137X"},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Simon Julier","raw_affiliation_strings":["University College London, London WC1E 6BT, England, United Kingdom"],"raw_orcid":"https://orcid.org/0000-0003-4380-137X","affiliations":[{"raw_affiliation_string":"University College London, London WC1E 6BT, England, United Kingdom","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100664008","display_name":"Nisar Ahmed","orcid":"https://orcid.org/0000-0002-7555-5671"},"institutions":[{"id":"https://openalex.org/I188538660","display_name":"University of Colorado Boulder","ror":"https://ror.org/02ttsq026","country_code":"US","type":"education","lineage":["https://openalex.org/I188538660"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nisar Ahmed","raw_affiliation_strings":["University of Colorado at Boulder, Boulder, Colorado 80303"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Colorado at Boulder, Boulder, Colorado 80303","institution_ids":["https://openalex.org/I188538660"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4197,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.68491878,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"18","issue":"7","first_page":"429","last_page":"441"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9858999848365784,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10848","display_name":"Advanced Multi-Objective Optimization Algorithms","score":0.9713000059127808,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/forgetting","display_name":"Forgetting","score":0.7450202703475952},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7434207797050476},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6183128356933594},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6000363826751709},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5938935875892639},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5016045570373535},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4989008903503418},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.49732711911201477},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.42670345306396484},{"id":"https://openalex.org/keywords/gaussian-process","display_name":"Gaussian process","score":0.42257770895957947},{"id":"https://openalex.org/keywords/human\u2013robot-interaction","display_name":"Human\u2013robot interaction","score":0.4143655598163605},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.41273263096809387},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.2733546495437622},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.24193859100341797}],"concepts":[{"id":"https://openalex.org/C7149132","wikidata":"https://www.wikidata.org/wiki/Q1377840","display_name":"Forgetting","level":2,"score":0.7450202703475952},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7434207797050476},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6183128356933594},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6000363826751709},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5938935875892639},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5016045570373535},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4989008903503418},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.49732711911201477},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.42670345306396484},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.42257770895957947},{"id":"https://openalex.org/C145460709","wikidata":"https://www.wikidata.org/wiki/Q859951","display_name":"Human\u2013robot interaction","level":3,"score":0.4143655598163605},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.41273263096809387},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.2733546495437622},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.24193859100341797},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.2514/1.i010921","is_oa":false,"landing_page_url":"https://doi.org/10.2514/1.i010921","pdf_url":null,"source":{"id":"https://openalex.org/S4210240151","display_name":"Journal of Aerospace Information Systems","issn_l":"2327-3097","issn":["2327-3097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310315709","host_organization_name":"American Institute of Aeronautics and Astronautics","host_organization_lineage":["https://openalex.org/P4310315709"],"host_organization_lineage_names":["American Institute of Aeronautics and Astronautics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Aerospace Information Systems","raw_type":"journal-article"},{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:10155800","is_oa":false,"landing_page_url":"https://discovery.ucl.ac.uk/id/eprint/10155800/","pdf_url":null,"source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"   Journal of Aerospace Information Systems , 18  (7)     (2021)      ","raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5699999928474426,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G3885598841","display_name":null,"funder_award_id":"HR0011-18-2-0043","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G6664440266","display_name":"STATE OF THE ART VIRTUAL REALITY REQUIRES LOW LATENCY  ON THE ORDER OF SINGLE-DIGIT MILLISECONDS TO PRESENT A SCENE TO AN OPERATOR USING IMMERSIVE TRACKING DEVICES. IN CONVENTIONAL TELEOPERATION  THE OPERATOR S MOVEMENTS ARE USED TO DIRECTLY CONTROL A REMOTE CAMERA  REQUIRING A FAST RESPONSE TIME TO AVOID SIMULATOR SICKNESS  AN APPROACH NOT FEASIBLE FOR INTERPLANETARY ROBOTIC CONTROL WITH LIMITED BANDWIDTH  HIGH LATENCY COMMUNICATIONS. THE PROPOSED WORK DEVELOPS A HYBRID ARCHITECTURE TO PRESENT A MODEL OF A COARSE VIRTUAL WORLD TO AN OPERATOR  WHILE THE REAL IMAGERY SLOWLY REFINES THE PRESENTATION AS BANDWIDTH ALLOWS. AN ONLINE PHYSICS ENGINE ALLOWS AN ACTUATION COMMAND IN THE VIRTUAL WORLD TO BE FAITHFULLY EXECUTED IN THE REAL WORLD WITHOUT DIRECT OPERATOR FEEDBACK. THE END GOAL IS A SMOOTH  VISUALLY REALISTIC OPERATOR INTERFACE THAT ALLOWS FOR REMOTE OPERATION OF AN EXPLORATION VEHICLE IN A BLENDED WORLD SCENE OF VIRTUAL AND ACTUAL DATA.","funder_award_id":"NNX15AQ14H","funder_id":"https://openalex.org/F4320306101","funder_display_name":"National Aeronautics and Space Administration"}],"funders":[{"id":"https://openalex.org/F4320306101","display_name":"National Aeronautics and Space Administration","ror":"https://ror.org/027ka1x80"},{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1495862233","https://openalex.org/W1576373160","https://openalex.org/W1944484981","https://openalex.org/W1970006433","https://openalex.org/W1974975426","https://openalex.org/W1990212011","https://openalex.org/W2000379412","https://openalex.org/W2028626340","https://openalex.org/W2057265280","https://openalex.org/W2077148472","https://openalex.org/W2105282743","https://openalex.org/W2108437595","https://openalex.org/W2113257089","https://openalex.org/W2138467064","https://openalex.org/W2144065457","https://openalex.org/W2164313740","https://openalex.org/W2222512263","https://openalex.org/W2570486275","https://openalex.org/W2790528771","https://openalex.org/W2914741383","https://openalex.org/W2946508746","https://openalex.org/W3013147429","https://openalex.org/W3028409083","https://openalex.org/W3100329718","https://openalex.org/W3147801202","https://openalex.org/W4206814356","https://openalex.org/W4211049957","https://openalex.org/W4230399697","https://openalex.org/W4253821632","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W4289718052","https://openalex.org/W2164121020","https://openalex.org/W2145559838","https://openalex.org/W2905319430","https://openalex.org/W3116498279","https://openalex.org/W4287549553","https://openalex.org/W4310285384","https://openalex.org/W3183027292","https://openalex.org/W4248896073","https://openalex.org/W2974871044"],"abstract_inverted_index":{"This":[0,89],"work":[1,168],"addresses":[2],"the":[3,12,61,76,99,110,147],"iterated":[4],"nonstationary":[5],"assistant":[6,82],"selection":[7,144,159],"problem,":[8],"in":[9,44,123],"which":[10,85,91],"over":[11],"course":[13],"of":[14,35,50,57,78,120,131,134,187],"repeated":[15],"interactions":[16],"on":[17,94,164],"a":[18,24,28,33,48,55,69,102,142,185],"mission,":[19],"an":[20,170],"autonomous":[21,193],"robot":[22,194],"experiencing":[23],"fault":[25],"must":[26],"select":[27],"single":[29],"human":[30,81,86,115,165,176],"from":[31],"among":[32],"group":[34],"assistants":[36,43],"to":[37,40,73,87,107,174,180],"restore":[38],"it":[39,150],"operation.":[41],"The":[42],"our":[45,95,121,127,154],"problem":[46],"have":[47],"level":[49],"performance":[51,133],"that":[52,126,153],"changes":[53],"as":[54],"function":[56],"their":[58],"experience":[59],"solving":[60],"problem.":[62],"Our":[63,167],"approach":[64],"uses":[65],"reinforcement":[66],"learning":[67,105,116,138],"via":[68],"multi-arm":[70],"bandit":[71],"formulation":[72],"learn":[74],"about":[75],"capabilities":[77],"each":[79],"potential":[80,100,172],"and":[83,117,139],"decide":[84],"task.":[88],"study,":[90],"is":[92,129,151,189],"built":[93],"past":[96],"work,":[97],"evaluates":[98],"for":[101,137,191],"Gaussian-process-based":[103],"machine":[104],"method":[106,122,128],"effectively":[108],"model":[109],"complex":[111],"dynamics":[112,136],"associated":[113],"with":[114,178],"forgetting.":[118,140],"Application":[119],"simulation":[124],"shows":[125],"capable":[130],"tracking":[132],"human-like":[135],"Using":[141],"novel":[143],"policy":[145],"called":[146],"proficiency":[148],"window,":[149],"shown":[152],"technique":[155],"can":[156],"outperform":[157],"baseline":[158],"strategies":[160],"while":[161],"providing":[162],"guarantees":[163],"use.":[166],"offers":[169],"effective":[171],"alternative":[173],"dedicated":[175],"supervisors,":[177],"application":[179],"any":[181],"human\u2013robot":[182],"system":[183],"where":[184],"set":[186],"humans":[188],"responsible":[190],"overseeing":[192],"operations.":[195]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2026-06-22T08:00:12.763002","created_date":"2025-10-10T00:00:00"}
