{"id":"https://openalex.org/W2883896749","doi":"https://doi.org/10.1109/iros40897.2019.8968287","title":"EnsembleDAgger: A Bayesian Approach to Safe Imitation Learning","display_name":"EnsembleDAgger: A Bayesian Approach to Safe Imitation Learning","publication_year":2019,"publication_date":"2019-11-01","ids":{"openalex":"https://openalex.org/W2883896749","doi":"https://doi.org/10.1109/iros40897.2019.8968287","mag":"2883896749"},"language":"en","primary_location":{"id":"doi:10.1109/iros40897.2019.8968287","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros40897.2019.8968287","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1807.08364","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019684645","display_name":"Kunal Menda","orcid":"https://orcid.org/0000-0003-1830-0637"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Kunal Menda","raw_affiliation_strings":["Stanford University,Stanford,CA,USA,94305","Stanford University ()"],"affiliations":[{"raw_affiliation_string":"Stanford University,Stanford,CA,USA,94305","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"Stanford University ()","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059066811","display_name":"Katherine Driggs-Campbell","orcid":"https://orcid.org/0000-0003-3760-9859"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]},{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Katherine Driggs-Campbell","raw_affiliation_strings":["University of Illinois at Urbana-Champaign,IL,USA,61820","Stanford University ()"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign,IL,USA,61820","institution_ids":["https://openalex.org/I157725225"]},{"raw_affiliation_string":"Stanford University ()","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5068326377","display_name":"Mykel J. Kochenderfer","orcid":"https://orcid.org/0000-0002-7238-9663"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]},{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mykel J. Kochenderfer","raw_affiliation_strings":["Stanford University,Stanford,CA,USA,94305","***University of Illinois at Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"Stanford University,Stanford,CA,USA,94305","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"***University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5019684645"],"corresponding_institution_ids":["https://openalex.org/I97018004"],"apc_list":null,"apc_paid":null,"fwci":0.76808873,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.76854943,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"5041","last_page":"5048"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6826623678207397},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6424659490585327},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.6370389461517334},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6256650686264038},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.5336967706680298},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.4695706367492676},{"id":"https://openalex.org/keywords/bayesian-inference","display_name":"Bayesian inference","score":0.43519580364227295},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4241240620613098}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6826623678207397},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6424659490585327},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.6370389461517334},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6256650686264038},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.5336967706680298},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.4695706367492676},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.43519580364227295},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4241240620613098},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/iros40897.2019.8968287","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros40897.2019.8968287","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1807.08364","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1807.08364","pdf_url":"https://arxiv.org/pdf/1807.08364","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"mag:2883896749","is_oa":true,"landing_page_url":"https://arxiv.org/pdf/1807.08364.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.1807.08364","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.1807.08364","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1807.08364","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1807.08364","pdf_url":"https://arxiv.org/pdf/1807.08364","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.550000011920929}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2883896749.pdf","grobid_xml":"https://content.openalex.org/works/W2883896749.grobid-xml"},"referenced_works_count":40,"referenced_works":["https://openalex.org/W1502922572","https://openalex.org/W1746819321","https://openalex.org/W1986014385","https://openalex.org/W2053572490","https://openalex.org/W2071841410","https://openalex.org/W2095705004","https://openalex.org/W2097113539","https://openalex.org/W2100128988","https://openalex.org/W2101234009","https://openalex.org/W2104733512","https://openalex.org/W2142641780","https://openalex.org/W2148112459","https://openalex.org/W2158349948","https://openalex.org/W2295827790","https://openalex.org/W2298163601","https://openalex.org/W2396217537","https://openalex.org/W2409942531","https://openalex.org/W2462906003","https://openalex.org/W2618318883","https://openalex.org/W2895144567","https://openalex.org/W2912415163","https://openalex.org/W2962957031","https://openalex.org/W2963238274","https://openalex.org/W2963641140","https://openalex.org/W2964052793","https://openalex.org/W2964059111","https://openalex.org/W3098713169","https://openalex.org/W4211049957","https://openalex.org/W6617145748","https://openalex.org/W6640174482","https://openalex.org/W6675999342","https://openalex.org/W6680724558","https://openalex.org/W6704571135","https://openalex.org/W6718836005","https://openalex.org/W6730042731","https://openalex.org/W6738483526","https://openalex.org/W6745256532","https://openalex.org/W6753133050","https://openalex.org/W6754881090","https://openalex.org/W6780559895"],"related_works":["https://openalex.org/W3003342008","https://openalex.org/W2757751962","https://openalex.org/W2895144567","https://openalex.org/W2951934018","https://openalex.org/W2891781407","https://openalex.org/W2750875954","https://openalex.org/W2560678327","https://openalex.org/W3210702899","https://openalex.org/W3205195733","https://openalex.org/W2902567911","https://openalex.org/W2626860042","https://openalex.org/W3138964531","https://openalex.org/W2097668489","https://openalex.org/W3175537068","https://openalex.org/W2890026535","https://openalex.org/W3181841583","https://openalex.org/W2084310490","https://openalex.org/W1486103295","https://openalex.org/W3208712148","https://openalex.org/W2998219625"],"abstract_inverted_index":{"While":[0],"imitation":[1,146],"learning":[2,137,147],"is":[3,19,106],"often":[4],"used":[5],"in":[6,153],"robotics,":[7],"the":[8,33,42,57,60,82,100,110,121,128,154],"approach":[9],"frequently":[10],"suffers":[11],"from":[12,31],"data":[13,30],"mismatch":[14],"and":[15,35,136,144,152],"compounding":[16],"errors.":[17],"DAgger":[18,142],"an":[20,76,149],"iterative":[21],"algorithm":[22],"that":[23,94],"addresses":[24],"these":[25],"issues":[26],"by":[27],"aggregating":[28],"training":[29],"both":[32],"expert":[34],"novice":[36,61,111],"policies,":[37],"but":[38],"does":[39],"not":[40],"consider":[41],"impact":[43],"of":[44,59,78,87,124,130],"safety.":[45,67],"We":[46,132],"present":[47],"a":[48,64,72,85,91],"probabilistic":[49],"extension":[50],"to":[51,55,108,112,119,140],"DAgger,":[52],"which":[53],"attempts":[54],"quantify":[56],"confidence":[58],"policy":[62],"as":[63,84],"proxy":[65],"for":[66],"Our":[68],"method,":[69],"EnsembleDAgger,":[70],"approximates":[71],"Gaussian":[73],"Process":[74],"using":[75],"ensemble":[77],"neural":[79],"networks.":[80],"Using":[81],"variance":[83],"measure":[86],"confidence,":[88],"we":[89,98,117],"compute":[90],"decision":[92],"rule":[93],"captures":[95],"how":[96],"much":[97],"doubt":[99],"novice,":[101],"thus":[102],"determining":[103],"when":[104],"it":[105],"safe":[107],"allow":[109],"act.":[113],"With":[114],"this":[115],"approach,":[116],"aim":[118],"maximize":[120],"novice's":[122],"share":[123],"actions,":[125],"while":[126],"constraining":[127],"probability":[129],"failure.":[131],"demonstrate":[133],"improved":[134],"safety":[135],"performance":[138],"compared":[139],"other":[141],"variants":[143],"classic":[145],"on":[148],"inverted":[150],"pendulum":[151],"MuJoCo":[155],"HalfCheetah":[156],"environment.":[157]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
