{"id":"https://openalex.org/W3212409086","doi":"https://doi.org/10.3390/robotics12050127","title":"GRI: General Reinforced Imitation and Its Application to Vision-Based Autonomous Driving","display_name":"GRI: General Reinforced Imitation and Its Application to Vision-Based Autonomous Driving","publication_year":2023,"publication_date":"2023-09-06","ids":{"openalex":"https://openalex.org/W3212409086","doi":"https://doi.org/10.3390/robotics12050127","mag":"3212409086"},"language":"en","primary_location":{"id":"doi:10.3390/robotics12050127","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics12050127","pdf_url":"https://www.mdpi.com/2218-6581/12/5/127/pdf?version=1693994176","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2218-6581/12/5/127/pdf?version=1693994176","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040722138","display_name":"Raphael Chekroun","orcid":null},"institutions":[{"id":"https://openalex.org/I220619192","display_name":"Valeo (France)","ror":"https://ror.org/04ryqpf83","country_code":"FR","type":"company","lineage":["https://openalex.org/I220619192"]},{"id":"https://openalex.org/I2746051580","display_name":"Universit\u00e9 Paris Sciences et Lettres","ror":"https://ror.org/013cjyk83","country_code":"FR","type":"education","lineage":["https://openalex.org/I2746051580"]},{"id":"https://openalex.org/I4210154688","display_name":"H\u00f4pital Saint-Michel","ror":"https://ror.org/057v2pg43","country_code":"FR","type":"healthcare","lineage":["https://openalex.org/I4210154688"]},{"id":"https://openalex.org/I4403386650","display_name":"Centre de Robotique","ror":"https://ror.org/0180r7w69","country_code":null,"type":"education","lineage":["https://openalex.org/I190752583","https://openalex.org/I2746051580","https://openalex.org/I4403386650","https://openalex.org/I70768539"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Raphael Chekroun","raw_affiliation_strings":["Center for Robotics, Mines Paris, PSL University, 75006 Paris, France","Valeo Driving Assistant Research, 75017 Paris, France","CAOR - Centre de Robotique (60, boulevard Saint-Michel 75272 Paris cedex 06 - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Center for Robotics, Mines Paris, PSL University, 75006 Paris, France","institution_ids":["https://openalex.org/I2746051580"]},{"raw_affiliation_string":"Valeo Driving Assistant Research, 75017 Paris, France","institution_ids":["https://openalex.org/I220619192"]},{"raw_affiliation_string":"CAOR - Centre de Robotique (60, boulevard Saint-Michel 75272 Paris cedex 06 - France)","institution_ids":["https://openalex.org/I4210154688","https://openalex.org/I4403386650"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046953494","display_name":"Marin Toromanoff","orcid":null},"institutions":[{"id":"https://openalex.org/I220619192","display_name":"Valeo (France)","ror":"https://ror.org/04ryqpf83","country_code":"FR","type":"company","lineage":["https://openalex.org/I220619192"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Marin Toromanoff","raw_affiliation_strings":["Valeo Driving Assistant Research, 75017 Paris, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Valeo Driving Assistant Research, 75017 Paris, France","institution_ids":["https://openalex.org/I220619192"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044031406","display_name":"Sascha Hornauer","orcid":null},"institutions":[{"id":"https://openalex.org/I2746051580","display_name":"Universit\u00e9 Paris Sciences et Lettres","ror":"https://ror.org/013cjyk83","country_code":"FR","type":"education","lineage":["https://openalex.org/I2746051580"]},{"id":"https://openalex.org/I4210154688","display_name":"H\u00f4pital Saint-Michel","ror":"https://ror.org/057v2pg43","country_code":"FR","type":"healthcare","lineage":["https://openalex.org/I4210154688"]},{"id":"https://openalex.org/I4403386650","display_name":"Centre de Robotique","ror":"https://ror.org/0180r7w69","country_code":null,"type":"education","lineage":["https://openalex.org/I190752583","https://openalex.org/I2746051580","https://openalex.org/I4403386650","https://openalex.org/I70768539"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Sascha Hornauer","raw_affiliation_strings":["Center for Robotics, Mines Paris, PSL University, 75006 Paris, France","CAOR - Centre de Robotique (60, boulevard Saint-Michel 75272 Paris cedex 06 - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Center for Robotics, Mines Paris, PSL University, 75006 Paris, France","institution_ids":["https://openalex.org/I2746051580"]},{"raw_affiliation_string":"CAOR - Centre de Robotique (60, boulevard Saint-Michel 75272 Paris cedex 06 - France)","institution_ids":["https://openalex.org/I4210154688","https://openalex.org/I4403386650"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008228948","display_name":"Fabien Moutarde","orcid":"https://orcid.org/0000-0003-4799-7285"},"institutions":[{"id":"https://openalex.org/I2746051580","display_name":"Universit\u00e9 Paris Sciences et Lettres","ror":"https://ror.org/013cjyk83","country_code":"FR","type":"education","lineage":["https://openalex.org/I2746051580"]},{"id":"https://openalex.org/I4210154688","display_name":"H\u00f4pital Saint-Michel","ror":"https://ror.org/057v2pg43","country_code":"FR","type":"healthcare","lineage":["https://openalex.org/I4210154688"]},{"id":"https://openalex.org/I4403386650","display_name":"Centre de Robotique","ror":"https://ror.org/0180r7w69","country_code":null,"type":"education","lineage":["https://openalex.org/I190752583","https://openalex.org/I2746051580","https://openalex.org/I4403386650","https://openalex.org/I70768539"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Fabien Moutarde","raw_affiliation_strings":["Center for Robotics, Mines Paris, PSL University, 75006 Paris, France","CAOR - Centre de Robotique (60, boulevard Saint-Michel 75272 Paris cedex 06 - France)"],"raw_orcid":"https://orcid.org/0000-0003-4799-7285","affiliations":[{"raw_affiliation_string":"Center for Robotics, Mines Paris, PSL University, 75006 Paris, France","institution_ids":["https://openalex.org/I2746051580"]},{"raw_affiliation_string":"CAOR - Centre de Robotique (60, boulevard Saint-Michel 75272 Paris cedex 06 - France)","institution_ids":["https://openalex.org/I4210154688","https://openalex.org/I4403386650"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5040722138"],"corresponding_institution_ids":["https://openalex.org/I220619192","https://openalex.org/I2746051580","https://openalex.org/I4210154688","https://openalex.org/I4403386650"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1600,"currency":"CHF","value_usd":1732},"fwci":6.8163,"has_fulltext":true,"cited_by_count":42,"citation_normalized_percentile":{"value":0.97527069,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"12","issue":"5","first_page":"127","last_page":"127"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.8674029111862183},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7642808556556702},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7335363030433655},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6540268659591675},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.5514319539070129},{"id":"https://openalex.org/keywords/imitation","display_name":"Imitation","score":0.4456263780593872},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41823485493659973},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.4182090759277344},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.3728260397911072},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.14713618159294128}],"concepts":[{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.8674029111862183},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7642808556556702},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7335363030433655},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6540268659591675},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.5514319539070129},{"id":"https://openalex.org/C126388530","wikidata":"https://www.wikidata.org/wiki/Q1131737","display_name":"Imitation","level":2,"score":0.4456263780593872},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41823485493659973},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4182090759277344},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.3728260397911072},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.14713618159294128},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.3390/robotics12050127","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics12050127","pdf_url":"https://www.mdpi.com/2218-6581/12/5/127/pdf?version=1693994176","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2111.08575","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2111.08575","pdf_url":"https://arxiv.org/pdf/2111.08575","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:HAL:hal-04375385v1","is_oa":true,"landing_page_url":"https://minesparis-psl.hal.science/hal-04375385","pdf_url":"https://minesparis-psl.hal.science/hal-04375385/document","source":{"id":"https://openalex.org/S4406922466","display_name":"SPIRE - Sciences Po Institutional REpository","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Robotics, 2023, 12 (5), pp.127. &#x27E8;10.3390/robotics12050127&#x27E9;","raw_type":"Journal articles"},{"id":"pmh:oai:doaj.org/article:b1048a8c866d48639b380ceedde5efc9","is_oa":true,"landing_page_url":"https://doaj.org/article/b1048a8c866d48639b380ceedde5efc9","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Robotics, Vol 12, Iss 5, p 127 (2023)","raw_type":"article"},{"id":"pmh:oai:mdpi.com:/2218-6581/12/5/127/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/robotics12050127","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Robotics","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/robotics12050127","is_oa":true,"landing_page_url":"https://doi.org/10.3390/robotics12050127","pdf_url":"https://www.mdpi.com/2218-6581/12/5/127/pdf?version=1693994176","source":{"id":"https://openalex.org/S4210232487","display_name":"Robotics","issn_l":"2218-6581","issn":["2218-6581"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Robotics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.7699999809265137}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3212409086.pdf"},"referenced_works_count":46,"referenced_works":["https://openalex.org/W2145339207","https://openalex.org/W2158782408","https://openalex.org/W2173248099","https://openalex.org/W2260756217","https://openalex.org/W2342840547","https://openalex.org/W2607198029","https://openalex.org/W2736601468","https://openalex.org/W2761873684","https://openalex.org/W2781726626","https://openalex.org/W2785379783","https://openalex.org/W2787938642","https://openalex.org/W2788862220","https://openalex.org/W2803308811","https://openalex.org/W2944911388","https://openalex.org/W2946948417","https://openalex.org/W2955425717","https://openalex.org/W2962867954","https://openalex.org/W2962878825","https://openalex.org/W2962999504","https://openalex.org/W2963363446","https://openalex.org/W2963411833","https://openalex.org/W2963864421","https://openalex.org/W2963923407","https://openalex.org/W2964043796","https://openalex.org/W2964055695","https://openalex.org/W2967785980","https://openalex.org/W2981836239","https://openalex.org/W2994240296","https://openalex.org/W3009593063","https://openalex.org/W3028831193","https://openalex.org/W3034445502","https://openalex.org/W3101780148","https://openalex.org/W3157836284","https://openalex.org/W3172863135","https://openalex.org/W3193987867","https://openalex.org/W3204011027","https://openalex.org/W4214759451","https://openalex.org/W4283076523","https://openalex.org/W4288804588","https://openalex.org/W4312862130","https://openalex.org/W4312947590","https://openalex.org/W4386066695","https://openalex.org/W6745935785","https://openalex.org/W6771522568","https://openalex.org/W6772033386","https://openalex.org/W6839043673"],"related_works":["https://openalex.org/W4387497383","https://openalex.org/W3183948672","https://openalex.org/W3173606202","https://openalex.org/W3110381201","https://openalex.org/W2948807893","https://openalex.org/W2935909890","https://openalex.org/W2778153218","https://openalex.org/W2758277628","https://openalex.org/W1531601525","https://openalex.org/W2768698792"],"abstract_inverted_index":{"Deep":[0],"reinforcement":[1],"learning":[2],"(DRL)":[3],"has":[4],"been":[5],"demonstrated":[6],"to":[7,47,49,76],"be":[8,91],"effective":[9],"for":[10],"several":[11],"complex":[12],"decision-making":[13],"applications,":[14],"such":[15],"as":[16,39,93],"autonomous":[17,148],"driving":[18,149],"and":[19,31,70,73,126,177],"robotics.":[20],"However,":[21],"DRL":[22],"is":[23,42,74],"notoriously":[24],"limited":[25],"by":[26,186],"its":[27,32],"high":[28,102],"sample":[29],"complexity":[30],"lack":[33],"of":[34,112],"stability.":[35],"Prior":[36],"knowledge,":[37],"e.g.,":[38],"expert":[40,71,88,119],"demonstrations,":[41],"often":[43],"available":[44],"but":[45],"challenging":[46],"leverage":[48],"mitigate":[50],"these":[51],"issues.":[52],"In":[53],"this":[54,106],"paper,":[55],"we":[56],"propose":[57],"General":[58],"Reinforced":[59],"Imitation":[60],"(GRI),":[61],"a":[62,100],"novel":[63],"method":[64,158,170],"which":[65,121],"combines":[66],"benefits":[67],"from":[68,132],"exploration":[69,136],"data":[72,95,120],"straightforward":[75],"implement":[77],"over":[78],"any":[79],"off-policy":[80,166],"RL":[81,135,167],"algorithm.":[82],"We":[83,138,153],"make":[84],"one":[85],"simplifying":[86],"hypothesis:":[87],"demonstrations":[89],"can":[90],"seen":[92],"perfect":[94],"whose":[96],"underlying":[97],"policy":[98],"gets":[99],"constant":[101],"reward.":[103],"Based":[104],"on":[105,146,159,173,180],"assumption,":[107],"GRI":[108,157],"introduces":[109],"the":[110,129,133,156,174,182],"notion":[111],"offline":[113],"demonstration":[114],"agent.":[115,137],"This":[116],"agent":[117],"sends":[118],"are":[122],"processed":[123],"both":[124],"concurrently":[125],"indistinguishably":[127],"with":[128,164],"experiences":[130],"coming":[131],"online":[134],"show":[139],"that":[140],"our":[141],"approach":[142],"enables":[143],"major":[144],"improvements":[145],"camera-based":[147],"in":[150],"urban":[151],"environments.":[152],"further":[154],"validate":[155],"Mujoco":[160],"continuous":[161],"control":[162],"tasks":[163],"different":[165],"algorithms.":[168],"Our":[169],"ranked":[171],"first":[172],"CARLA":[175],"Leaderboard":[176],"outperforms":[178],"World":[179],"Rails,":[181],"previous":[183],"state-of-the-art":[184],"method,":[185],"17%.":[187]},"counts_by_year":[{"year":2025,"cited_by_count":19},{"year":2024,"cited_by_count":16},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":2}],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
