{"id":"https://openalex.org/W2911695803","doi":"https://doi.org/10.1109/lra.2019.2895892","title":"Rover-IRL: Inverse Reinforcement Learning With Soft Value Iteration Networks for Planetary Rover Path Planning","display_name":"Rover-IRL: Inverse Reinforcement Learning With Soft Value Iteration Networks for Planetary Rover Path Planning","publication_year":2019,"publication_date":"2019-01-29","ids":{"openalex":"https://openalex.org/W2911695803","doi":"https://doi.org/10.1109/lra.2019.2895892","mag":"2911695803"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2019.2895892","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2019.2895892","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072199290","display_name":"Max Pflueger","orcid":"https://orcid.org/0000-0003-0667-0518"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Max Pflueger","raw_affiliation_strings":["Department of Computer Science, University of Southern California, Los Angeles, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Southern California, Los Angeles, CA, USA","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110480055","display_name":"Ali Agha","orcid":null},"institutions":[{"id":"https://openalex.org/I1334627681","display_name":"Jet Propulsion Laboratory","ror":"https://ror.org/027k65916","country_code":"US","type":"facility","lineage":["https://openalex.org/I122411786","https://openalex.org/I1334627681","https://openalex.org/I4210124779"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ali Agha","raw_affiliation_strings":["Jet Propulsion Laboratory, California Institute of Technology, Pasadena, CA, USA"],"affiliations":[{"raw_affiliation_string":"Jet Propulsion Laboratory, California Institute of Technology, Pasadena, CA, USA","institution_ids":["https://openalex.org/I1334627681"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077367921","display_name":"Gaurav S. Sukhatme","orcid":"https://orcid.org/0000-0003-2408-474X"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gaurav S. Sukhatme","raw_affiliation_strings":["Department of Computer Science, University of Southern California, Los Angeles, CA, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Southern California, Los Angeles, CA, USA","institution_ids":["https://openalex.org/I1174212"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5072199290"],"corresponding_institution_ids":["https://openalex.org/I1174212"],"apc_list":null,"apc_paid":null,"fwci":4.4806,"has_fulltext":false,"cited_by_count":58,"citation_normalized_percentile":{"value":0.95581468,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"4","issue":"2","first_page":"1387","last_page":"1394"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9805999994277954,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7531414031982422},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6601762175559998},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.6045448184013367},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4730488359928131},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4725577235221863},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.33810916543006897}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7531414031982422},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6601762175559998},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.6045448184013367},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4730488359928131},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4725577235221863},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.33810916543006897}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2019.2895892","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2019.2895892","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320310358","display_name":"Achievement Rewards for College Scientists Foundation","ror":"https://ror.org/054awkm93"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W1191599655","https://openalex.org/W1929981607","https://openalex.org/W1975463331","https://openalex.org/W2082252833","https://openalex.org/W2082764616","https://openalex.org/W2098432798","https://openalex.org/W2098774185","https://openalex.org/W2123491406","https://openalex.org/W2145339207","https://openalex.org/W2173248099","https://openalex.org/W2296673577","https://openalex.org/W2341171179","https://openalex.org/W2506342991","https://openalex.org/W2567374473","https://openalex.org/W2586680856","https://openalex.org/W2962893898","https://openalex.org/W2962951365","https://openalex.org/W2963604043","https://openalex.org/W2963864421","https://openalex.org/W2964077562","https://openalex.org/W2972264811","https://openalex.org/W2990301063","https://openalex.org/W3021208093","https://openalex.org/W4285719527","https://openalex.org/W4297573592","https://openalex.org/W6627932998","https://openalex.org/W6640443443","https://openalex.org/W6674884181","https://openalex.org/W6684921986","https://openalex.org/W6731227521","https://openalex.org/W6735030908","https://openalex.org/W6768430399","https://openalex.org/W6770671346"],"related_works":["https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W4380318855","https://openalex.org/W2138720691","https://openalex.org/W2031695474","https://openalex.org/W4293226380","https://openalex.org/W2586732548","https://openalex.org/W3049728571","https://openalex.org/W20361778","https://openalex.org/W2024136090"],"abstract_inverted_index":{"Planetary":[0],"rovers,":[1],"such":[2],"as":[3,21,23,54,89,154,156],"those":[4],"currently":[5,164],"on":[6,25,41,110],"Mars,":[7],"face":[8],"difficult":[9],"path":[10],"planning":[11,19,38,168],"problems,":[12],"both":[13,149],"before":[14],"landing":[15],"during":[16],"the":[17,26,63,83,90,106,117,137,142],"mission":[18,167],"stages":[20],"well":[22,155],"once":[24],"ground.":[27],"In":[28],"this":[29],"work,":[30],"we":[31],"present":[32],"a":[33,80,122,131,150,157],"new":[34],"approach":[35],"to":[36,73,82,88,99],"these":[37],"problems":[39],"based":[40],"inverse":[42],"reinforcement":[43],"learning":[44],"using":[45],"deep":[46],"convolutional":[47,70],"networks":[48,52,72],"and":[49,170],"value":[50,64,84,92],"iteration":[51,65,85,93],"(VIN)":[53],"important":[55],"internal":[56,112],"structures.":[57],"VIN":[58],"are":[59],"an":[60,111],"approximation":[61],"of":[62,144],"(VI)":[66],"algorithm":[67],"implemented":[68],"with":[69,121],"neural":[71],"make":[74],"VI":[75],"fully":[76],"differentiable.":[77],"We":[78,140],"propose":[79],"modification":[81],"recurrence,":[86],"referred":[87],"soft":[91,113],"network":[94],"(SVIN).":[95],"SVIN":[96],"is":[97,119],"designed":[98],"produce":[100],"more":[101],"effective":[102],"training":[103],"gradients":[104],"through":[105],"VIN.":[107],"It":[108],"relies":[109],"policy":[114,118,133],"model,":[115],"where":[116],"represented":[120],"probability":[123],"distribution":[124],"over":[125],"all":[126],"possible":[127],"actions,":[128],"rather":[129],"than":[130],"deterministic":[132],"that":[134],"returns":[135],"only":[136],"best":[138],"action.":[139],"demonstrate":[141],"effectiveness":[143],"our":[145],"proposed":[146],"architecture":[147],"in":[148],"grid":[151],"world":[152],"dataset":[153,161],"highly":[158],"realistic":[159],"synthetic":[160],"generated":[162],"from":[163],"deployed":[165],"rover":[166],"tools":[169],"real":[171],"Mars":[172],"imagery.":[173]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":13},{"year":2021,"cited_by_count":7},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
