{"id":"https://openalex.org/W4384916367","doi":"https://doi.org/10.1109/lra.2023.3296933","title":"Learning Adaptive Policies for Autonomous Excavation Under Various Soil Conditions by Adversarial Domain Sampling","display_name":"Learning Adaptive Policies for Autonomous Excavation Under Various Soil Conditions by Adversarial Domain Sampling","publication_year":2023,"publication_date":"2023-07-19","ids":{"openalex":"https://openalex.org/W4384916367","doi":"https://doi.org/10.1109/lra.2023.3296933"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2023.3296933","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2023.3296933","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028032706","display_name":"Takayuki Osa","orcid":"https://orcid.org/0000-0002-6895-9088"},"institutions":[{"id":"https://openalex.org/I4210126580","display_name":"RIKEN Center for Advanced Intelligence Project","ror":"https://ror.org/03ckxwf91","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210126580"]},{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Takayuki Osa","raw_affiliation_strings":["University of Tokyo, Tokyo, Japan","RIKEN Center for Advanced Intelligence Project, Tokyo, Japan"],"raw_orcid":"https://orcid.org/0000-0002-6895-9088","affiliations":[{"raw_affiliation_string":"University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]},{"raw_affiliation_string":"RIKEN Center for Advanced Intelligence Project, Tokyo, Japan","institution_ids":["https://openalex.org/I4210126580"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092505831","display_name":"Naoto Osajima","orcid":null},"institutions":[{"id":"https://openalex.org/I207014233","display_name":"Kyushu Institute of Technology","ror":"https://ror.org/02278tr80","country_code":"JP","type":"education","lineage":["https://openalex.org/I207014233"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Naoto Osajima","raw_affiliation_strings":["Kyushu Institute of Technology, Fukuoka, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Kyushu Institute of Technology, Fukuoka, Japan","institution_ids":["https://openalex.org/I207014233"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025652230","display_name":"Masanori Aizawa","orcid":null},"institutions":[{"id":"https://openalex.org/I882656400","display_name":"Komatsu (Japan)","ror":"https://ror.org/03s23ay81","country_code":"JP","type":"company","lineage":["https://openalex.org/I882656400"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Masanori Aizawa","raw_affiliation_strings":["Komatsu Ltd., Kanagawa, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Komatsu Ltd., Kanagawa, Japan","institution_ids":["https://openalex.org/I882656400"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042711470","display_name":"Tatsuya Harada","orcid":"https://orcid.org/0000-0002-3712-3691"},"institutions":[{"id":"https://openalex.org/I4210126580","display_name":"RIKEN Center for Advanced Intelligence Project","ror":"https://ror.org/03ckxwf91","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210126580"]},{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tatsuya Harada","raw_affiliation_strings":["University of Tokyo, Tokyo, Japan","RIKEN Center for Advanced Intelligence Project, Tokyo, Japan"],"raw_orcid":"https://orcid.org/0000-0002-3712-3691","affiliations":[{"raw_affiliation_string":"University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]},{"raw_affiliation_string":"RIKEN Center for Advanced Intelligence Project, Tokyo, Japan","institution_ids":["https://openalex.org/I4210126580"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5028032706"],"corresponding_institution_ids":["https://openalex.org/I4210126580","https://openalex.org/I74801974"],"apc_list":null,"apc_paid":null,"fwci":1.022,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.75998033,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"8","issue":"9","first_page":"5536","last_page":"5543"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10409","display_name":"Fuel Cells and Related Materials","score":0.9764000177383423,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10409","display_name":"Fuel Cells and Related Materials","score":0.9764000177383423,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9739999771118164,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9574000239372253,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.735180139541626},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6382728815078735},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6117784380912781},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6044303774833679},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5899553894996643},{"id":"https://openalex.org/keywords/excavation","display_name":"Excavation","score":0.548193097114563},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5402511954307556},{"id":"https://openalex.org/keywords/estimator","display_name":"Estimator","score":0.5165923833847046},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4888245463371277},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.44735774397850037},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.43905341625213623},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.43612760305404663},{"id":"https://openalex.org/keywords/sensitivity","display_name":"Sensitivity (control systems)","score":0.4260708689689636},{"id":"https://openalex.org/keywords/oracle","display_name":"Oracle","score":0.4214095175266266},{"id":"https://openalex.org/keywords/hazard","display_name":"Hazard","score":0.4171091616153717},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.1756397783756256},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.16824296116828918},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.15796113014221191},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1487044095993042},{"id":"https://openalex.org/keywords/software-engineering","display_name":"Software engineering","score":0.08188357949256897}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.735180139541626},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6382728815078735},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6117784380912781},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6044303774833679},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5899553894996643},{"id":"https://openalex.org/C31858485","wikidata":"https://www.wikidata.org/wiki/Q959782","display_name":"Excavation","level":2,"score":0.548193097114563},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5402511954307556},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.5165923833847046},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4888245463371277},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.44735774397850037},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.43905341625213623},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.43612760305404663},{"id":"https://openalex.org/C21200559","wikidata":"https://www.wikidata.org/wiki/Q7451068","display_name":"Sensitivity (control systems)","level":2,"score":0.4260708689689636},{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.4214095175266266},{"id":"https://openalex.org/C49261128","wikidata":"https://www.wikidata.org/wiki/Q1132455","display_name":"Hazard","level":2,"score":0.4171091616153717},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.1756397783756256},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.16824296116828918},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.15796113014221191},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1487044095993042},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.08188357949256897},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C187320778","wikidata":"https://www.wikidata.org/wiki/Q1349130","display_name":"Geotechnical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2023.3296933","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2023.3296933","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.5400000214576721,"id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320317546","display_name":"Komatsu","ror":"https://ror.org/03s23ay81"},{"id":"https://openalex.org/F4320322832","display_name":"University of Tokyo","ror":"https://ror.org/057zh3y96"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W41554520","https://openalex.org/W83284419","https://openalex.org/W1846039755","https://openalex.org/W2132083787","https://openalex.org/W2145339207","https://openalex.org/W2597234992","https://openalex.org/W2603088459","https://openalex.org/W2604763608","https://openalex.org/W2605102758","https://openalex.org/W2736601468","https://openalex.org/W2781726626","https://openalex.org/W2787938642","https://openalex.org/W2897462754","https://openalex.org/W2952526277","https://openalex.org/W2978134924","https://openalex.org/W3015872276","https://openalex.org/W3039130562","https://openalex.org/W3127007986","https://openalex.org/W3127831513","https://openalex.org/W3175254947","https://openalex.org/W3185855727","https://openalex.org/W3208816282","https://openalex.org/W3210150378","https://openalex.org/W4205847188","https://openalex.org/W4285059108","https://openalex.org/W4309137642","https://openalex.org/W6638954810","https://openalex.org/W6735789912","https://openalex.org/W6736057607","https://openalex.org/W6741002519","https://openalex.org/W6747473740","https://openalex.org/W6748839928","https://openalex.org/W6760698134","https://openalex.org/W6780628154","https://openalex.org/W6785756301","https://openalex.org/W6802809499","https://openalex.org/W6803699115","https://openalex.org/W6846664724"],"related_works":["https://openalex.org/W2502115930","https://openalex.org/W4246396837","https://openalex.org/W2482350142","https://openalex.org/W3176240006","https://openalex.org/W3126451824","https://openalex.org/W1561927205","https://openalex.org/W3191453585","https://openalex.org/W4297672492","https://openalex.org/W4288019534","https://openalex.org/W2914522629"],"abstract_inverted_index":{"Excavation":[0],"is":[1,11,110],"a":[2,125,129,166,196,200],"frequent":[3],"task":[4,89,114,120],"in":[5,39,139,154],"construction.":[6],"In":[7,70,98,170,192],"this":[8,21,81,99],"context,":[9],"automation":[10],"expected":[12,183],"to":[13,31,42,49,118,135,181,211],"reduce":[14],"hazard":[15],"risks":[16],"and":[17,161,238],"labor-intensive":[18],"work.":[19],"To":[20],"end,":[22],"recent":[23],"studies":[24],"have":[25],"investigated":[26],"using":[27],"reinforcement":[28],"learning":[29,128],"(RL)":[30],"automate":[32],"construction":[33],"machines.":[34],"One":[35],"of":[36,55,87,150,208,221],"the":[37,53,58,64,74,85,88,107,113,119,148,171,177,189,206,209,212,219,222],"challenges":[38],"applying":[40],"RL":[41,152,223],"excavation":[43,140,227,243],"tasks":[44],"concerns":[45],"obtaining":[46],"skills":[47],"adaptable":[48],"various":[50,136],"conditions.":[51],"When":[52],"conditions":[54],"soils":[56],"differ,":[57],"optimal":[59],"plans":[60],"for":[61,94,127,146,198,225,242],"efficiently":[62],"excavating":[63],"target":[65],"area":[66],"will":[67],"significantly":[68,93],"differ.":[69],"existing":[71,236],"meta-learning":[72,237],"methods,":[73],"domain":[75,96,108,137,159,162,174,178,201,213,239],"parameters":[76,109,138,179],"are":[77,185],"often":[78],"uniformly":[79,105],"sampled;":[80],"implicitly":[82],"assumes":[83],"that":[84,104,131,232],"difficulty":[86,115],"does":[90],"not":[91],"change":[92],"different":[95],"parameters.":[97,121],"study,":[100],"we":[101,123,194],"empirically":[102,230],"show":[103,231],"sampling":[106,160,175],"insufficient":[111],"when":[112],"varies":[116],"according":[117],"Correspondingly,":[122],"develop":[124],"framework":[126],"policy":[130],"can":[132],"be":[133],"generalized":[134],"tasks.":[141,244],"We":[142,229],"propose":[143,195],"two":[144],"techniques":[145,217],"improving":[147],"performance":[149,220],"an":[151],"method":[153,224],"our":[155,226,233],"problem":[156],"setting:":[157],"adversarial":[158,173],"parameter":[163,202],"estimation":[164],"with":[165],"sensitivity-aware":[167],"importance":[168],"weight.":[169],"proposed":[172,216],"technique,":[176],"leading":[180],"low":[182],"Q-values":[184],"actively":[186],"sampled":[187],"during":[188],"training":[190,199],"phase.":[191],"addition,":[193],"technique":[197],"estimator":[203],"based":[204],"on":[205],"sensitivity":[207],"Q-function":[210],"parameter.":[214],"The":[215],"improve":[218],"task.":[228],"approach":[234],"outperforms":[235],"adaptation":[240],"methods":[241]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
