{"id":"https://openalex.org/W4405262843","doi":"https://doi.org/10.1109/tase.2025.3590068","title":"Progressive-Resolution Policy Distillation: Leveraging Coarse-Resolution Simulations for Time-Efficient Fine-Resolution Policy Learning","display_name":"Progressive-Resolution Policy Distillation: Leveraging Coarse-Resolution Simulations for Time-Efficient Fine-Resolution Policy Learning","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4405262843","doi":"https://doi.org/10.1109/tase.2025.3590068"},"language":"en","primary_location":{"id":"doi:10.1109/tase.2025.3590068","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2025.3590068","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2412.07477","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001325713","display_name":"Yuki Kadokawa","orcid":"https://orcid.org/0000-0003-3358-9520"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Yuki Kadokawa","raw_affiliation_strings":["Nara Institute of Science and Technology, Nara, Japan"],"affiliations":[{"raw_affiliation_string":"Nara Institute of Science and Technology, Nara, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075825270","display_name":"Hirotaka Tahara","orcid":"https://orcid.org/0000-0001-5883-9181"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hirotaka Tahara","raw_affiliation_strings":["Nara Institute of Science and Technology, Nara, Japan"],"affiliations":[{"raw_affiliation_string":"Nara Institute of Science and Technology, Nara, Japan","institution_ids":["https://openalex.org/I75917431"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042074952","display_name":"Takamitsu Matsubara","orcid":"https://orcid.org/0000-0003-3545-4814"},"institutions":[{"id":"https://openalex.org/I75917431","display_name":"Nara Institute of Science and Technology","ror":"https://ror.org/05bhada84","country_code":"JP","type":"education","lineage":["https://openalex.org/I75917431"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takamitsu Matsubara","raw_affiliation_strings":["Nara Institute of Science and Technology, Nara, Japan"],"affiliations":[{"raw_affiliation_string":"Nara Institute of Science and Technology, Nara, Japan","institution_ids":["https://openalex.org/I75917431"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5001325713"],"corresponding_institution_ids":["https://openalex.org/I75917431"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.00138644,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"22","issue":null,"first_page":"18682","last_page":"18693"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11195","display_name":"Simulation Techniques and Applications","score":0.9646999835968018,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11195","display_name":"Simulation Techniques and Applications","score":0.9646999835968018,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9534000158309937,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9279999732971191,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/resolution","display_name":"Resolution (logic)","score":0.8271170854568481},{"id":"https://openalex.org/keywords/policy-learning","display_name":"Policy learning","score":0.6454232931137085},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5481621623039246},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.5263094902038574},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.31846529245376587},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2663874626159668},{"id":"https://openalex.org/keywords/chromatography","display_name":"Chromatography","score":0.1283818781375885},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.11207780241966248}],"concepts":[{"id":"https://openalex.org/C138268822","wikidata":"https://www.wikidata.org/wiki/Q1051925","display_name":"Resolution (logic)","level":2,"score":0.8271170854568481},{"id":"https://openalex.org/C2779436431","wikidata":"https://www.wikidata.org/wiki/Q30672407","display_name":"Policy learning","level":2,"score":0.6454232931137085},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5481621623039246},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.5263094902038574},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31846529245376587},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2663874626159668},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.1283818781375885},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.11207780241966248}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tase.2025.3590068","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2025.3590068","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2412.07477","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2412.07477","pdf_url":"https://arxiv.org/pdf/2412.07477","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2412.07477","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2412.07477","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2412.07477","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2412.07477","pdf_url":"https://arxiv.org/pdf/2412.07477","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5543296614","display_name":null,"funder_award_id":"JPMJMS20","funder_id":"https://openalex.org/F4320338247","funder_display_name":"Moonshot Research and Development Program"},{"id":"https://openalex.org/G5830100352","display_name":null,"funder_award_id":"JPMJMS2032","funder_id":"https://openalex.org/F4320338247","funder_display_name":"Moonshot Research and Development Program"}],"funders":[{"id":"https://openalex.org/F4320338247","display_name":"Moonshot Research and Development Program","ror":null}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4405262843.pdf"},"referenced_works_count":62,"referenced_works":["https://openalex.org/W1479682106","https://openalex.org/W1977655452","https://openalex.org/W2036562286","https://openalex.org/W2403171414","https://openalex.org/W2442814322","https://openalex.org/W2575705757","https://openalex.org/W2604382266","https://openalex.org/W2619566615","https://openalex.org/W2767050701","https://openalex.org/W2773691349","https://openalex.org/W2952691404","https://openalex.org/W2972758308","https://openalex.org/W2998538471","https://openalex.org/W3005783773","https://openalex.org/W3015082424","https://openalex.org/W3034225898","https://openalex.org/W3106048578","https://openalex.org/W3132694240","https://openalex.org/W3175313230","https://openalex.org/W3175558129","https://openalex.org/W3178119935","https://openalex.org/W3185643802","https://openalex.org/W3200757893","https://openalex.org/W3202905658","https://openalex.org/W3204518412","https://openalex.org/W4211108606","https://openalex.org/W4220731692","https://openalex.org/W4223927937","https://openalex.org/W4252279978","https://openalex.org/W4280630155","https://openalex.org/W4283446143","https://openalex.org/W4285278949","https://openalex.org/W4319996426","https://openalex.org/W4362650357","https://openalex.org/W4364374595","https://openalex.org/W4365801600","https://openalex.org/W4385430476","https://openalex.org/W4388191662","https://openalex.org/W4389665473","https://openalex.org/W4390224266","https://openalex.org/W4390968535","https://openalex.org/W4398793977","https://openalex.org/W4399043691","https://openalex.org/W4399213366","https://openalex.org/W4402448573","https://openalex.org/W6627932998","https://openalex.org/W6721408278","https://openalex.org/W6735677848","https://openalex.org/W6737937804","https://openalex.org/W6741002519","https://openalex.org/W6747473740","https://openalex.org/W6759225949","https://openalex.org/W6760405395","https://openalex.org/W6760560886","https://openalex.org/W6775683342","https://openalex.org/W6776730770","https://openalex.org/W6776901495","https://openalex.org/W6789305357","https://openalex.org/W6798755213","https://openalex.org/W6800004206","https://openalex.org/W6802659552","https://openalex.org/W6804563612"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"In":[0,35,253],"earthwork":[1],"and":[2,62,142,199,241,307,331,371,406],"construction,":[3],"excavators":[4,370],"often":[5],"encounter":[6],"large":[7],"rocks":[8],"mixed":[9],"with":[10,121],"various":[11],"soil":[12,49,189,195,211],"conditions,":[13],"requiring":[14],"skilled":[15],"operators.":[16],"This":[17,224,312],"paper":[18,176,225,300,381],"presents":[19],"a":[20,31,103,138,170,227,243,256,263,277,302],"framework":[21,107,244,341],"for":[22,93,245,280,376],"achieving":[23,283],"autonomous":[24,318,334,384],"excavation":[25,33,140,186,239,319,362],"using":[26,87,188],"reinforcement":[27],"learning":[28,106,168,234,350],"(RL)":[29],"through":[30,117,166],"rock":[32,139,145],"simulator.":[34],"the":[36,43,47,80,180,233,315,329,386],"simulation,":[37,265],"resolution":[38,204,310,398],"can":[39,389],"be":[40,391],"defined":[41],"by":[42,179,230],"particle":[44],"size/number":[45],"in":[46,90,95,137,169,185,238,249,262,287],"whole":[48],"space.":[50],"Fine-resolution":[51],"simulations":[52,68,92,120],"closely":[53],"mimic":[54],"real-world":[55,76,144,325,353,377],"behavior":[56,192],"but":[57,73],"demand":[58],"significant":[59],"calculation":[60,247],"time":[61,152,184,248,345],"challenging":[63],"sample":[64,71],"collection,":[65,327],"while":[66,157,219],"coarse-resolution":[67,91],"enable":[69,292],"faster":[70],"collection":[72],"deviate":[74],"from":[75],"behavior.":[77],"To":[78,98],"combine":[79],"advantages":[81],"of":[82,182,193,235,317,333],"both":[83],"resolutions,":[84,298],"we":[85,101],"explore":[86,367],"policies":[88,116,237],"developed":[89],"pre-training":[94],"fine-resolution":[96,171],"simulations.":[97],"this":[99,254,299,340,380],"end,":[100],"propose":[102],"novel":[104],"policy":[105,123,133,167,258,272,294,304,349],"called":[108],"Progressive-Resolution":[109],"Policy":[110],"Distillation":[111],"(PRPD),":[112],"which":[113],"progressively":[114],"transfers":[115],"some":[118],"middle-resolution":[119],"conservative":[122],"transfer":[124,134,295],"to":[125,132,153,163,174,276,291,347,360,369,393],"avoid":[126],"domain":[127],"gaps":[128],"that":[129,148,339],"could":[130],"lead":[131],"failure.":[135],"Validation":[136],"simulator":[141],"nine":[143],"environments":[146,394],"demonstrated":[147],"PRPD":[149],"reduced":[150,221],"sampling":[151],"less":[154],"than":[155],"1/7":[156],"maintaining":[158,220],"task":[159],"success":[160],"rates":[161],"comparable":[162],"those":[164],"achieved":[165],"simulation.":[172],"Note":[173],"Practitioners\u2014This":[175],"is":[177,196,259,273],"motivated":[178],"issue":[181],"computation":[183,222,268,401],"simulation":[187,217,279,288,397],"particles.":[190],"The":[191,270],"real":[194],"highly":[197],"complex,":[198],"approximating":[200],"it":[201],"at":[202],"high":[203],"requires":[205],"enormous":[206],"computational":[207],"costs.":[208],"Therefore,":[209],"existing":[210],"simulators":[212,240],"have":[213],"focused":[214],"on":[215,232,323,383],"improving":[216,328],"accuracy":[218],"time.":[223,269,289],"takes":[226],"different":[228,297],"approach":[229,313,388],"focusing":[231],"control":[236,257],"proposes":[242],"reducing":[246,267],"such":[250,403],"use":[251],"cases.":[252],"framework,":[255],"first":[260],"learned":[261,271],"low-resolution":[264],"significantly":[266,342],"then":[274],"transferred":[275],"high-resolution":[278],"retraining,":[281],"thereby":[282],"an":[284],"overall":[285],"reduction":[286],"Furthermore,":[290],"robust":[293],"across":[296],"discusses":[301],"stable":[303],"distillation":[305],"scheme":[306],"insights":[308],"into":[309],"design.":[311],"enables":[314],"development":[316],"systems":[320],"without":[321],"relying":[322],"expensive":[324],"data":[326],"scalability":[330],"adaptability":[332],"excavation.":[335],"Simulation":[336],"experiments":[337],"suggest":[338],"reduces":[343],"training":[344],"compared":[346],"conventional":[348],"approaches.":[351],"However,":[352],"validation":[354],"has":[355],"so":[356],"far":[357],"been":[358],"limited":[359],"simple":[361],"robots.":[363],"Future":[364],"research":[365],"will":[366],"applications":[368],"other":[372],"machinery":[373],"more":[374],"suitable":[375],"operations.":[378],"Although":[379],"focuses":[382],"excavation,":[385],"proposed":[387],"also":[390],"extended":[392],"where":[395],"increased":[396],"critically":[399],"impacts":[400],"time,":[402],"as":[404],"liquid":[405],"soft":[407],"object":[408],"manipulation.":[409]},"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2024-12-12T00:00:00"}
