{"id":"https://openalex.org/W4385299175","doi":"https://doi.org/10.1109/tai.2023.3299252","title":"Facilitating Sim-to-Real by Intrinsic Stochasticity of Real-Time Simulation in Reinforcement Learning for Robot Manipulation","display_name":"Facilitating Sim-to-Real by Intrinsic Stochasticity of Real-Time Simulation in Reinforcement Learning for Robot Manipulation","publication_year":2023,"publication_date":"2023-07-27","ids":{"openalex":"https://openalex.org/W4385299175","doi":"https://doi.org/10.1109/tai.2023.3299252"},"language":"en","primary_location":{"id":"doi:10.1109/tai.2023.3299252","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2023.3299252","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038499955","display_name":"Amir M. Soufi Enayati","orcid":"https://orcid.org/0000-0002-6736-8016"},"institutions":[{"id":"https://openalex.org/I212119943","display_name":"University of Victoria","ror":"https://ror.org/04s5mat29","country_code":"CA","type":"education","lineage":["https://openalex.org/I212119943"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Amir M. Soufi Enayati","raw_affiliation_strings":["Faculty of Engineering and Computer Science, University of Victoria, Victoria, BC, Canada"],"raw_orcid":"https://orcid.org/0000-0002-6736-8016","affiliations":[{"raw_affiliation_string":"Faculty of Engineering and Computer Science, University of Victoria, Victoria, BC, Canada","institution_ids":["https://openalex.org/I212119943"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056595246","display_name":"Ram Dershan","orcid":"https://orcid.org/0009-0006-7771-9613"},"institutions":[{"id":"https://openalex.org/I141945490","display_name":"University of British Columbia","ror":"https://ror.org/03rmrcq20","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490"]},{"id":"https://openalex.org/I4405260628","display_name":"University of British Columbia, Okanagan Campus","ror":"https://ror.org/04241wz75","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490","https://openalex.org/I4405260628"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Ram Dershan","raw_affiliation_strings":["School of Engineering, University of British Columbia, Kelowna, BC, Canada"],"raw_orcid":"https://orcid.org/0009-0006-7771-9613","affiliations":[{"raw_affiliation_string":"School of Engineering, University of British Columbia, Kelowna, BC, Canada","institution_ids":["https://openalex.org/I141945490","https://openalex.org/I4405260628"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101743605","display_name":"Zengjie Zhang","orcid":"https://orcid.org/0000-0003-1875-1032"},"institutions":[{"id":"https://openalex.org/I141945490","display_name":"University of British Columbia","ror":"https://ror.org/03rmrcq20","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490"]},{"id":"https://openalex.org/I4405260628","display_name":"University of British Columbia, Okanagan Campus","ror":"https://ror.org/04241wz75","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490","https://openalex.org/I4405260628"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Zengjie Zhang","raw_affiliation_strings":["School of Engineering, University of British Columbia, Kelowna, BC, Canada"],"raw_orcid":"https://orcid.org/0000-0003-1875-1032","affiliations":[{"raw_affiliation_string":"School of Engineering, University of British Columbia, Kelowna, BC, Canada","institution_ids":["https://openalex.org/I141945490","https://openalex.org/I4405260628"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065214497","display_name":"Dean Richert","orcid":"https://orcid.org/0000-0002-5125-2684"},"institutions":[{"id":"https://openalex.org/I141945490","display_name":"University of British Columbia","ror":"https://ror.org/03rmrcq20","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490"]},{"id":"https://openalex.org/I4405260628","display_name":"University of British Columbia, Okanagan Campus","ror":"https://ror.org/04241wz75","country_code":"CA","type":"education","lineage":["https://openalex.org/I141945490","https://openalex.org/I4405260628"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Dean Richert","raw_affiliation_strings":["School of Engineering, University of British Columbia, Kelowna, BC, Canada"],"raw_orcid":"https://orcid.org/0000-0002-5125-2684","affiliations":[{"raw_affiliation_string":"School of Engineering, University of British Columbia, Kelowna, BC, Canada","institution_ids":["https://openalex.org/I141945490","https://openalex.org/I4405260628"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058540009","display_name":"Homayoun Najjaran","orcid":"https://orcid.org/0000-0002-3550-225X"},"institutions":[{"id":"https://openalex.org/I212119943","display_name":"University of Victoria","ror":"https://ror.org/04s5mat29","country_code":"CA","type":"education","lineage":["https://openalex.org/I212119943"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Homayoun Najjaran","raw_affiliation_strings":["Faculty of Engineering and Computer Science, University of Victoria, Victoria, BC, Canada"],"raw_orcid":"https://orcid.org/0000-0002-3550-225X","affiliations":[{"raw_affiliation_string":"Faculty of Engineering and Computer Science, University of Victoria, Victoria, BC, Canada","institution_ids":["https://openalex.org/I212119943"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.979,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.80352669,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"5","issue":"4","first_page":"1791","last_page":"1804"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11195","display_name":"Simulation Techniques and Applications","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9887999892234802,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7959862947463989},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7497086524963379},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6336888074874878},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5085991621017456},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.5034875273704529},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.48920416831970215},{"id":"https://openalex.org/keywords/generalizability-theory","display_name":"Generalizability theory","score":0.43610718846321106},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.41142144799232483},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.32650312781333923},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08162015676498413}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7959862947463989},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7497086524963379},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6336888074874878},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5085991621017456},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.5034875273704529},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.48920416831970215},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.43610718846321106},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.41142144799232483},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.32650312781333923},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08162015676498413},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tai.2023.3299252","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2023.3299252","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3708286853","display_name":null,"funder_award_id":"CRDPJ 543881-19","funder_id":"https://openalex.org/F4320334593","funder_display_name":"Natural Sciences and Engineering Research Council of Canada"}],"funders":[{"id":"https://openalex.org/F4320334593","display_name":"Natural Sciences and Engineering Research Council of Canada","ror":"https://ror.org/01h531d29"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":64,"referenced_works":["https://openalex.org/W1570792896","https://openalex.org/W1977655452","https://openalex.org/W1982546786","https://openalex.org/W1987486506","https://openalex.org/W2105078254","https://openalex.org/W2137052305","https://openalex.org/W2158208985","https://openalex.org/W2165698076","https://openalex.org/W2287910890","https://openalex.org/W2580909119","https://openalex.org/W2605102758","https://openalex.org/W2623491082","https://openalex.org/W2736506089","https://openalex.org/W2736601468","https://openalex.org/W2767050701","https://openalex.org/W2767346351","https://openalex.org/W2884484164","https://openalex.org/W2949600457","https://openalex.org/W2962899390","https://openalex.org/W2967889132","https://openalex.org/W2973229164","https://openalex.org/W2998116579","https://openalex.org/W3002768791","https://openalex.org/W3025899234","https://openalex.org/W3044051321","https://openalex.org/W3082233933","https://openalex.org/W3101442004","https://openalex.org/W3112186687","https://openalex.org/W3121342653","https://openalex.org/W3126316434","https://openalex.org/W3129352929","https://openalex.org/W3134716948","https://openalex.org/W3136347463","https://openalex.org/W3166974263","https://openalex.org/W3206393052","https://openalex.org/W3211145209","https://openalex.org/W3215644105","https://openalex.org/W4200480164","https://openalex.org/W4210939259","https://openalex.org/W4221110788","https://openalex.org/W4225773298","https://openalex.org/W4226280465","https://openalex.org/W4226479436","https://openalex.org/W4242050203","https://openalex.org/W4249314718","https://openalex.org/W4285048301","https://openalex.org/W4296683478","https://openalex.org/W4312759282","https://openalex.org/W4312908419","https://openalex.org/W4317038451","https://openalex.org/W6683633756","https://openalex.org/W6735677848","https://openalex.org/W6736469832","https://openalex.org/W6739193204","https://openalex.org/W6741002519","https://openalex.org/W6755890616","https://openalex.org/W6767084887","https://openalex.org/W6767141496","https://openalex.org/W6769596995","https://openalex.org/W6788773875","https://openalex.org/W6804712669","https://openalex.org/W6811124000","https://openalex.org/W6811341675","https://openalex.org/W6841991137"],"related_works":["https://openalex.org/W2118717649","https://openalex.org/W2413243053","https://openalex.org/W410723623","https://openalex.org/W2015341305","https://openalex.org/W2035068594","https://openalex.org/W4225593417","https://openalex.org/W2573498121","https://openalex.org/W3022298670","https://openalex.org/W3160494304","https://openalex.org/W3006162251"],"abstract_inverted_index":{"Simulation":[0],"is":[1,52,187],"essential":[2],"to":[3,25,48,54,78,88,95,112,162],"reinforcement":[4],"learning":[5],"(RL)":[6],"before":[7],"implementation":[8],"in":[9,99,142,209],"the":[10,26,29,32,37,55,62,114,119,129,139,143,156,195,206],"real":[11,33],"world,":[12,34],"especially":[13],"for":[14,166],"safety-critical":[15],"applications":[16,211],"like":[17,212],"robot":[18,167,213],"manipulation.":[19],"Conventionally,":[20],"RL":[21,80,147,172],"agents":[22,176],"are":[23],"sensitive":[24],"discrepancies":[27],"between":[28],"simulation":[30,69,73,150],"and":[31,75,90,93,105,124,151,158,190],"known":[35],"as":[36],"sim-to-real":[38,207],"gap.":[39],"The":[40,149,170],"application":[41],"of":[42,57,64,67,71,101,103,116,121,132,145,160],"domain":[43,97],"randomization,":[44,186],"a":[45,85,133,202],"technique":[46],"used":[47],"fill":[49],"this":[50],"gap,":[51],"limited":[53],"imposition":[56],"heuristic-randomized":[58],"models.":[59],"We":[60],"investigate":[61],"properties":[63],"intrinsic":[65],"stochasticity":[66,131],"real-time":[68],"(RT-IS)":[70],"off-the-shelf":[72],"software":[74],"its":[76,126],"potential":[77],"improve":[79],"performance.":[81],"This":[82],"improvement":[83],"includes":[84],"higher":[86],"tolerance":[87],"noise":[89],"model":[91],"imprecision":[92],"superiority":[94],"conventional":[96,175,196],"randomization":[98],"terms":[100],"ease":[102],"use":[104],"automation.":[106],"Firstly,":[107],"we":[108,137],"conduct":[109],"analytical":[110],"studies":[111],"measure":[113],"correlation":[115],"RT-IS":[117,140,161,182],"with":[118,128,179],"utilization":[120],"computer":[122],"hardware":[123],"validate":[125],"comparability":[127],"natural":[130],"physical":[134,152],"robot.":[135],"Then,":[136],"exploit":[138],"feature":[141],"training":[144,165],"an":[146],"agent.":[148],"experiment":[153],"results":[154],"verify":[155],"feasibility":[157],"applicability":[159],"robust":[163],"agent":[164,173],"manipulation":[168,214],"tasks.":[169,215],"RT-IS-powered":[171],"outperforms":[174],"on":[177,205],"robots":[178],"modeling":[180],"uncertainties.":[181],"requires":[183],"less":[184],"heuristic":[185],"not":[188],"task-dependent,":[189],"achieves":[191],"better":[192],"generalizability":[193],"than":[194],"domain-randomization-powered":[197],"agents.":[198],"Our":[199],"findings":[200],"provide":[201],"new":[203],"perspective":[204],"problem":[208],"practical":[210]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
