{"id":"https://openalex.org/W4315640913","doi":"https://doi.org/10.3389/frobt.2022.1067502","title":"Sim-to-real via latent prediction: Transferring visual non-prehensile manipulation policies","display_name":"Sim-to-real via latent prediction: Transferring visual non-prehensile manipulation policies","publication_year":2023,"publication_date":"2023-01-12","ids":{"openalex":"https://openalex.org/W4315640913","doi":"https://doi.org/10.3389/frobt.2022.1067502","pmid":"https://pubmed.ncbi.nlm.nih.gov/36714802"},"language":"en","primary_location":{"id":"doi:10.3389/frobt.2022.1067502","is_oa":true,"landing_page_url":"https://doi.org/10.3389/frobt.2022.1067502","pdf_url":"https://www.frontiersin.org/articles/10.3389/frobt.2022.1067502/pdf","source":{"id":"https://openalex.org/S2595095599","display_name":"Frontiers in Robotics and AI","issn_l":"2296-9144","issn":["2296-9144"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320527","host_organization_name":"Frontiers Media","host_organization_lineage":["https://openalex.org/P4310320527"],"host_organization_lineage_names":["Frontiers Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Robotics and AI","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.frontiersin.org/articles/10.3389/frobt.2022.1067502/pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014912300","display_name":"Carlo Rizzardo","orcid":null},"institutions":[{"id":"https://openalex.org/I30771326","display_name":"Italian Institute of Technology","ror":"https://ror.org/042t93s57","country_code":"IT","type":"facility","lineage":["https://openalex.org/I30771326"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Carlo Rizzardo","raw_affiliation_strings":["Active Perception and Robot Interactive Learning Laboratory, Advanced Robotics, Istituto Italiano di Tecnologia, Genova, Italy"],"affiliations":[{"raw_affiliation_string":"Active Perception and Robot Interactive Learning Laboratory, Advanced Robotics, Istituto Italiano di Tecnologia, Genova, Italy","institution_ids":["https://openalex.org/I30771326"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100405442","display_name":"Fei Chen","orcid":"https://orcid.org/0000-0003-4397-0931"},"institutions":[{"id":"https://openalex.org/I30771326","display_name":"Italian Institute of Technology","ror":"https://ror.org/042t93s57","country_code":"IT","type":"facility","lineage":["https://openalex.org/I30771326"]},{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN","IT"],"is_corresponding":false,"raw_author_name":"Fei Chen","raw_affiliation_strings":["Active Perception and Robot Interactive Learning Laboratory, Advanced Robotics, Istituto Italiano di Tecnologia, Genova, Italy","Department of Mechanical and Automation Engineering, T-Stone Robotics Institute, The Chinese University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Active Perception and Robot Interactive Learning Laboratory, Advanced Robotics, Istituto Italiano di Tecnologia, Genova, Italy","institution_ids":["https://openalex.org/I30771326"]},{"raw_affiliation_string":"Department of Mechanical and Automation Engineering, T-Stone Robotics Institute, The Chinese University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044243940","display_name":"Darwin G. Caldwell","orcid":"https://orcid.org/0000-0002-6233-9961"},"institutions":[{"id":"https://openalex.org/I30771326","display_name":"Italian Institute of Technology","ror":"https://ror.org/042t93s57","country_code":"IT","type":"facility","lineage":["https://openalex.org/I30771326"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Darwin Caldwell","raw_affiliation_strings":["Active Perception and Robot Interactive Learning Laboratory, Advanced Robotics, Istituto Italiano di Tecnologia, Genova, Italy"],"affiliations":[{"raw_affiliation_string":"Active Perception and Robot Interactive Learning Laboratory, Advanced Robotics, Istituto Italiano di Tecnologia, Genova, Italy","institution_ids":["https://openalex.org/I30771326"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5014912300"],"corresponding_institution_ids":["https://openalex.org/I30771326"],"apc_list":{"value":1900,"currency":"USD","value_usd":1900},"apc_paid":{"value":1900,"currency":"USD","value_usd":1900},"fwci":0.8741,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.77309442,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"9","issue":null,"first_page":"1067502","last_page":"1067502"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9776999950408936,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9761999845504761,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8018770217895508},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6588484644889832},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5879091024398804},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5721009373664856},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.49882984161376953},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.4774896800518036},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.32305237650871277},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.3201405107975006}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8018770217895508},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6588484644889832},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5879091024398804},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5721009373664856},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.49882984161376953},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.4774896800518036},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32305237650871277},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.3201405107975006},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.3389/frobt.2022.1067502","is_oa":true,"landing_page_url":"https://doi.org/10.3389/frobt.2022.1067502","pdf_url":"https://www.frontiersin.org/articles/10.3389/frobt.2022.1067502/pdf","source":{"id":"https://openalex.org/S2595095599","display_name":"Frontiers in Robotics and AI","issn_l":"2296-9144","issn":["2296-9144"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320527","host_organization_name":"Frontiers Media","host_organization_lineage":["https://openalex.org/P4310320527"],"host_organization_lineage_names":["Frontiers Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Robotics and AI","raw_type":"journal-article"},{"id":"pmid:36714802","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/36714802","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in robotics and AI","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:9879568","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/9879568","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Front Robot AI","raw_type":"Text"},{"id":"pmh:oai:doaj.org/article:9f50428d665d46929f6a26d52ab8ee23","is_oa":true,"landing_page_url":"https://doaj.org/article/9f50428d665d46929f6a26d52ab8ee23","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Frontiers in Robotics and AI, Vol 9 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3389/frobt.2022.1067502","is_oa":true,"landing_page_url":"https://doi.org/10.3389/frobt.2022.1067502","pdf_url":"https://www.frontiersin.org/articles/10.3389/frobt.2022.1067502/pdf","source":{"id":"https://openalex.org/S2595095599","display_name":"Frontiers in Robotics and AI","issn_l":"2296-9144","issn":["2296-9144"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320527","host_organization_name":"Frontiers Media","host_organization_lineage":["https://openalex.org/P4310320527"],"host_organization_lineage_names":["Frontiers Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Robotics and AI","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4315640913.pdf"},"referenced_works_count":78,"referenced_works":["https://openalex.org/W398859631","https://openalex.org/W1522301498","https://openalex.org/W1565327149","https://openalex.org/W1658008008","https://openalex.org/W1882958252","https://openalex.org/W1909320841","https://openalex.org/W1959608418","https://openalex.org/W2145339207","https://openalex.org/W2159291411","https://openalex.org/W2167340365","https://openalex.org/W2174364281","https://openalex.org/W2584009249","https://openalex.org/W2593768305","https://openalex.org/W2605102758","https://openalex.org/W2736601468","https://openalex.org/W2781726626","https://openalex.org/W2789539638","https://openalex.org/W2904246096","https://openalex.org/W2927928207","https://openalex.org/W2949600457","https://openalex.org/W2962808524","https://openalex.org/W2962899390","https://openalex.org/W2963390419","https://openalex.org/W2963906246","https://openalex.org/W2964043796","https://openalex.org/W2964198579","https://openalex.org/W2964288524","https://openalex.org/W2981030070","https://openalex.org/W2995298643","https://openalex.org/W3015437096","https://openalex.org/W3021708257","https://openalex.org/W3031634197","https://openalex.org/W3101442004","https://openalex.org/W3115293622","https://openalex.org/W3122690883","https://openalex.org/W3129658336","https://openalex.org/W3175558129","https://openalex.org/W3186672455","https://openalex.org/W3194488868","https://openalex.org/W3200266741","https://openalex.org/W3216772467","https://openalex.org/W4286963241","https://openalex.org/W4287811291","https://openalex.org/W4288294128","https://openalex.org/W4297887856","https://openalex.org/W4310895557","https://openalex.org/W6631190155","https://openalex.org/W6639480849","https://openalex.org/W6639732818","https://openalex.org/W6640963894","https://openalex.org/W6683633756","https://openalex.org/W6684393244","https://openalex.org/W6692846177","https://openalex.org/W6733306783","https://openalex.org/W6736179038","https://openalex.org/W6736469832","https://openalex.org/W6744354654","https://openalex.org/W6746282794","https://openalex.org/W6747473740","https://openalex.org/W6751494529","https://openalex.org/W6756256016","https://openalex.org/W6757358677","https://openalex.org/W6760514122","https://openalex.org/W6762585180","https://openalex.org/W6765407481","https://openalex.org/W6768397756","https://openalex.org/W6768511085","https://openalex.org/W6771217966","https://openalex.org/W6776867236","https://openalex.org/W6783988234","https://openalex.org/W6785137750","https://openalex.org/W6787713516","https://openalex.org/W6790314768","https://openalex.org/W6799458897","https://openalex.org/W6801655106","https://openalex.org/W6801964084","https://openalex.org/W6804601995","https://openalex.org/W6966558720"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W2586732548","https://openalex.org/W3049728571","https://openalex.org/W20361778","https://openalex.org/W2024136090","https://openalex.org/W1508899372"],"abstract_inverted_index":{"Reinforcement":[0,225],"Learning":[1,226],"has":[2],"been":[3],"shown":[4],"to":[5,16,69,140,190,223,274,298],"have":[6],"a":[7,106,113,118,124,129,161,185,258],"great":[8],"potential":[9,67],"for":[10,37,42,52,204,260],"robotics.":[11],"It":[12],"demonstrated":[13],"the":[14,35,50,75,81,93,99,137,143,153,156,164,169,182,196,206,212,216,221,235,239,250,268,278,293,303],"capability":[15],"solve":[17],"complex":[18],"manipulation":[19],"and":[20,58,85,90,128,149,152,254,287],"locomotion":[21],"tasks,":[22],"even":[23],"by":[24],"learning":[25],"end-to-end":[26],"policies":[27,103,299],"that":[28,116],"operate":[29],"directly":[30,301],"on":[31,163,172,227,234,252],"visual":[32,84],"input,":[33],"removing":[34],"need":[36,51,222],"custom":[38],"perception":[39],"systems.":[40],"However,":[41,80],"practical":[43],"robotics":[44],"applications,":[45],"its":[46],"scarce":[47],"sample":[48,71],"efficiency,":[49],"huge":[53],"amounts":[54],"of":[55,77,102,136,146,155,184,238,257,272],"resources,":[56],"data,":[57,229],"computation":[59],"time":[60,295],"can":[61,180],"be":[62],"an":[63],"insurmountable":[64],"obstacle.":[65],"One":[66],"solution":[68],"this":[70,109,178],"efficiency":[72],"issue":[73],"is":[74,270],"use":[76],"simulated":[78],"environments.":[79],"discrepancy":[82],"in":[83,215,277,284,302],"physical":[86],"characteristics":[87],"between":[88],"reality":[89,191],"simulation,":[91],"namely":[92],"sim-to-real":[94,114,144,255],"gap,":[95],"often":[96],"significantly":[97],"reduces":[98],"real-world":[100,173,201,228,244],"performance":[101],"trained":[104,186,300],"within":[105],"simulator.":[107],"In":[108],"work":[110],"we":[111,219,231],"propose":[112],"technique":[115],"trains":[117],"Soft-Actor":[119],"Critic":[120],"agent":[121,187],"together":[122],"with":[123,296],"decoupled":[125,134],"feature":[126,147,170,207,240],"extractor":[127,148,171],"latent-space":[130],"dynamics":[131,157],"model.":[132],"The":[133],"nature":[135],"method":[138,251,269],"allows":[139],"independently":[141],"perform":[142],"transfer":[145,183,256],"control":[150,197,213],"policy,":[151,198],"presence":[154],"model":[158],"acts":[159],"as":[160,282],"constraint":[162],"latent":[165],"representation":[166],"when":[167],"finetuning":[168,195],"data.":[174],"We":[175,248,265],"show":[176],"how":[177,267],"architecture":[179],"allow":[181],"from":[188],"simulation":[189],"without":[192],"retraining":[193],"or":[194],"but":[199],"using":[200],"data":[202],"only":[203,232],"adapting":[205,273],"extractor.":[208],"By":[209],"avoiding":[210],"training":[211,237,294],"policy":[214,259],"real":[217],"domain":[218],"overcome":[220],"apply":[224],"instead,":[230],"focus":[233],"unsupervised":[236],"extractor,":[241],"considerably":[242],"reducing":[243,292],"experience":[245],"collection":[246],"requirements.":[247],"evaluate":[249],"sim-to-sim":[253],"table-top":[261],"robotic":[262],"object":[263],"pushing.":[264],"demonstrate":[266],"capable":[271],"considerable":[275],"variations":[276],"task":[279],"observations,":[280],"such":[281],"changes":[283],"point-of-view,":[285],"colors,":[286],"lighting,":[288],"all":[289],"while":[290],"substantially":[291],"respect":[297],"real.":[304]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2023-01-12T00:00:00"}
