{"id":"https://openalex.org/W4214888817","doi":"https://doi.org/10.1109/icaiic54071.2022.9722630","title":"Two-Policy Cooperative Transfer for Alleviation of Sim-to-Real Gap","display_name":"Two-Policy Cooperative Transfer for Alleviation of Sim-to-Real Gap","publication_year":2022,"publication_date":"2022-02-21","ids":{"openalex":"https://openalex.org/W4214888817","doi":"https://doi.org/10.1109/icaiic54071.2022.9722630"},"language":"en","primary_location":{"id":"doi:10.1109/icaiic54071.2022.9722630","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icaiic54071.2022.9722630","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Conference on Artificial Intelligence in Information and Communication (ICAIIC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063926276","display_name":"Liangdong Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Liangdong Wu","raw_affiliation_strings":["University of Chinese Academy of Sciences,School of Artificial Intelligence,Beijing,China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"University of Chinese Academy of Sciences,School of Artificial Intelligence,Beijing,China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056039500","display_name":"Fangzhou Xiong","orcid":"https://orcid.org/0000-0002-2592-4096"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fangzhou Xiong","raw_affiliation_strings":["Meituan,Beijing,China","Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan,Beijing,China","institution_ids":["https://openalex.org/I4210087373"]},{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100434504","display_name":"Zhiyong Liu","orcid":"https://orcid.org/0000-0003-2148-1846"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Liu","raw_affiliation_strings":["Institute of Automation Chinese Academy of Sciences,Beijing,China","Institute of Automation Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Automation Chinese Academy of Sciences,Beijing,China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Institute of Automation Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5063926276"],"corresponding_institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.1326,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.49290955,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"156","last_page":"161"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9896000027656555,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9786999821662903,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6748848557472229},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.665779709815979},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5556429028511047},{"id":"https://openalex.org/keywords/transfer","display_name":"Transfer (computing)","score":0.49101734161376953},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4811747968196869},{"id":"https://openalex.org/keywords/mainstream","display_name":"Mainstream","score":0.46446579694747925},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.46407440304756165},{"id":"https://openalex.org/keywords/information-gap","display_name":"Information gap","score":0.45312172174453735},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.4239789843559265},{"id":"https://openalex.org/keywords/policy-transfer","display_name":"Policy transfer","score":0.414318323135376},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.41048139333724976},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2757309675216675},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.142526775598526},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12034660577774048},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.1047743558883667},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.0909283459186554}],"concepts":[{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6748848557472229},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.665779709815979},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5556429028511047},{"id":"https://openalex.org/C2776175482","wikidata":"https://www.wikidata.org/wiki/Q1195816","display_name":"Transfer (computing)","level":2,"score":0.49101734161376953},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4811747968196869},{"id":"https://openalex.org/C2777617010","wikidata":"https://www.wikidata.org/wiki/Q18957","display_name":"Mainstream","level":2,"score":0.46446579694747925},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.46407440304756165},{"id":"https://openalex.org/C2993006568","wikidata":"https://www.wikidata.org/wiki/Q6031094","display_name":"Information gap","level":3,"score":0.45312172174453735},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.4239789843559265},{"id":"https://openalex.org/C2776731479","wikidata":"https://www.wikidata.org/wiki/Q15142682","display_name":"Policy transfer","level":2,"score":0.414318323135376},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.41048139333724976},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2757309675216675},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.142526775598526},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12034660577774048},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.1047743558883667},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0909283459186554},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C3116431","wikidata":"https://www.wikidata.org/wiki/Q31728","display_name":"Public administration","level":1,"score":0.0},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icaiic54071.2022.9722630","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icaiic54071.2022.9722630","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Conference on Artificial Intelligence in Information and Communication (ICAIIC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Partnerships for the goals","id":"https://metadata.un.org/sdg/17","score":0.46000000834465027}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321133","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W1481659984","https://openalex.org/W2158782408","https://openalex.org/W2530944449","https://openalex.org/W2605102758","https://openalex.org/W2767050701","https://openalex.org/W2781726626","https://openalex.org/W2908261578","https://openalex.org/W2911087563","https://openalex.org/W2962957005","https://openalex.org/W2968116426","https://openalex.org/W2990747716","https://openalex.org/W3088310808","https://openalex.org/W3100789280","https://openalex.org/W3101442004","https://openalex.org/W3111934344","https://openalex.org/W3120778962","https://openalex.org/W3130451601","https://openalex.org/W3204973825","https://openalex.org/W4300799055","https://openalex.org/W6728367041","https://openalex.org/W6731094094","https://openalex.org/W6740801417","https://openalex.org/W6747473740","https://openalex.org/W6780559895","https://openalex.org/W6784298057"],"related_works":["https://openalex.org/W1583826057","https://openalex.org/W2377237701","https://openalex.org/W2360099860","https://openalex.org/W4323893170","https://openalex.org/W2352463596","https://openalex.org/W2380850119","https://openalex.org/W2101450440","https://openalex.org/W4321371032","https://openalex.org/W2555410439","https://openalex.org/W2605246557"],"abstract_inverted_index":{"The":[0],"main":[1],"difficulty":[2],"of":[3,90,95,104,108,116,129,141,144,171],"sim-to-real":[4],"is":[5,27,35,57,63],"the":[6,10,14,28,38,67,77,81,88,93,102,105,113,127,130,134,139,148,153,169,172],"reality":[7],"gap":[8,96,109,137,151],"between":[9],"source":[11],"domain":[12,25],"and":[13,69,92,138,167],"target":[15],"domain.":[16],"In":[17,43],"order":[18],"to":[19,36,65,75,79,125],"solve":[20],"it,":[21],"various":[22],"methods":[23],"where":[24],"randomization":[26],"mainstream":[29],"have":[30],"been":[31],"emerged,":[32],"whose":[33,55],"essence":[34],"make":[37],"single":[39],"policy":[40,60,71,110,119],"more":[41],"robust.":[42],"contrast,":[44],"we":[45,84,156],"propose":[46],"a":[47],"novel":[48],"transfer":[49,114],"method,":[50,101],"namely":[51],"two-policy":[52],"cooperative":[53],"transfer,":[54],"core":[56],"that":[58],"one":[59],"(task":[61],"policy)":[62,73],"used":[64],"complete":[66],"task":[68,91,118],"another":[70],"(gap":[72],"aims":[74],"assist":[76],"former":[78],"cover":[80],"gap,":[82],"hence":[83],"can":[85],"focus":[86],"on":[87,99,112,164],"training":[89],"overcoming":[94],"respectively.":[97],"Based":[98],"this":[100],"setting":[103],"learning":[106],"objective":[107],"depends":[111],"situation":[115],"deploying":[117],"into":[120],"real":[121],"system,":[122],"besides":[123],"how":[124],"conduct":[126],"cooperation":[128],"both":[131],"lies":[132],"in":[133,152],"threshold":[135],"reflecting":[136],"coupling":[140],"output":[142],"actions":[143],"two":[145],"policies.":[146],"For":[147],"typical":[149],"contact-rich":[150],"dynamics":[154],"field,":[155],"design":[157],"an":[158],"adaptive":[159],"object":[160],"pushing":[161],"experiment":[162],"based":[163],"UR3":[165],"robot,":[166],"verify":[168],"effectiveness":[170],"proposed":[173],"method.":[174]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
