{"id":"https://openalex.org/W4389315167","doi":"https://doi.org/10.1109/cog57401.2023.10333204","title":"Naruto Mobile: AI Sparring Partner Using Heterogeneous Deep Reinforcement Learning","display_name":"Naruto Mobile: AI Sparring Partner Using Heterogeneous Deep Reinforcement Learning","publication_year":2023,"publication_date":"2023-08-21","ids":{"openalex":"https://openalex.org/W4389315167","doi":"https://doi.org/10.1109/cog57401.2023.10333204"},"language":"en","primary_location":{"id":"doi:10.1109/cog57401.2023.10333204","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/cog57401.2023.10333204","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE Conference on Games (CoG)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048485159","display_name":"Elvis S. Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Elvis S. Liu","raw_affiliation_strings":["Tencent Games,China","Tencent Games, China"],"affiliations":[{"raw_affiliation_string":"Tencent Games,China","institution_ids":["https://openalex.org/I2250653659"]},{"raw_affiliation_string":"Tencent Games, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006442353","display_name":"Weifan Li","orcid":"https://orcid.org/0000-0003-1871-8355"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weifan Li","raw_affiliation_strings":["Chinese Academy of Sciences,Institute of Automation,China","Institute of Automation, Chinese Academy of Sciences, China"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Institute of Automation,China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045927034","display_name":"Yuan Zhou","orcid":"https://orcid.org/0009-0008-1706-6539"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuan Zhou","raw_affiliation_strings":["Tencent Games,China","Tencent Games, China"],"affiliations":[{"raw_affiliation_string":"Tencent Games,China","institution_ids":["https://openalex.org/I2250653659"]},{"raw_affiliation_string":"Tencent Games, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102587540","display_name":"Hugh Cao","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hugh Cao","raw_affiliation_strings":["Tencent Games,China","Tencent Games, China"],"affiliations":[{"raw_affiliation_string":"Tencent Games,China","institution_ids":["https://openalex.org/I2250653659"]},{"raw_affiliation_string":"Tencent Games, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5109079445","display_name":"Zhengwen Zeng","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhengwen Zeng","raw_affiliation_strings":["Tencent Games,China","Tencent Games, China"],"affiliations":[{"raw_affiliation_string":"Tencent Games,China","institution_ids":["https://openalex.org/I2250653659"]},{"raw_affiliation_string":"Tencent Games, China","institution_ids":["https://openalex.org/I2250653659"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5048485159"],"corresponding_institution_ids":["https://openalex.org/I2250653659"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.16011622,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"33","issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11197","display_name":"Digital Games and Media","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8385335206985474},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.715848445892334},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.5846920013427734},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.5835980772972107},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5546186566352844},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5304255485534668},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5172005891799927},{"id":"https://openalex.org/keywords/video-game","display_name":"Video game","score":0.5013582706451416},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.42881399393081665},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.3269491195678711},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0678068995475769}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8385335206985474},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.715848445892334},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.5846920013427734},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.5835980772972107},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5546186566352844},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5304255485534668},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5172005891799927},{"id":"https://openalex.org/C3018412434","wikidata":"https://www.wikidata.org/wiki/Q7889","display_name":"Video game","level":2,"score":0.5013582706451416},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.42881399393081665},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.3269491195678711},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0678068995475769},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cog57401.2023.10333204","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/cog57401.2023.10333204","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE Conference on Games (CoG)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.4300000071525574,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W2569196563","https://openalex.org/W2766463513","https://openalex.org/W2808378895","https://openalex.org/W2810602713","https://openalex.org/W2913668833","https://openalex.org/W2982316857","https://openalex.org/W2996037775","https://openalex.org/W2999850024","https://openalex.org/W3041310931","https://openalex.org/W3084241738","https://openalex.org/W3099518626","https://openalex.org/W3107951310","https://openalex.org/W3110979110","https://openalex.org/W4206145040","https://openalex.org/W4214596723","https://openalex.org/W4299802797","https://openalex.org/W6734313880","https://openalex.org/W6738796088","https://openalex.org/W6748638692","https://openalex.org/W6772005887","https://openalex.org/W6785535465"],"related_works":["https://openalex.org/W2032233321","https://openalex.org/W3121970507","https://openalex.org/W2110028391","https://openalex.org/W54497855","https://openalex.org/W217960748","https://openalex.org/W3125814499","https://openalex.org/W4306904969","https://openalex.org/W2090827041","https://openalex.org/W3162204513","https://openalex.org/W2094012830"],"abstract_inverted_index":{"Naruto":[0,71,132,163],"Mobile":[1,72,133,164],"is":[2,52,63,74,195],"a":[3,23,77,93,104,115,207],"popular":[4],"mobile":[5],"Fighting":[6],"Game":[7],"with":[8,59],"over":[9],"100":[10],"million":[11,184],"registered":[12],"players.":[13,47],"AI":[14,117,127,167],"agents":[15,58],"are":[16,148],"deployed":[17],"extensively":[18],"to":[19,38,56,65,67,125,165],"the":[20,142,159,171,189,196],"game":[21],"for":[22],"wide":[24],"variety":[25],"of":[26,79,96,162,173,191],"applications":[27],"such":[28,100],"as":[29,92],"level":[30],"challenges":[31],"and":[32,42,45,89,108,134,145],"player":[33],"training,":[34],"which":[35,73],"require":[36,103],"them":[37],"fight":[39],"like":[40,70],"humans":[41],"imitate":[43],"strong":[44],"weak":[46],"Although":[48],"deep":[49,200],"reinforcement":[50,201],"learning":[51,202],"an":[53],"excellent":[54],"approach":[55,95,119],"creating":[57],"diverse":[60],"behaviors,":[61],"it":[62],"difficult":[64],"apply":[66],"massive-scale":[68,137],"games":[69],"built":[75],"on":[76],"pool":[78],"more":[80,181],"than":[81,182],"300":[82,183],"characters":[83],"that":[84,141,199],"have":[85,177],"unique":[86],"skills,":[87],"speed,":[88],"attack":[90],"range,":[91],"traditional":[94],"self-play":[97,138],"training":[98,109,118,139],"at":[99,170],"scale":[101],"may":[102],"substantial":[105],"computational":[106,143],"cost":[107],"time.In":[110],"this":[111,175,194],"paper,":[112,176],"we":[113],"present":[114],"new":[116],"called":[120],"Heterogeneous":[121],"Exploitation":[122],"Self-Play":[123],"(HESP)":[124],"improve":[126],"agent":[128],"generalization":[129],"ability":[130],"in":[131,180],"optimize":[135],"its":[136],"so":[140],"costs":[144],"train":[146],"time":[147,172,198],"significantly":[149],"reduced.":[150],"The":[151],"proposed":[152],"algorithm":[153],"has":[154,203],"already":[155],"been":[156,178,204],"employed":[157,205],"by":[158,206],"development":[160],"team":[161],"create":[166],"agents,":[168],"which,":[169],"writing":[174],"used":[179],"human-AI":[185],"fighting":[186,209],"matches.":[187],"To":[188],"best":[190],"our":[192],"knowledge,":[193],"first":[197],"commercial":[208],"game.":[210]},"counts_by_year":[],"updated_date":"2025-12-22T23:10:17.713674","created_date":"2025-10-10T00:00:00"}
