{"id":"https://openalex.org/W2753176368","doi":"https://doi.org/10.1109/snpd.2017.8022767","title":"Developing game AI agent behaving like human by mixing reinforcement learning and supervised learning","display_name":"Developing game AI agent behaving like human by mixing reinforcement learning and supervised learning","publication_year":2017,"publication_date":"2017-06-01","ids":{"openalex":"https://openalex.org/W2753176368","doi":"https://doi.org/10.1109/snpd.2017.8022767","mag":"2753176368"},"language":"en","primary_location":{"id":"doi:10.1109/snpd.2017.8022767","is_oa":false,"landing_page_url":"https://doi.org/10.1109/snpd.2017.8022767","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 18th IEEE/ACIS International Conference on Software Engineering, Artificial Intelligence, Networking and Parallel/Distributed Computing (SNPD)","raw_type":"proceedings-article"},"type":"conference-paper","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064218476","display_name":"Shohei Miyashita","orcid":null},"institutions":[{"id":"https://openalex.org/I65837984","display_name":"Kobe University","ror":"https://ror.org/03tgsfw79","country_code":"JP","type":"education","lineage":["https://openalex.org/I65837984"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shohei Miyashita","raw_affiliation_strings":["Department of Computer Science and Systems Engineering, Kobe University, Hyogo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Systems Engineering, Kobe University, Hyogo, Japan","institution_ids":["https://openalex.org/I65837984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063628500","display_name":"Xinyu Lian","orcid":"https://orcid.org/0009-0003-8143-4862"},"institutions":[{"id":"https://openalex.org/I65837984","display_name":"Kobe University","ror":"https://ror.org/03tgsfw79","country_code":"JP","type":"education","lineage":["https://openalex.org/I65837984"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Xinyu Lian","raw_affiliation_strings":["Graduate School of System Informatics, Kobe University, Hyogo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of System Informatics, Kobe University, Hyogo, Japan","institution_ids":["https://openalex.org/I65837984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039845750","display_name":"Xiao Zeng","orcid":"https://orcid.org/0000-0001-5638-6545"},"institutions":[{"id":"https://openalex.org/I65837984","display_name":"Kobe University","ror":"https://ror.org/03tgsfw79","country_code":"JP","type":"education","lineage":["https://openalex.org/I65837984"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Xiao Zeng","raw_affiliation_strings":["Graduate School of System Informatics, Kobe University, Hyogo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of System Informatics, Kobe University, Hyogo, Japan","institution_ids":["https://openalex.org/I65837984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068667478","display_name":"Takashi Matsubara","orcid":"https://orcid.org/0000-0003-0642-4800"},"institutions":[{"id":"https://openalex.org/I65837984","display_name":"Kobe University","ror":"https://ror.org/03tgsfw79","country_code":"JP","type":"education","lineage":["https://openalex.org/I65837984"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takashi Matsubara","raw_affiliation_strings":["Graduate School of System Informatics, Kobe University, Hyogo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of System Informatics, Kobe University, Hyogo, Japan","institution_ids":["https://openalex.org/I65837984"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023847482","display_name":"Kuniaki Uehara","orcid":"https://orcid.org/0000-0002-7160-3752"},"institutions":[{"id":"https://openalex.org/I65837984","display_name":"Kobe University","ror":"https://ror.org/03tgsfw79","country_code":"JP","type":"education","lineage":["https://openalex.org/I65837984"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kuniaki Uehara","raw_affiliation_strings":["Graduate School of System Informatics, Kobe University, Hyogo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of System Informatics, Kobe University, Hyogo, Japan","institution_ids":["https://openalex.org/I65837984"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I65837984"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"489","last_page":"494"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9884999990463257,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8200611472129822},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7350265979766846},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6868529319763184},{"id":"https://openalex.org/keywords/turing-test","display_name":"Turing test","score":0.6706624031066895},{"id":"https://openalex.org/keywords/video-game","display_name":"Video game","score":0.43982818722724915},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.43444231152534485},{"id":"https://openalex.org/keywords/turing","display_name":"Turing","score":0.41760289669036865},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.41679826378822327},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3939284086227417},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.07997235655784607},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.06723278760910034}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8200611472129822},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7350265979766846},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6868529319763184},{"id":"https://openalex.org/C577917","wikidata":"https://www.wikidata.org/wiki/Q189223","display_name":"Turing test","level":2,"score":0.6706624031066895},{"id":"https://openalex.org/C3018412434","wikidata":"https://www.wikidata.org/wiki/Q7889","display_name":"Video game","level":2,"score":0.43982818722724915},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.43444231152534485},{"id":"https://openalex.org/C9870796","wikidata":"https://www.wikidata.org/wiki/Q490481","display_name":"Turing","level":2,"score":0.41760289669036865},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.41679826378822327},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3939284086227417},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.07997235655784607},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.06723278760910034},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/snpd.2017.8022767","is_oa":false,"landing_page_url":"https://doi.org/10.1109/snpd.2017.8022767","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 18th IEEE/ACIS International Conference on Software Engineering, Artificial Intelligence, Networking and Parallel/Distributed Computing (SNPD)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W656377046","https://openalex.org/W1522301498","https://openalex.org/W1557517019","https://openalex.org/W1574691582","https://openalex.org/W2001771035","https://openalex.org/W2016053056","https://openalex.org/W2026485182","https://openalex.org/W2041224215","https://openalex.org/W2098535914","https://openalex.org/W2130750514","https://openalex.org/W2141559645","https://openalex.org/W2145339207","https://openalex.org/W2156387975","https://openalex.org/W2163605009","https://openalex.org/W2164128966","https://openalex.org/W2182734678","https://openalex.org/W2291634899","https://openalex.org/W2319588593","https://openalex.org/W2546302380","https://openalex.org/W2737560561","https://openalex.org/W2914656440","https://openalex.org/W3103379718","https://openalex.org/W4240117034","https://openalex.org/W6631190155","https://openalex.org/W6682889407","https://openalex.org/W6683971778","https://openalex.org/W6684191040","https://openalex.org/W6697024158"],"related_works":["https://openalex.org/W4243955206","https://openalex.org/W4401606958","https://openalex.org/W102057119","https://openalex.org/W4200331595","https://openalex.org/W2082052067","https://openalex.org/W1783366861","https://openalex.org/W3156272347","https://openalex.org/W4293218357","https://openalex.org/W3038981710","https://openalex.org/W223264744"],"abstract_inverted_index":{"Artificial":[0],"intelligence":[1],"(AI)":[2],"agent":[3,74,87,190,196],"created":[4],"with":[5],"Deep":[6],"Q-Networks":[7],"(DQN)":[8],"can":[9],"defeat":[10],"human":[11,80,110,121,195],"agents":[12,81,96,117],"in":[13,59],"video":[14],"games.":[15,63],"Despite":[16],"its":[17,103],"high":[18],"performance,":[19],"DQN":[20,37],"often":[21,106],"exhibits":[22,88],"odd":[23],"behaviors,":[24],"which":[25],"could":[26],"be":[27,142],"immersion-breaking":[28],"against":[29],"the":[30,43,65,134,171,184],"purpose":[31,114],"of":[32,40,62,79,98,115,133,139,191],"creating":[33],"game":[34,44,172],"AI.":[35],"Moreover,":[36],"is":[38,105,118],"capable":[39],"reacting":[41],"to":[42,56,119],"environment":[45],"much":[46],"faster":[47],"than":[48,93,109,194,200],"humans,":[49],"making":[50],"itself":[51],"invincible":[52],"(thus":[53],"not":[54],"fun":[55],"play":[57,77],"with)":[58],"certain":[60],"types":[61],"On":[64],"other":[66],"hand,":[67],"supervised":[68,153],"learning":[69,86,95,151,154,202],"framework":[70],"trains":[71],"an":[72,188],"AI":[73,116,135,189],"using":[75],"historical":[76],"data":[78],"as":[82],"training":[83,100],"data.":[84,101],"Supervised":[85],"a":[89,127],"more":[90],"human-like":[91],"behavior":[92,129,199],"reinforcement":[94,150,201],"because":[97],"imitating":[99],"However,":[102],"performance":[104,125,193],"no":[107],"better":[108,192],"agents.":[111,203],"The":[112,179],"ultimate":[113],"entertain":[120],"players.":[122],"A":[123],"good":[124],"and":[126,137,152,155,162,174,197],"humanlike":[128],"are":[130],"important":[131],"factors":[132],"agents,":[136],"both":[138],"them":[140],"should":[141],"achieved":[143],"simultaneously.":[144],"This":[145],"study":[146],"proposes":[147],"frameworks":[148,186],"combining":[149],"we":[156],"call":[157],"then":[158],"separated":[159],"network":[160,164],"model":[161],"shared":[163],"model.":[165],"We":[166],"evaluated":[167],"their":[168],"performances":[169],"by":[170,176],"scores":[173],"behaviors":[175],"Turing":[177],"test.":[178],"experimental":[180],"results":[181],"demonstrate":[182],"that":[183],"proposed":[185],"develop":[187],"natural":[198]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2}],"updated_date":"2026-07-14T23:27:15.235271","created_date":"2025-10-10T00:00:00"}