{"id":"https://openalex.org/W2977677027","doi":"https://doi.org/10.1109/ijcnn.2019.8851819","title":"SOM-based Algorithm for Multi-armed Bandit Problem","display_name":"SOM-based Algorithm for Multi-armed Bandit Problem","publication_year":2019,"publication_date":"2019-07-01","ids":{"openalex":"https://openalex.org/W2977677027","doi":"https://doi.org/10.1109/ijcnn.2019.8851819","mag":"2977677027"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn.2019.8851819","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2019.8851819","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019058148","display_name":"Nobuhito Manome","orcid":"https://orcid.org/0000-0003-1436-908X"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]},{"id":"https://openalex.org/I4210120159","display_name":"SoftBank Group (Japan)","ror":"https://ror.org/02ew2ks20","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210120159"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Nobuhito Manome","raw_affiliation_strings":["SoftBank Robotics Corp., The University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"SoftBank Robotics Corp., The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I4210120159","https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021671793","display_name":"Shuji Shinohara","orcid":"https://orcid.org/0000-0001-8442-836X"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shuji Shinohara","raw_affiliation_strings":["Graduate School of Engineering, The University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103905991","display_name":"Kouta Suzuki","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]},{"id":"https://openalex.org/I4210120159","display_name":"SoftBank Group (Japan)","ror":"https://ror.org/02ew2ks20","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210120159"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kouta Suzuki","raw_affiliation_strings":["SoftBank Robotics Corp., The University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"SoftBank Robotics Corp., The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I4210120159","https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083250031","display_name":"Kosuke Tomonaga","orcid":null},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]},{"id":"https://openalex.org/I4210120159","display_name":"SoftBank Group (Japan)","ror":"https://ror.org/02ew2ks20","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210120159"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kosuke Tomonaga","raw_affiliation_strings":["SoftBank Robotics Corp., The University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"SoftBank Robotics Corp., The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I4210120159","https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040101387","display_name":"Shunji Mitsuyoshi","orcid":"https://orcid.org/0000-0002-3441-3335"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shunji Mitsuyoshi","raw_affiliation_strings":["Graduate School of Engineering, The University of Tokyo, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering, The University of Tokyo, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5019058148"],"corresponding_institution_ids":["https://openalex.org/I4210120159","https://openalex.org/I74801974"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.1426702,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12288","display_name":"Optimization and Search Problems","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/multi-armed-bandit","display_name":"Multi-armed bandit","score":0.8072516918182373},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6825989484786987},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5903332233428955},{"id":"https://openalex.org/keywords/thompson-sampling","display_name":"Thompson sampling","score":0.5623168349266052},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5561211109161377},{"id":"https://openalex.org/keywords/lever","display_name":"Lever","score":0.4812862277030945},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3804720938205719},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.35359644889831543},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1911087930202484},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.17910557985305786},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1218656599521637},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.0942598283290863}],"concepts":[{"id":"https://openalex.org/C123197309","wikidata":"https://www.wikidata.org/wiki/Q2882343","display_name":"Multi-armed bandit","level":3,"score":0.8072516918182373},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6825989484786987},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5903332233428955},{"id":"https://openalex.org/C73602740","wikidata":"https://www.wikidata.org/wiki/Q7795822","display_name":"Thompson sampling","level":3,"score":0.5623168349266052},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5561211109161377},{"id":"https://openalex.org/C107524782","wikidata":"https://www.wikidata.org/wiki/Q40164","display_name":"Lever","level":2,"score":0.4812862277030945},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3804720938205719},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.35359644889831543},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1911087930202484},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.17910557985305786},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1218656599521637},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.0942598283290863},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C50817715","wikidata":"https://www.wikidata.org/wiki/Q79895177","display_name":"Regret","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn.2019.8851819","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2019.8851819","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1515851193","https://openalex.org/W1679913846","https://openalex.org/W1998498767","https://openalex.org/W2039522160","https://openalex.org/W2108746281","https://openalex.org/W2112420033","https://openalex.org/W2158319693","https://openalex.org/W2168405694","https://openalex.org/W2169728355","https://openalex.org/W2331759129","https://openalex.org/W2551842929","https://openalex.org/W2552689039","https://openalex.org/W2614907933","https://openalex.org/W2726822279","https://openalex.org/W2762229518","https://openalex.org/W2772625704","https://openalex.org/W2791797914","https://openalex.org/W2795488051","https://openalex.org/W2801223223","https://openalex.org/W2802863340","https://openalex.org/W2856780764","https://openalex.org/W2886895914","https://openalex.org/W2896702309","https://openalex.org/W3121632328","https://openalex.org/W4213332169","https://openalex.org/W4214717370","https://openalex.org/W6684673071","https://openalex.org/W6753529177"],"related_works":["https://openalex.org/W2613863488","https://openalex.org/W2331759129","https://openalex.org/W2952186526","https://openalex.org/W2946219535","https://openalex.org/W4221165587","https://openalex.org/W2806567655","https://openalex.org/W4289887588","https://openalex.org/W3165844356","https://openalex.org/W1911551976","https://openalex.org/W4212898069"],"abstract_inverted_index":{"To":[0],"satisfy":[1],"a":[2,5,32,48,56,58,67,103,125,129,169],"user":[3,25,97],"facing":[4],"communication":[6,90],"robot":[7,91],"having":[8],"various":[9],"behavior":[10,18,86],"options,":[11],"it":[12,109,151],"is":[13,20,73,110,159],"necessary":[14],"to":[15,41,74,112,132],"output":[16],"the":[17,24,42,64,71,76,81,85,89,93,96,100,114,118,134,146,156,163,178],"that":[19,78,116,155],"most":[21],"suitable":[22],"for":[23,145],"faster.":[26,121],"Such":[27],"problems":[28],"are":[29],"formulated":[30],"as":[31,92,99,183],"multi-armed":[33,37,135],"bandit":[34,38,136,148],"problem.":[35,137],"The":[36],"problem":[39,43],"refers":[40],"of":[44,88,161],"maximizing":[45],"gain":[46],"in":[47,80,168],"situation":[49,170],"with":[50,66,105,165,171,177],"multiple":[51,139],"arms":[52,65,174],"where,":[53],"by":[54],"pulling":[55],"lever,":[57],"reward":[59,120,167],"can":[60],"be":[61],"obtained":[62],"from":[63],"certain":[68],"probability,":[69],"and":[70,95,150,186],"challenge":[72],"select":[75,113],"arm":[77,115,164],"results":[79],"maximum":[82,119],"reward.":[83],"Considering":[84],"options":[87],"arms,":[94,108],"satisfaction":[98],"reward,":[101],"under":[102],"condition":[104],"even":[106,172],"more":[107,173],"desirable":[111],"produces":[117],"This":[122],"study":[123],"proposes":[124],"new":[126],"algorithm":[127],"using":[128],"self-organizing":[130],"map":[131],"solve":[133],"Moreover,":[138],"numerical":[140],"experiments":[141],"have":[142],"been":[143,153],"conducted":[144],"stochastic":[147],"problem,":[149],"has":[152],"demonstrated":[154],"proposed":[157],"method":[158],"capable":[160],"selecting":[162],"higher":[166],"faster,":[175],"compared":[176],"existing":[179],"representative":[180],"algorithms":[181],"such":[182],"UCB1,":[184],"UCB1-tuned,":[185],"Thompson":[187],"sampling.":[188]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
