{"id":"https://openalex.org/W3160414592","doi":"https://doi.org/10.1109/icpr48806.2021.9412240","title":"Evaluating Initialization of Nelder-Mead Method for Hyperparameter Optimization in Deep Learning","display_name":"Evaluating Initialization of Nelder-Mead Method for Hyperparameter Optimization in Deep Learning","publication_year":2021,"publication_date":"2021-01-10","ids":{"openalex":"https://openalex.org/W3160414592","doi":"https://doi.org/10.1109/icpr48806.2021.9412240","mag":"3160414592"},"language":"en","primary_location":{"id":"doi:10.1109/icpr48806.2021.9412240","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr48806.2021.9412240","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 25th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078375838","display_name":"Shintaro Takenaga","orcid":"https://orcid.org/0000-0002-6824-7603"},"institutions":[{"id":"https://openalex.org/I916559398","display_name":"Kindai University","ror":"https://ror.org/05kt9ap64","country_code":"JP","type":"education","lineage":["https://openalex.org/I916559398"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Shintaro Takenaga","raw_affiliation_strings":["Kindai University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Kindai University","institution_ids":["https://openalex.org/I916559398"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062660811","display_name":"Shuhei Watanabe","orcid":"https://orcid.org/0000-0001-6611-2812"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shuhei Watanabe","raw_affiliation_strings":["AI Research Center:AIST"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AI Research Center:AIST","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101431510","display_name":"Masahiro Nomura","orcid":"https://orcid.org/0000-0002-4945-5984"},"institutions":[{"id":"https://openalex.org/I4210089607","display_name":"CyberAgent (Japan)","ror":"https://ror.org/0060jg679","country_code":"JP","type":"company","lineage":["https://openalex.org/I4210089607"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Masahiro Nomura","raw_affiliation_strings":["AI Research Center:AIST & CyberAgent, Inc"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AI Research Center:AIST & CyberAgent, Inc","institution_ids":["https://openalex.org/I4210089607"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020641297","display_name":"Yoshihiko Ozaki","orcid":"https://orcid.org/0000-0001-7911-4470"},"institutions":[{"id":"https://openalex.org/I2799969541","display_name":"The Art Institutes","ror":"https://ror.org/01p2ej961","country_code":"US","type":"education","lineage":["https://openalex.org/I2799969541"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yoshihiko Ozaki","raw_affiliation_strings":["AI Research Center:AIST & GREE, Inc"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AI Research Center:AIST & GREE, Inc","institution_ids":["https://openalex.org/I2799969541"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031341888","display_name":"Masaki Onishi","orcid":"https://orcid.org/0000-0002-4580-4868"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Masaki Onishi","raw_affiliation_strings":["AI Research Center:AIST"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AI Research Center:AIST","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009330022","display_name":"Hitoshi Habe","orcid":"https://orcid.org/0000-0002-7895-2402"},"institutions":[{"id":"https://openalex.org/I916559398","display_name":"Kindai University","ror":"https://ror.org/05kt9ap64","country_code":"JP","type":"education","lineage":["https://openalex.org/I916559398"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hitoshi Habe","raw_affiliation_strings":["Kindai University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Kindai University","institution_ids":["https://openalex.org/I916559398"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5078375838"],"corresponding_institution_ids":["https://openalex.org/I916559398"],"apc_list":null,"apc_paid":null,"fwci":0.4198,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.68349483,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"3372","last_page":"3379"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10848","display_name":"Advanced Multi-Objective Optimization Algorithms","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10100","display_name":"Metaheuristic Optimization Algorithms Research","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hyperparameter","display_name":"Hyperparameter","score":0.9381946325302124},{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.7401853799819946},{"id":"https://openalex.org/keywords/maxima-and-minima","display_name":"Maxima and minima","score":0.6676857471466064},{"id":"https://openalex.org/keywords/hyperparameter-optimization","display_name":"Hyperparameter optimization","score":0.6495662331581116},{"id":"https://openalex.org/keywords/simplex","display_name":"Simplex","score":0.6320908069610596},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6043069958686829},{"id":"https://openalex.org/keywords/simplex-algorithm","display_name":"Simplex algorithm","score":0.572855532169342},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5638831853866577},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5389087796211243},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4655386209487915},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.42036885023117065},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.41671156883239746},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3318905234336853},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.29445725679397583},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.11527541279792786},{"id":"https://openalex.org/keywords/linear-programming","display_name":"Linear programming","score":0.10828393697738647}],"concepts":[{"id":"https://openalex.org/C8642999","wikidata":"https://www.wikidata.org/wiki/Q4171168","display_name":"Hyperparameter","level":2,"score":0.9381946325302124},{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.7401853799819946},{"id":"https://openalex.org/C186633575","wikidata":"https://www.wikidata.org/wiki/Q845060","display_name":"Maxima and minima","level":2,"score":0.6676857471466064},{"id":"https://openalex.org/C10485038","wikidata":"https://www.wikidata.org/wiki/Q48996162","display_name":"Hyperparameter optimization","level":3,"score":0.6495662331581116},{"id":"https://openalex.org/C62438384","wikidata":"https://www.wikidata.org/wiki/Q331350","display_name":"Simplex","level":2,"score":0.6320908069610596},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6043069958686829},{"id":"https://openalex.org/C144521790","wikidata":"https://www.wikidata.org/wiki/Q134164","display_name":"Simplex algorithm","level":3,"score":0.572855532169342},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5638831853866577},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5389087796211243},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4655386209487915},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.42036885023117065},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41671156883239746},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3318905234336853},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.29445725679397583},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.11527541279792786},{"id":"https://openalex.org/C41045048","wikidata":"https://www.wikidata.org/wiki/Q202843","display_name":"Linear programming","level":2,"score":0.10828393697738647},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icpr48806.2021.9412240","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icpr48806.2021.9412240","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 25th International Conference on Pattern Recognition (ICPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1524954183","https://openalex.org/W1529817821","https://openalex.org/W1995832922","https://openalex.org/W2097998348","https://openalex.org/W2112036188","https://openalex.org/W2112796928","https://openalex.org/W2140691217","https://openalex.org/W2169369819","https://openalex.org/W2171074980","https://openalex.org/W2401231614","https://openalex.org/W2767790836","https://openalex.org/W2809894947","https://openalex.org/W2964137095","https://openalex.org/W3005347330","https://openalex.org/W3118608800","https://openalex.org/W3216490951","https://openalex.org/W4213308398","https://openalex.org/W4238255529","https://openalex.org/W4285719527","https://openalex.org/W6674385629"],"related_works":["https://openalex.org/W2953665647","https://openalex.org/W4281646320","https://openalex.org/W3169687406","https://openalex.org/W2954882791","https://openalex.org/W4388119537","https://openalex.org/W4205712847","https://openalex.org/W1974336862","https://openalex.org/W3014750173","https://openalex.org/W4287818966","https://openalex.org/W3192751261"],"abstract_inverted_index":{"In":[0,85],"deep":[1,26,107,170],"learning,":[2,108],"hyperparameters":[3],"can":[4],"severely":[5],"affect":[6],"the":[7,33,43,49,52,81,101,144,153,164],"learning":[8,139],"model":[9,113],"performance.":[10],"The":[11],"Nelder-Mead":[12],"(NM)":[13],"method":[14],"is":[15,38,57,147],"known":[16],"for":[17,22,93],"showing":[18],"a":[19,61,111,115,157],"superior":[20],"performance":[21,45],"hyperparameter":[23,104,167],"optimization":[24,105,125,168],"in":[25,80,106,137,169],"learning.":[27,171],"An":[28],"initial":[29,34,53,63,74,96,120,159],"simplex,":[30],"one":[31,77],"of":[32,51,103,166],"NM":[35],"method's":[36],"values,":[37],"usually":[39],"determined":[40],"randomly":[41],"while":[42],"search":[44,83],"strongly":[46],"depends":[47],"on":[48],"shape":[50],"simplex.":[54],"Therefore,":[55],"it":[56],"necessary":[58],"to":[59,71,99,124,152,162],"determine":[60],"proper":[62],"simplex":[64,75,97,121,160],"as":[65],"previous":[66],"researchers":[67],"have":[68],"proposed":[69],"methods":[70,92],"construct":[72],"an":[73,95],"from":[76],"starting":[78,145],"point":[79,146],"bounded":[82],"space.":[84],"this":[86],"study,":[87],"we":[88],"verified":[89],"how":[90],"these":[91],"constructing":[94],"contribute":[98],"improving":[100,163],"result":[102,165],"by":[109,126],"using":[110],"simple":[112],"and":[114,155],"complicated":[116],"model.":[117],"A":[118],"smaller":[119],"may":[122],"fail":[123],"bad":[127,134],"local":[128,135],"minima":[129,136],"because":[130],"there":[131],"are":[132],"some":[133],"both":[138],"models.":[140],"We":[141],"concluded":[142],"that":[143,156],"not":[148],"necessarily":[149],"located":[150],"close":[151],"origin,":[154],"larger":[158],"contributes":[161]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2026-05-13T08:25:38.343686","created_date":"2025-10-10T00:00:00"}
