{"id":"https://openalex.org/W4404491734","doi":"https://doi.org/10.1007/s00521-024-10445-2","title":"Scalable reinforcement learning-based neural architecture search","display_name":"Scalable reinforcement learning-based neural architecture search","publication_year":2024,"publication_date":"2024-11-18","ids":{"openalex":"https://openalex.org/W4404491734","doi":"https://doi.org/10.1007/s00521-024-10445-2"},"language":"en","primary_location":{"id":"doi:10.1007/s00521-024-10445-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-024-10445-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-024-10445-2.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s00521-024-10445-2.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059626420","display_name":"Amber Cassimon","orcid":"https://orcid.org/0000-0002-7471-2508"},"institutions":[{"id":"https://openalex.org/I149213910","display_name":"University of Antwerp","ror":"https://ror.org/008x57b05","country_code":"BE","type":"education","lineage":["https://openalex.org/I149213910"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Amber Cassimon","raw_affiliation_strings":["IDLab - Faculty of Applied Engineering, University of Antwerp - imec, Sint-Pietersvliet 7, 2000, Antwerp, Antwerp, Belgium"],"raw_orcid":"https://orcid.org/0000-0002-7471-2508","affiliations":[{"raw_affiliation_string":"IDLab - Faculty of Applied Engineering, University of Antwerp - imec, Sint-Pietersvliet 7, 2000, Antwerp, Antwerp, Belgium","institution_ids":["https://openalex.org/I149213910"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015248763","display_name":"Siegfried Mercelis","orcid":"https://orcid.org/0000-0001-9355-6566"},"institutions":[{"id":"https://openalex.org/I149213910","display_name":"University of Antwerp","ror":"https://ror.org/008x57b05","country_code":"BE","type":"education","lineage":["https://openalex.org/I149213910"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Siegfried Mercelis","raw_affiliation_strings":["IDLab - Faculty of Applied Engineering, University of Antwerp - imec, Sint-Pietersvliet 7, 2000, Antwerp, Antwerp, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IDLab - Faculty of Applied Engineering, University of Antwerp - imec, Sint-Pietersvliet 7, 2000, Antwerp, Antwerp, Belgium","institution_ids":["https://openalex.org/I149213910"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5084961388","display_name":"Kevin Mets","orcid":"https://orcid.org/0000-0002-4812-4841"},"institutions":[{"id":"https://openalex.org/I149213910","display_name":"University of Antwerp","ror":"https://ror.org/008x57b05","country_code":"BE","type":"education","lineage":["https://openalex.org/I149213910"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Kevin Mets","raw_affiliation_strings":["IDLab - Faculty of Applied Engineering, University of Antwerp - imec, Sint-Pietersvliet 7, 2000, Antwerp, Antwerp, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IDLab - Faculty of Applied Engineering, University of Antwerp - imec, Sint-Pietersvliet 7, 2000, Antwerp, Antwerp, Belgium","institution_ids":["https://openalex.org/I149213910"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5059626420"],"corresponding_institution_ids":["https://openalex.org/I149213910"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":3.9503,"has_fulltext":true,"cited_by_count":13,"citation_normalized_percentile":{"value":0.94470635,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"37","issue":"1","first_page":"231","last_page":"261"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8613107800483704},{"id":"https://openalex.org/keywords/computational-science-and-engineering","display_name":"Computational Science and Engineering","score":0.7916271686553955},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7539262771606445},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6333199143409729},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5815091729164124},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.503523051738739},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.49340954422950745},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.47349557280540466},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4518723487854004},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.09231868386268616},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.07497313618659973}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8613107800483704},{"id":"https://openalex.org/C68597687","wikidata":"https://www.wikidata.org/wiki/Q362601","display_name":"Computational Science and Engineering","level":2,"score":0.7916271686553955},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7539262771606445},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6333199143409729},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5815091729164124},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.503523051738739},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.49340954422950745},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.47349557280540466},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4518723487854004},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.09231868386268616},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.07497313618659973},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s00521-024-10445-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-024-10445-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-024-10445-2.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s00521-024-10445-2","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00521-024-10445-2","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00521-024-10445-2.pdf","source":{"id":"https://openalex.org/S147897268","display_name":"Neural Computing and Applications","issn_l":"0941-0643","issn":["0941-0643","1433-3058"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Neural Computing and Applications","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.6000000238418579}],"awards":[{"id":"https://openalex.org/G1192456679","display_name":null,"funder_award_id":"1SC8821N","funder_id":"https://openalex.org/F4320321730","funder_display_name":"Fonds Wetenschappelijk Onderzoek"}],"funders":[{"id":"https://openalex.org/F4320321587","display_name":"Vlaamse Overheid","ror":"https://ror.org/04qxsrb28"},{"id":"https://openalex.org/F4320321730","display_name":"Fonds Wetenschappelijk Onderzoek","ror":"https://ror.org/03qtxy027"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4404491734.pdf"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W2097117768","https://openalex.org/W2119717200","https://openalex.org/W2194775991","https://openalex.org/W2946547492","https://openalex.org/W2954234207","https://openalex.org/W2964081807","https://openalex.org/W2981406437","https://openalex.org/W2997699039","https://openalex.org/W3003257820","https://openalex.org/W3107893198","https://openalex.org/W3150058922","https://openalex.org/W4292787289","https://openalex.org/W4309609199","https://openalex.org/W4312878236","https://openalex.org/W4365397863","https://openalex.org/W4367047454","https://openalex.org/W4372260390","https://openalex.org/W4379984978","https://openalex.org/W4392194134","https://openalex.org/W6600388300","https://openalex.org/W6600778605","https://openalex.org/W6600804061","https://openalex.org/W6602434089","https://openalex.org/W6828894009"],"related_works":["https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W2920061524","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588","https://openalex.org/W2086122291","https://openalex.org/W1987513656"],"abstract_inverted_index":{"Abstract":[0],"We":[1,24,63,142],"assess":[2],"the":[3,15,28,40,60,66,92,98,109,125,136,140,147],"feasibility":[4],"of":[5,30,94,113,127,139,149,158],"a":[6,20,45,54,155],"reusable":[7],"neural":[8,47],"architecture":[9],"search":[10,22,81],"agent":[11,35,56,117],"aimed":[12],"at":[13],"amortizing":[14],"initial":[16],"time-investment":[17],"in":[18],"building":[19],"good":[21],"strategy.":[23],"do":[25],"this":[26],"through":[27,154],"use":[29],"Reinforcement":[31],"Learning,":[32],"where":[33],"an":[34],"learns":[36],"to":[37,43,120,134],"iteratively":[38],"select":[39],"best":[41],"way":[42],"modify":[44],"given":[46],"network":[48],"architecture.":[49],"This":[50],"is":[51,102,118],"achieved":[52],"using":[53,59],"transformer-based":[55],"design":[57],"trained":[58],"Ape-X":[61],"algorithm.":[62],"consider":[64],"both":[65,90],"NAS-Bench-101":[67],"and":[68,71,82,162],"NAS-Bench-301":[69,101],"settings,":[70],"compare":[72],"against":[73],"various":[74],"known":[75],"strong":[76,110,122],"baselines,":[77],"such":[78],"as":[79],"local":[80],"random":[83],"search.":[84],"While":[85],"achieving":[86],"competitive":[87],"performance":[88],"on":[89],"benchmarks,":[91],"amount":[93],"training":[95,138],"required":[96],"for":[97,129,146,152],"much":[99],"larger":[100],"only":[103],"marginally":[104],"greater":[105],"than":[106],"NAS-Bench-101,":[107],"illustrating":[108],"scaling":[111],"properties":[112],"our":[114,159],"agent.":[115,141],"Our":[116],"able":[119],"achieve":[121],"performance,":[123],"but":[124],"choice":[126],"values":[128,151],"certain":[130],"parameters":[131],"are":[132],"crucial":[133],"ensuring":[135],"succesful":[137],"provide":[143],"some":[144],"guidance":[145],"selection":[148],"appropriate":[150],"hyperparameters":[153],"detailed":[156],"description":[157],"experimental":[160],"setup":[161],"several":[163],"ablation":[164],"studies.":[165]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":9}],"updated_date":"2026-06-13T06:13:01.061226","created_date":"2025-10-10T00:00:00"}
