{"id":"https://openalex.org/W3016995670","doi":"https://doi.org/10.1109/icaiic48513.2020.9065031","title":"Neural architecture search under black-box objectives with deep reinforcement learning and increasingly-sparse rewards","display_name":"Neural architecture search under black-box objectives with deep reinforcement learning and increasingly-sparse rewards","publication_year":2020,"publication_date":"2020-02-01","ids":{"openalex":"https://openalex.org/W3016995670","doi":"https://doi.org/10.1109/icaiic48513.2020.9065031","mag":"3016995670"},"language":"en","primary_location":{"id":"doi:10.1109/icaiic48513.2020.9065031","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icaiic48513.2020.9065031","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Conference on Artificial Intelligence in Information and Communication (ICAIIC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040179673","display_name":"Mitchel Alioscha\u2010Perez","orcid":"https://orcid.org/0000-0002-8488-5824"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Mitchel Alioscha-Perez","raw_affiliation_strings":["Electronics & Informatics Dept., Vrije Universiteit Brussel, VUB-NPU Joint AVSP Lab, Brussels, Belgium"],"affiliations":[{"raw_affiliation_string":"Electronics & Informatics Dept., Vrije Universiteit Brussel, VUB-NPU Joint AVSP Lab, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065477266","display_name":"Abel D\u00edaz Berenguer","orcid":"https://orcid.org/0000-0003-4970-6517"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Abel Diaz Berenguer","raw_affiliation_strings":["Electronics & Informatics Dept., Vrije Universiteit Brussel, VUB-NPU Joint AVSP Lab, Brussels, Belgium"],"affiliations":[{"raw_affiliation_string":"Electronics & Informatics Dept., Vrije Universiteit Brussel, VUB-NPU Joint AVSP Lab, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014851312","display_name":"Ercheng Pei","orcid":"https://orcid.org/0000-0003-3582-6809"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ercheng Pei","raw_affiliation_strings":["Northwestern Polytechnical University, School of Computer Science, VUB-NPU Joint AVSP Lab, Xi'an, China"],"affiliations":[{"raw_affiliation_string":"Northwestern Polytechnical University, School of Computer Science, VUB-NPU Joint AVSP Lab, Xi'an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069268336","display_name":"Meshia C\u00e9dric Oveneke","orcid":"https://orcid.org/0000-0003-4076-4614"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Meshia Cedric Oveneke","raw_affiliation_strings":["Electronics & Informatics Dept., Vrije Universiteit Brussel, VUB-NPU Joint AVSP Lab, Brussels, Belgium"],"affiliations":[{"raw_affiliation_string":"Electronics & Informatics Dept., Vrije Universiteit Brussel, VUB-NPU Joint AVSP Lab, Brussels, Belgium","institution_ids":["https://openalex.org/I13469542"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073820422","display_name":"Hichem Sahli","orcid":"https://orcid.org/0000-0002-1774-2970"},"institutions":[{"id":"https://openalex.org/I4210114974","display_name":"IMEC","ror":"https://ror.org/02kcbn207","country_code":"BE","type":"nonprofit","lineage":["https://openalex.org/I4210114974"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Hichem Sahli","raw_affiliation_strings":["Interuniv. MicroElectronics Centre, Heverlee, Belgium"],"affiliations":[{"raw_affiliation_string":"Interuniv. MicroElectronics Centre, Heverlee, Belgium","institution_ids":["https://openalex.org/I4210114974"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5040179673"],"corresponding_institution_ids":["https://openalex.org/I13469542"],"apc_list":null,"apc_paid":null,"fwci":0.2947,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.55120231,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"12","issue":null,"first_page":"276","last_page":"281"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7091243863105774},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6484407186508179},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6412391662597656},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6195335388183594},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6144694089889526},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.5190037488937378},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.45353201031684875},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.42467549443244934},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4166751801967621},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.19464558362960815}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7091243863105774},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6484407186508179},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6412391662597656},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6195335388183594},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6144694089889526},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.5190037488937378},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.45353201031684875},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.42467549443244934},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4166751801967621},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.19464558362960815},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icaiic48513.2020.9065031","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icaiic48513.2020.9065031","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Conference on Artificial Intelligence in Information and Communication (ICAIIC)","raw_type":"proceedings-article"},{"id":"pmh:oai:vubissmart:VUBISSMART:2000:129767","is_oa":false,"landing_page_url":"https://biblio.vub.ac.be/vubir/neural-architecture-search-under-blackbox-objectives-with-deep-reinforcement-learning-and-increasinglysparse-rewards(60f56a78-dd4f-4da5-93fb-368362a8f02f).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306402573","display_name":"VUBIR (Vrije Universiteit Brussel)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I13469542","host_organization_name":"Vrije Universiteit Brussel","host_organization_lineage":["https://openalex.org/I13469542"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1533861849","https://openalex.org/W1798702550","https://openalex.org/W2531409750","https://openalex.org/W2553303224","https://openalex.org/W2556372419","https://openalex.org/W2788853733","https://openalex.org/W2810075754","https://openalex.org/W2924820442","https://openalex.org/W2950277768","https://openalex.org/W2951104886","https://openalex.org/W2955931535","https://openalex.org/W2962750597","https://openalex.org/W2963374479","https://openalex.org/W2963918968","https://openalex.org/W2964024268","https://openalex.org/W2964043796","https://openalex.org/W2964081807","https://openalex.org/W2970866842","https://openalex.org/W2974623198","https://openalex.org/W4288333794","https://openalex.org/W4288409786","https://openalex.org/W6631943919","https://openalex.org/W6638209102","https://openalex.org/W6692846177","https://openalex.org/W6729956949","https://openalex.org/W6730269975","https://openalex.org/W6748587240","https://openalex.org/W6764965709"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W3084456289","https://openalex.org/W2024136090","https://openalex.org/W4391331176","https://openalex.org/W2586732548","https://openalex.org/W4380075502"],"abstract_inverted_index":{"In":[0,33],"this":[1,34,82],"paper,":[2],"we":[3,104],"address":[4],"the":[5,16,122,133,169,187,202],"problem":[6,83],"of":[7,45,88,135,174,201],"neural":[8,50,137],"architecture":[9,52,147],"search":[10],"(NAS)":[11],"in":[12,57,81,198],"a":[13,22,43,49,58,106],"context":[14,84],"where":[15],"optimality":[17],"policy":[18,113],"is":[19],"driven":[20],"by":[21,145],"black-box":[23],"Oracle":[24],"<tex":[25,36,53,67],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[26,37,54,68],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathcal{O}$</tex>":[27],"with":[28,115,149,182],"unknown":[29],"form":[30],"and":[31,74,153,156,171],"derivatives.":[32],"scenario,":[35],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathcal{O}(A_{C})$</tex>":[38],"typically":[39],"provides":[40],"readings":[41],"from":[42],"set":[44],"sensors":[46,188],"on":[47,112,121,186],"how":[48],"network":[51],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$A_{C}$</tex>":[55],"fares":[56],"target":[59],"hardware,":[60],"including":[61],"its:":[62],"power":[63],"consumption,":[64],"working":[65],"temperature,":[66],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathbf{cpu}/\\mathbf{gpu}$</tex>":[69],"usage,":[70],"central":[71],"bus":[72],"occupancy,":[73],"more.":[75],"Current":[76],"differentiable":[77],"NAS":[78,96,109],"approaches":[79,97],"fail":[80],"due":[85],"to":[86,90,130,139],"lack":[87],"access":[89],"derivatives,":[91],"whereas":[92],"traditional":[93],"reinforcement":[94,107],"learning":[95,108],"remain":[98],"too":[99],"expensive":[100],"computationally.":[101],"As":[102],"solution,":[103,176],"propose":[105],"strategy":[110,191],"based":[111],"gradient":[114],"increasingly":[116],"sparse":[117],"rewards.":[118],"We":[119],"rely":[120],"fact":[123],"[1]":[124],"that":[125],"one":[126],"does":[127],"not":[128],"need":[129],"fully":[131],"train":[132],"weights":[134,152,163],"two":[136],"networks":[138],"compare":[140],"them.":[141],"Our":[142,190],"solution":[143],"starts":[144],"comparing":[146],"candidates":[148],"almost":[150],"fixed":[151],"no":[154],"training,":[155],"progressively":[157],"shifts":[158],"toward":[159],"comparisons":[160],"under":[161],"full":[162],"training.":[164],"Experimental":[165],"results":[166],"confirmed":[167],"both":[168],"accuracy":[170],"training":[172],"efficiency":[173],"our":[175],"as":[177,179],"well":[178],"its":[180],"compliance":[181],"soft/hard":[183],"constraints":[184],"imposed":[185],"feedback.":[189],"allows":[192],"finding":[193],"near-optimal":[194],"architectures":[195],"significantly":[196],"faster,":[197],"approximately":[199],"1/3":[200],"time":[203],"it":[204],"would":[205],"take":[206],"otherwise.":[207]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
