{"id":"https://openalex.org/W4401215537","doi":"https://doi.org/10.1145/3638530.3654291","title":"Instance Selection for Dynamic Algorithm Configuration with Reinforcement Learning: Improving Generalization","display_name":"Instance Selection for Dynamic Algorithm Configuration with Reinforcement Learning: Improving Generalization","publication_year":2024,"publication_date":"2024-07-14","ids":{"openalex":"https://openalex.org/W4401215537","doi":"https://doi.org/10.1145/3638530.3654291"},"language":"en","primary_location":{"id":"doi:10.1145/3638530.3654291","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3638530.3654291","pdf_url":null,"source":{"id":"https://openalex.org/S4363608771","display_name":"Proceedings of the Genetic and Evolutionary Computation Conference Companion","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Genetic and Evolutionary Computation Conference Companion","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035141000","display_name":"Carolin Benjamins","orcid":"https://orcid.org/0009-0007-4643-3564"},"institutions":[{"id":"https://openalex.org/I114112103","display_name":"Leibniz University Hannover","ror":"https://ror.org/0304hq317","country_code":"DE","type":"education","lineage":["https://openalex.org/I114112103"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Carolin Benjamins","raw_affiliation_strings":["Leibniz University Hannover, Hannover, Germany"],"raw_orcid":"https://orcid.org/0009-0007-4643-3564","affiliations":[{"raw_affiliation_string":"Leibniz University Hannover, Hannover, Germany","institution_ids":["https://openalex.org/I114112103"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066396028","display_name":"Gjorgjina Cenikj","orcid":"https://orcid.org/0000-0002-2723-0821"},"institutions":[{"id":"https://openalex.org/I3006985408","display_name":"Jo\u017eef Stefan Institute","ror":"https://ror.org/05060sz93","country_code":"SI","type":"facility","lineage":["https://openalex.org/I3006985408"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Gjorgjina Cenikj","raw_affiliation_strings":["Jozef Stefan Institute, Ljubljana, Slovenia"],"raw_orcid":"https://orcid.org/0000-0002-2723-0821","affiliations":[{"raw_affiliation_string":"Jozef Stefan Institute, Ljubljana, Slovenia","institution_ids":["https://openalex.org/I3006985408"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055785474","display_name":"Ana Nikolikj","orcid":"https://orcid.org/0000-0002-6983-9627"},"institutions":[{"id":"https://openalex.org/I3006985408","display_name":"Jo\u017eef Stefan Institute","ror":"https://ror.org/05060sz93","country_code":"SI","type":"facility","lineage":["https://openalex.org/I3006985408"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Ana Nikolikj","raw_affiliation_strings":["Jozef Stefan Institute, Ljubljana, Slovenia"],"raw_orcid":"https://orcid.org/0000-0002-6983-9627","affiliations":[{"raw_affiliation_string":"Jozef Stefan Institute, Ljubljana, Slovenia","institution_ids":["https://openalex.org/I3006985408"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102919894","display_name":"Aditya Mohan","orcid":"https://orcid.org/0000-0003-0092-3780"},"institutions":[{"id":"https://openalex.org/I114112103","display_name":"Leibniz University Hannover","ror":"https://ror.org/0304hq317","country_code":"DE","type":"education","lineage":["https://openalex.org/I114112103"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Aditya Mohan","raw_affiliation_strings":["Leibniz University Hannover, Hannover, Germany"],"raw_orcid":"https://orcid.org/0000-0003-0092-3780","affiliations":[{"raw_affiliation_string":"Leibniz University Hannover, Hannover, Germany","institution_ids":["https://openalex.org/I114112103"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082115266","display_name":"Tome Eftimov","orcid":"https://orcid.org/0000-0001-7330-1902"},"institutions":[{"id":"https://openalex.org/I3006985408","display_name":"Jo\u017eef Stefan Institute","ror":"https://ror.org/05060sz93","country_code":"SI","type":"facility","lineage":["https://openalex.org/I3006985408"]}],"countries":["SI"],"is_corresponding":false,"raw_author_name":"Tome Eftimov","raw_affiliation_strings":["Jozef Stefan Institute, Ljubljana, Slovenia"],"raw_orcid":"https://orcid.org/0000-0001-7330-1902","affiliations":[{"raw_affiliation_string":"Jozef Stefan Institute, Ljubljana, Slovenia","institution_ids":["https://openalex.org/I3006985408"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045511267","display_name":"Marius Lindauer","orcid":"https://orcid.org/0000-0002-9675-3175"},"institutions":[{"id":"https://openalex.org/I114112103","display_name":"Leibniz University Hannover","ror":"https://ror.org/0304hq317","country_code":"DE","type":"education","lineage":["https://openalex.org/I114112103"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Marius Lindauer","raw_affiliation_strings":["Leibniz University Hannover, Hannover, Germany"],"raw_orcid":"https://orcid.org/0000-0002-9675-3175","affiliations":[{"raw_affiliation_string":"Leibniz University Hannover, Hannover, Germany","institution_ids":["https://openalex.org/I114112103"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5035141000"],"corresponding_institution_ids":["https://openalex.org/I114112103"],"apc_list":null,"apc_paid":null,"fwci":0.2859,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.49741736,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"563","last_page":"566"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10100","display_name":"Metaheuristic Optimization Algorithms Research","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12205","display_name":"Time Series Analysis and Forecasting","score":0.9850000143051147,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.781739354133606},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.7453657984733582},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7089579105377197},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.6291642189025879},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5007956027984619},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.46818554401397705},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4104735553264618},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15971606969833374}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.781739354133606},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.7453657984733582},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7089579105377197},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.6291642189025879},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5007956027984619},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.46818554401397705},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4104735553264618},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15971606969833374},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3638530.3654291","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3638530.3654291","pdf_url":null,"source":{"id":"https://openalex.org/S4363608771","display_name":"Proceedings of the Genetic and Evolutionary Computation Conference Companion","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Genetic and Evolutionary Computation Conference Companion","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1117738264","display_name":null,"funder_award_id":"PR-12897","funder_id":"https://openalex.org/F4320322554","funder_display_name":"Javna Agencija za Raziskovalno Dejavnost RS"},{"id":"https://openalex.org/G6508940539","display_name":null,"funder_award_id":"PR-12393","funder_id":"https://openalex.org/F4320322554","funder_display_name":"Javna Agencija za Raziskovalno Dejavnost RS"},{"id":"https://openalex.org/G7799930752","display_name":null,"funder_award_id":"J2-4460","funder_id":"https://openalex.org/F4320322554","funder_display_name":"Javna Agencija za Raziskovalno Dejavnost RS"},{"id":"https://openalex.org/G791504897","display_name":null,"funder_award_id":"P2-0098","funder_id":"https://openalex.org/F4320322554","funder_display_name":"Javna Agencija za Raziskovalno Dejavnost RS"}],"funders":[{"id":"https://openalex.org/F4320320875","display_name":"Deutscher Akademischer Austauschdienst","ror":"https://ror.org/039djdh30"},{"id":"https://openalex.org/F4320322554","display_name":"Javna Agencija za Raziskovalno Dejavnost RS","ror":"https://ror.org/059bp8k51"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W576863261","https://openalex.org/W1471542436","https://openalex.org/W2042892801","https://openalex.org/W2160088187","https://openalex.org/W2560674852","https://openalex.org/W2608239929","https://openalex.org/W2967988901","https://openalex.org/W3004042307","https://openalex.org/W4313395123","https://openalex.org/W4315487473","https://openalex.org/W6606494994"],"related_works":["https://openalex.org/W2051487156","https://openalex.org/W2073681303","https://openalex.org/W4306904969","https://openalex.org/W3162204513","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W3084456289","https://openalex.org/W2024136090","https://openalex.org/W4391331176"],"abstract_inverted_index":{"Dynamic":[0],"Algorithm":[1],"Configuration":[2],"(DAC)":[3],"addresses":[4],"the":[5,42,52,64,91,103,106,113,117,133,137,143,149,159,169,176],"challenge":[6],"of":[7,11,18,46,82,116,127,161,178],"dynamically":[8],"setting":[9],"hyperparameters":[10],"an":[12],"algorithm":[13],"for":[14,105,112,153,185],"a":[15,35,60,72,79],"diverse":[16,186],"set":[17],"instances":[19,66,84],"rather":[20],"than":[21],"focusing":[22],"solely":[23],"on":[24,93,125,142,168],"individual":[25],"tasks.":[26],"Agents":[27],"trained":[28],"with":[29,136],"Deep":[30],"Reinforcement":[31],"Learning":[32],"(RL)":[33],"offer":[34],"pathway":[36],"to":[37,85,96,166],"solve":[38],"such":[39],"settings.":[40],"However,":[41],"limited":[43],"generalization":[44,68,99],"performance":[45],"these":[47],"agents":[48],"has":[49],"significantly":[50],"hindered":[51],"application":[53],"in":[54,63,181],"DAC.":[55],"Our":[56,173],"hypothesis":[57],"is":[58],"that":[59],"potential":[61],"bias":[62],"training":[65,83,167],"limits":[67],"capabilities.":[69],"We":[70],"take":[71],"step":[73],"towards":[74],"mitigating":[75],"this":[76,94],"by":[77,120,132],"selecting":[78],"representative":[80],"subset":[81,95,107],"overcome":[86],"overrepresentation":[87],"and":[88,129,145],"then":[89],"retraining":[90],"agent":[92,119],"improve":[97],"its":[98],"performance.":[100],"For":[101],"constructing":[102],"meta-features":[104],"selection,":[108],"we":[109,157],"particularly":[110],"account":[111],"dynamic":[114],"nature":[115],"RL":[118],"computing":[121],"time":[122],"series":[123],"features":[124],"trajectories":[126],"actions":[128],"rewards":[130],"generated":[131],"agent's":[134],"interaction":[135],"environment.":[138],"Through":[139],"empirical":[140],"evaluations":[141],"Sigmoid":[144],"CMA-ES":[146],"benchmarks":[147],"from":[148],"standard":[150],"benchmark":[151],"library":[152],"DAC,":[154],"called":[155],"DACBench,":[156],"discuss":[158],"potentials":[160],"our":[162],"selection":[163,180],"technique":[164],"compared":[165],"entire":[170],"instance":[171,179,187],"set.":[172],"results":[174],"highlight":[175],"efficacy":[177],"refining":[182],"DAC":[183],"policies":[184],"spaces.":[188]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
