{"id":"https://openalex.org/W2399299813","doi":"https://doi.org/10.3233/978-1-61499-419-0-981","title":"Using Ensemble Techniques and Multi-Objectivization to Solve Reinforcement Learning Problems","display_name":"Using Ensemble Techniques and Multi-Objectivization to Solve Reinforcement Learning Problems","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W2399299813","doi":"https://doi.org/10.3233/978-1-61499-419-0-981","mag":"2399299813"},"language":"en","primary_location":{"id":"doi:10.3233/978-1-61499-419-0-981","is_oa":true,"landing_page_url":"https://doi.org/10.3233/978-1-61499-419-0-981","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.3233/978-1-61499-419-0-981","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084002137","display_name":"Tim Brys","orcid":null},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Brys Tim","raw_affiliation_strings":["Vrije Universiteit Brussel, Belgium,"],"affiliations":[{"raw_affiliation_string":"Vrije Universiteit Brussel, Belgium,","institution_ids":["https://openalex.org/I13469542"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070914351","display_name":"Matthew E. Taylor","orcid":"https://orcid.org/0000-0001-8946-0211"},"institutions":[{"id":"https://openalex.org/I72951846","display_name":"Washington State University","ror":"https://ror.org/05dk0ce17","country_code":"US","type":"education","lineage":["https://openalex.org/I72951846"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Taylor Matthew E.","raw_affiliation_strings":["Washington State Univ., WA"],"affiliations":[{"raw_affiliation_string":"Washington State Univ., WA","institution_ids":["https://openalex.org/I72951846"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064553018","display_name":"Ann Now\u00e9","orcid":"https://orcid.org/0000-0001-6346-4564"},"institutions":[{"id":"https://openalex.org/I13469542","display_name":"Vrije Universiteit Brussel","ror":"https://ror.org/006e5kg04","country_code":"BE","type":"education","lineage":["https://openalex.org/I13469542"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Now&eacute; Ann","raw_affiliation_strings":["Vrije Universiteit Brussel, Belgium,"],"affiliations":[{"raw_affiliation_string":"Vrije Universiteit Brussel, Belgium,","institution_ids":["https://openalex.org/I13469542"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5084002137"],"corresponding_institution_ids":["https://openalex.org/I13469542"],"apc_list":null,"apc_paid":null,"fwci":1.3849,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.83116542,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"981","last_page":"982"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9803000092506409,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10551","display_name":"Scheduling and Optimization Algorithms","score":0.9605000019073486,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6400690078735352},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6034175157546997},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4410938620567322},{"id":"https://openalex.org/keywords/ensemble-learning","display_name":"Ensemble learning","score":0.41648465394973755},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41049709916114807},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.37385594844818115},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11025980114936829},{"id":"https://openalex.org/keywords/structural-engineering","display_name":"Structural engineering","score":0.045356035232543945}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6400690078735352},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6034175157546997},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4410938620567322},{"id":"https://openalex.org/C45942800","wikidata":"https://www.wikidata.org/wiki/Q245652","display_name":"Ensemble learning","level":2,"score":0.41648465394973755},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41049709916114807},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37385594844818115},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11025980114936829},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.045356035232543945}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3233/978-1-61499-419-0-981","is_oa":true,"landing_page_url":"https://doi.org/10.3233/978-1-61499-419-0-981","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},{"id":"mag:2399299813","is_oa":false,"landing_page_url":"https://ai.vub.ac.be/sites/default/files/ECAI-192.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306418308","display_name":"European Conference on Artificial Intelligence","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":"European Conference on Artificial Intelligence","raw_type":null}],"best_oa_location":{"id":"doi:10.3233/978-1-61499-419-0-981","is_oa":true,"landing_page_url":"https://doi.org/10.3233/978-1-61499-419-0-981","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.41999998688697815}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W1515851193","https://openalex.org/W1777239053","https://openalex.org/W2002305926","https://openalex.org/W2043806097","https://openalex.org/W2095564494","https://openalex.org/W2097381042","https://openalex.org/W2147492008","https://openalex.org/W2169659168"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W4387369504","https://openalex.org/W3046775127","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W3107602296","https://openalex.org/W4364306694","https://openalex.org/W4312192474"],"abstract_inverted_index":{"Recent":[0],"work":[1],"on":[2,82],"multi-objectivization":[3],"has":[4],"shown":[5],"how":[6],"a":[7,16,64],"single-objective":[8,42],"reinforcement":[9,74],"learning":[10,75],"problem":[11,18,43],"can":[12,35],"be":[13,36],"turned":[14],"into":[15],"multi-objective":[17],"with":[19],"correlated":[20,33,54],"objectives,":[21],"by":[22],"providing":[23],"multiple":[24],"reward":[25],"shaping":[26],"functions.":[27],"The":[28],"information":[29],"contained":[30],"in":[31],"these":[32],"objectives":[34],"exploited":[37],"to":[38,71],"solve":[39,72],"the":[40,83],"base,":[41],"faster":[44],"and":[45],"better,":[46],"given":[47],"techniques":[48,62],"specifically":[49],"aimed":[50],"at":[51],"handling":[52],"such":[53],"objectives.":[55],"In":[56],"this":[57],"paper,":[58],"we":[59],"identify":[60],"ensemble":[61],"as":[63],"set":[65],"of":[66],"methods":[67],"that":[68],"is":[69],"suitable":[70],"multi-objectivized":[73],"problems.":[76],"We":[77],"empirically":[78],"demonstrate":[79],"their":[80],"use":[81],"Pursuit":[84],"domain.":[85]},"counts_by_year":[{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2016-06-24T00:00:00"}
