{"id":"https://openalex.org/W2038584310","doi":"https://doi.org/10.1109/icsmc.2010.5642280","title":"Improving reinforcement learning algorithms by the use of data mining techniques for feature and action selection","display_name":"Improving reinforcement learning algorithms by the use of data mining techniques for feature and action selection","publication_year":2010,"publication_date":"2010-10-01","ids":{"openalex":"https://openalex.org/W2038584310","doi":"https://doi.org/10.1109/icsmc.2010.5642280","mag":"2038584310"},"language":"en","primary_location":{"id":"doi:10.1109/icsmc.2010.5642280","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icsmc.2010.5642280","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE International Conference on Systems, Man and Cybernetics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085849561","display_name":"Davi C.L. Vieira","orcid":"https://orcid.org/0000-0001-7447-4821"},"institutions":[{"id":"https://openalex.org/I25112270","display_name":"Universidade Federal de Pernambuco","ror":"https://ror.org/047908t24","country_code":"BR","type":"education","lineage":["https://openalex.org/I25112270"]}],"countries":["BR"],"is_corresponding":true,"raw_author_name":"Davi C. de L. Vieira","raw_affiliation_strings":["Centro de Inform\u00e1tica, Universidade Federal de Pernambuco, Recife, Brazil","Centro de Inform\u00e1tica, Universidade Federal de Pernambuco, Recife, Brasil#TAB#"],"affiliations":[{"raw_affiliation_string":"Centro de Inform\u00e1tica, Universidade Federal de Pernambuco, Recife, Brazil","institution_ids":["https://openalex.org/I25112270"]},{"raw_affiliation_string":"Centro de Inform\u00e1tica, Universidade Federal de Pernambuco, Recife, Brasil#TAB#","institution_ids":["https://openalex.org/I25112270"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049204941","display_name":"Paulo J. L. Adeodato","orcid":"https://orcid.org/0000-0002-0406-2474"},"institutions":[{"id":"https://openalex.org/I25112270","display_name":"Universidade Federal de Pernambuco","ror":"https://ror.org/047908t24","country_code":"BR","type":"education","lineage":["https://openalex.org/I25112270"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Paulo J. L. Adeodato","raw_affiliation_strings":["Centro de Inform\u00e1tica, Universidade Federal de Pernambuco, Recife, Brazil","Centro de Inform\u00e1tica, Universidade Federal de Pernambuco, Recife, Brasil#TAB#"],"affiliations":[{"raw_affiliation_string":"Centro de Inform\u00e1tica, Universidade Federal de Pernambuco, Recife, Brazil","institution_ids":["https://openalex.org/I25112270"]},{"raw_affiliation_string":"Centro de Inform\u00e1tica, Universidade Federal de Pernambuco, Recife, Brasil#TAB#","institution_ids":["https://openalex.org/I25112270"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103973147","display_name":"Paulo Gon\u00e7alv\u00e9s","orcid":null},"institutions":[{"id":"https://openalex.org/I25112270","display_name":"Universidade Federal de Pernambuco","ror":"https://ror.org/047908t24","country_code":"BR","type":"education","lineage":["https://openalex.org/I25112270"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Paulo M. Goncalves","raw_affiliation_strings":["Centro de Inform\u00e1tica, Universidade Federal de Pernambuco, Recife, Brazil","Centro de Inform\u00e1tica, Universidade Federal de Pernambuco, Recife, Brasil#TAB#"],"affiliations":[{"raw_affiliation_string":"Centro de Inform\u00e1tica, Universidade Federal de Pernambuco, Recife, Brazil","institution_ids":["https://openalex.org/I25112270"]},{"raw_affiliation_string":"Centro de Inform\u00e1tica, Universidade Federal de Pernambuco, Recife, Brasil#TAB#","institution_ids":["https://openalex.org/I25112270"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5085849561"],"corresponding_institution_ids":["https://openalex.org/I25112270"],"apc_list":null,"apc_paid":null,"fwci":0.9021,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.7997566,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1863","last_page":"1870"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10100","display_name":"Metaheuristic Optimization Algorithms Research","score":0.9284999966621399,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7934820652008057},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6884833574295044},{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.6422227621078491},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.5935015678405762},{"id":"https://openalex.org/keywords/action-selection","display_name":"Action selection","score":0.5490803718566895},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5390933752059937},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5232254862785339},{"id":"https://openalex.org/keywords/schema","display_name":"Schema (genetic algorithms)","score":0.5136075019836426},{"id":"https://openalex.org/keywords/data-stream-mining","display_name":"Data stream mining","score":0.45541810989379883},{"id":"https://openalex.org/keywords/learning-classifier-system","display_name":"Learning classifier system","score":0.4398089051246643},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.43333128094673157}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7934820652008057},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6884833574295044},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.6422227621078491},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.5935015678405762},{"id":"https://openalex.org/C166109690","wikidata":"https://www.wikidata.org/wiki/Q4677422","display_name":"Action selection","level":3,"score":0.5490803718566895},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5390933752059937},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5232254862785339},{"id":"https://openalex.org/C52146309","wikidata":"https://www.wikidata.org/wiki/Q7431116","display_name":"Schema (genetic algorithms)","level":2,"score":0.5136075019836426},{"id":"https://openalex.org/C89198739","wikidata":"https://www.wikidata.org/wiki/Q3079880","display_name":"Data stream mining","level":2,"score":0.45541810989379883},{"id":"https://openalex.org/C199190896","wikidata":"https://www.wikidata.org/wiki/Q3509276","display_name":"Learning classifier system","level":3,"score":0.4398089051246643},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.43333128094673157},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icsmc.2010.5642280","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icsmc.2010.5642280","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE International Conference on Systems, Man and Cybernetics","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W187357405","https://openalex.org/W1570713908","https://openalex.org/W1583833196","https://openalex.org/W1601481856","https://openalex.org/W1987187457","https://openalex.org/W1988821219","https://openalex.org/W1993740947","https://openalex.org/W2006303459","https://openalex.org/W2010798644","https://openalex.org/W2034587361","https://openalex.org/W2041367235","https://openalex.org/W2050206309","https://openalex.org/W2084378698","https://openalex.org/W2104641222","https://openalex.org/W2117341272","https://openalex.org/W2121863487","https://openalex.org/W2123602362","https://openalex.org/W2124776405","https://openalex.org/W2130105540","https://openalex.org/W2150948710","https://openalex.org/W2161879907","https://openalex.org/W2171436656","https://openalex.org/W2285257517","https://openalex.org/W2623293810","https://openalex.org/W2988864014","https://openalex.org/W3011120880","https://openalex.org/W3139377883","https://openalex.org/W4214717370","https://openalex.org/W4237171445","https://openalex.org/W4285719527","https://openalex.org/W6602901451","https://openalex.org/W6635849658","https://openalex.org/W6651865480","https://openalex.org/W6677347465","https://openalex.org/W6775686901","https://openalex.org/W6792155000"],"related_works":["https://openalex.org/W2083347156","https://openalex.org/W2069446265","https://openalex.org/W4255973740","https://openalex.org/W4389449520","https://openalex.org/W2074501513","https://openalex.org/W1667225191","https://openalex.org/W1492078655","https://openalex.org/W1569406210","https://openalex.org/W2031811237","https://openalex.org/W2121764364"],"abstract_inverted_index":{"Data":[0],"mining":[1,43,126],"can":[2],"be":[3,112],"seen":[4],"as":[5],"an":[6,248],"area":[7],"of":[8,21,34,66,74,80,93,137,163,173,182,199,221,233,245,252,262],"artificial":[9],"intelligence":[10],"that":[11,106,218],"seeks":[12],"to":[13,38,70,88,111,134,169,190,254,257,272],"extract":[14],"information":[15],"or":[16,27],"patterns":[17],"from":[18,60],"large":[19],"amounts":[20],"data":[22,42,125,138],"either":[23],"stored":[24],"in":[25,29,123,128,139,195,223,239,242,250],"databases":[26],"flowing":[28],"streams.":[30],"The":[31,64,91,121,214,265],"main":[32],"contribution":[33],"this":[35,67,94,143,159],"work":[36,95],"is":[37,69,132,180,207,269],"present":[39],"how":[40],"LVF":[41],"technique":[44,51],"improves":[45],"Sarsa(\u03bb)":[46,205],"algorithm":[47,206],"combined":[48,209],"with":[49,117,210],"tile-coding":[50,212],"by":[52,83,98,155,228,235],"selecting":[53],"the":[54,72,75,78,84,99,135,156,161,176,191,203,211,219,224,231,258],"most":[55],"relevant":[56],"features":[57,164],"and":[58,77,152,165,186,230,247,274],"actions":[59,153,166,188,234],"reinforcement":[61,129],"learning":[62,130],"environments.":[63],"objective":[65],"selection":[68,162],"reduce":[71],"complexity":[73],"problem":[76,172,179],"amount":[79,220,232],"memory":[81,197,243],"used":[82,208],"agent":[85,192],"thus":[86],"leading":[87],"faster":[89],"convergence.":[90],"motivation":[92],"was":[96],"inspired":[97],"rationale":[100],"behind":[101],"Occam's":[102],"razor,":[103],"which":[104,193,237],"describes":[105],"a":[107,118,140,146,170,196,240],"complex":[108],"model":[109],"tends":[110],"less":[113],"accurate":[114],"than":[115],"another":[116],"lower":[119],"complexity.":[120],"difficulty":[122],"using":[124],"techniques":[127],"environments":[131],"due":[133],"lack":[136],"database,":[141],"so":[142],"paper":[144],"proposes":[145],"storage":[147],"schema":[148],"for":[149],"states":[150],"visited":[151],"performed":[154],"agent.":[157],"In":[158],"study,":[160],"are":[167],"applied":[168],"specific":[171],"RoboCup":[174],"soccer,":[175],"dribble.":[177],"This":[178],"composed":[181],"20":[183],"continuous":[184],"variables":[185,222],"113":[187],"available":[189],"results":[194,216],"consumption":[198,244],"approximately":[200],"4.5mb":[201],"when":[202],"traditional":[204],"technique.":[213],"experiments'":[215],"show":[217],"environment":[225],"were":[226],"reduced":[227],"35%":[229],"65%,":[236],"resulted":[238],"reduction":[241],"43%":[246],"increase":[249],"performance":[251],"up":[253],"23%,":[255],"according":[256],"relative":[259],"frequency":[260],"distribution":[261],"agent's":[263],"success.":[264],"approach":[266],"proposed":[267],"here":[268],"both":[270],"easy":[271],"use":[273],"efficient.":[275]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
