{"id":"https://openalex.org/W2032378315","doi":"https://doi.org/10.1109/tcyb.2014.2311578","title":"A Clustering-Based Graph Laplacian Framework for Value Function Approximation in Reinforcement Learning","display_name":"A Clustering-Based Graph Laplacian Framework for Value Function Approximation in Reinforcement Learning","publication_year":2014,"publication_date":"2014-04-25","ids":{"openalex":"https://openalex.org/W2032378315","doi":"https://doi.org/10.1109/tcyb.2014.2311578","mag":"2032378315","pmid":"https://pubmed.ncbi.nlm.nih.gov/24802018"},"language":"en","primary_location":{"id":"doi:10.1109/tcyb.2014.2311578","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2014.2311578","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053112608","display_name":"Xin Xu","orcid":"https://orcid.org/0000-0003-3238-745X"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xin Xu","raw_affiliation_strings":["College of Mechatronics and Automation, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Mechatronics and Automation, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103082016","display_name":"Zhenhua Huang","orcid":"https://orcid.org/0000-0003-3178-9721"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenhua Huang","raw_affiliation_strings":["College of Mechatronics and Automation, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Mechatronics and Automation, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101753111","display_name":"Daniel Graves","orcid":"https://orcid.org/0000-0002-5345-6584"},"institutions":[{"id":"https://openalex.org/I154425047","display_name":"University of Alberta","ror":"https://ror.org/0160cpw27","country_code":"CA","type":"education","lineage":["https://openalex.org/I154425047"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Daniel Graves","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Alberta, Edmonton, AB, Canada"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Alberta, Edmonton, AB, Canada","institution_ids":["https://openalex.org/I154425047"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003799782","display_name":"Witold Pedrycz","orcid":"https://orcid.org/0000-0002-9335-9930"},"institutions":[{"id":"https://openalex.org/I66083562","display_name":"Systems Research Institute","ror":"https://ror.org/0111cp837","country_code":"PL","type":"facility","lineage":["https://openalex.org/I66083562","https://openalex.org/I99542240"]},{"id":"https://openalex.org/I154425047","display_name":"University of Alberta","ror":"https://ror.org/0160cpw27","country_code":"CA","type":"education","lineage":["https://openalex.org/I154425047"]},{"id":"https://openalex.org/I185163786","display_name":"King Abdulaziz University","ror":"https://ror.org/02ma4wv74","country_code":"SA","type":"education","lineage":["https://openalex.org/I185163786"]},{"id":"https://openalex.org/I99542240","display_name":"Polish Academy of Sciences","ror":"https://ror.org/01dr6c206","country_code":"PL","type":"funder","lineage":["https://openalex.org/I99542240"]}],"countries":["CA","PL","SA"],"is_corresponding":false,"raw_author_name":"Witold Pedrycz","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Faculty of Engineering, King Abdulaziz University, Jeddah, Saudi Arabia","Department of Electrical and Computer Engineering, University of Alberta, Edmonton, AB, Canada","Systems Research Institute, Polish Academy of Sciences, Warsaw, Poland"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Faculty of Engineering, King Abdulaziz University, Jeddah, Saudi Arabia","institution_ids":["https://openalex.org/I185163786"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Alberta, Edmonton, AB, Canada","institution_ids":["https://openalex.org/I154425047"]},{"raw_affiliation_string":"Systems Research Institute, Polish Academy of Sciences, Warsaw, Poland","institution_ids":["https://openalex.org/I66083562","https://openalex.org/I99542240"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5053112608"],"corresponding_institution_ids":["https://openalex.org/I170215575"],"apc_list":null,"apc_paid":null,"fwci":7.4777,"has_fulltext":false,"cited_by_count":36,"citation_normalized_percentile":{"value":0.97665249,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"44","issue":"12","first_page":"2613","last_page":"2625"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7804818153381348},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5502488613128662},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5364869832992554},{"id":"https://openalex.org/keywords/laplace-operator","display_name":"Laplace operator","score":0.4490280747413635},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.44790786504745483},{"id":"https://openalex.org/keywords/laplacian-matrix","display_name":"Laplacian matrix","score":0.4416186809539795},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.43434202671051025},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.37472325563430786},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.29992377758026123},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.29622524976730347},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.15314379334449768},{"id":"https://openalex.org/keywords/mathematical-analysis","display_name":"Mathematical analysis","score":0.06476888060569763},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.05567145347595215}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7804818153381348},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5502488613128662},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5364869832992554},{"id":"https://openalex.org/C165700671","wikidata":"https://www.wikidata.org/wiki/Q203484","display_name":"Laplace operator","level":2,"score":0.4490280747413635},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.44790786504745483},{"id":"https://openalex.org/C115178988","wikidata":"https://www.wikidata.org/wiki/Q772067","display_name":"Laplacian matrix","level":3,"score":0.4416186809539795},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.43434202671051025},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.37472325563430786},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.29992377758026123},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.29622524976730347},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.15314379334449768},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.06476888060569763},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.05567145347595215}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001185","descriptor_name":"Artificial Intelligence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003198","descriptor_name":"Computer Simulation","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008962","descriptor_name":"Models, Theoretical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008962","descriptor_name":"Models, Theoretical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008962","descriptor_name":"Models, Theoretical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D009716","descriptor_name":"Numerical Analysis, Computer-Assisted","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D009716","descriptor_name":"Numerical Analysis, Computer-Assisted","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D009716","descriptor_name":"Numerical Analysis, Computer-Assisted","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D012054","descriptor_name":"Reinforcement, Psychology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012054","descriptor_name":"Reinforcement, Psychology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012054","descriptor_name":"Reinforcement, Psychology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1109/tcyb.2014.2311578","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2014.2311578","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},{"id":"pmid:24802018","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/24802018","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on cybernetics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7799999713897705,"id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G5011351583","display_name":null,"funder_award_id":"91220301","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8665485977","display_name":null,"funder_award_id":"61075072","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W1578099820","https://openalex.org/W1626155273","https://openalex.org/W1966086707","https://openalex.org/W1986349306","https://openalex.org/W1995450389","https://openalex.org/W2014729048","https://openalex.org/W2021231414","https://openalex.org/W2043806097","https://openalex.org/W2050838777","https://openalex.org/W2052305027","https://openalex.org/W2063575204","https://openalex.org/W2068155564","https://openalex.org/W2086608109","https://openalex.org/W2094387729","https://openalex.org/W2106451198","https://openalex.org/W2110422826","https://openalex.org/W2111980775","https://openalex.org/W2118556122","https://openalex.org/W2120982017","https://openalex.org/W2122471363","https://openalex.org/W2124175081","https://openalex.org/W2132351269","https://openalex.org/W2132849848","https://openalex.org/W2134569556","https://openalex.org/W2137092694","https://openalex.org/W2141326110","https://openalex.org/W2143958939","https://openalex.org/W2144446635","https://openalex.org/W2147170031","https://openalex.org/W2151268438","https://openalex.org/W2160840682","https://openalex.org/W2161795906","https://openalex.org/W2165726932","https://openalex.org/W2483347049","https://openalex.org/W2487144912","https://openalex.org/W2586680856","https://openalex.org/W3027095131","https://openalex.org/W3103182070","https://openalex.org/W4214717370","https://openalex.org/W4233518571","https://openalex.org/W4239890145","https://openalex.org/W4245296547","https://openalex.org/W4285719527","https://openalex.org/W6634702315","https://openalex.org/W6676174466","https://openalex.org/W6678114464","https://openalex.org/W6679599195","https://openalex.org/W6683841269","https://openalex.org/W7066478640"],"related_works":["https://openalex.org/W2570009360","https://openalex.org/W4321440274","https://openalex.org/W3004345458","https://openalex.org/W2883186538","https://openalex.org/W2051180862","https://openalex.org/W1976439244","https://openalex.org/W2402951419","https://openalex.org/W2896947499","https://openalex.org/W4244587941","https://openalex.org/W2362501828"],"abstract_inverted_index":{"In":[0,30],"order":[1],"to":[2,141],"deal":[3],"with":[4,9,76,102,119,130],"the":[5,93,134,150],"sequential":[6],"decision":[7,73],"problems":[8],"large":[10],"or":[11,60],"continuous":[12,77,120],"state":[13,78,121],"spaces,":[14],"feature":[15,41],"representation":[16,42,111],"and":[17,43,124,149],"function":[18,45],"approximation":[19,46,106],"have":[20],"been":[21],"a":[22,33,64,103,158],"major":[23],"research":[24],"topic":[25],"in":[26,48,71,117],"reinforcement":[27],"learning":[28,151],"(RL).":[29],"this":[31],"paper,":[32],"clustering-based":[34,54,97],"graph":[35,65,94,98],"Laplacian":[36,66,99],"framework":[37],"is":[38,67,100],"presented":[39],"for":[40,83,115,157],"value":[44],"(VFA)":[47],"RL.":[49],"By":[50],"making":[51],"use":[52],"of":[53,92,105,146,160],"techniques,":[55],"that":[56],"is,":[57],"K-means":[58],"clustering":[59],"fuzzy":[61],"C-means":[62],"clustering,":[63],"constructed":[68],"by":[69],"subsampling":[70],"Markov":[72],"processes":[74],"(MDPs)":[75],"spaces.":[79,122],"The":[80,96],"basis":[81,147],"functions":[82,148],"VFA":[84],"can":[85,154],"be":[86,155],"automatically":[87],"generated":[88],"from":[89],"spectral":[90],"analysis":[91],"Laplacian.":[95],"integrated":[101],"class":[104],"policy":[107,112],"iteration":[108,113],"algorithms":[109],"called":[110],"(RPI)":[114],"RL":[116],"MDPs":[118],"Simulation":[123],"experimental":[125],"results":[126],"show":[127],"that,":[128],"compared":[129],"previous":[131],"RPI":[132],"methods,":[133],"proposed":[135],"approach":[136],"needs":[137],"fewer":[138],"sample":[139],"points":[140],"compute":[142],"an":[143],"efficient":[144],"set":[145],"control":[152],"performance":[153],"improved":[156],"variety":[159],"parameter":[161],"settings.":[162]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":7},{"year":2015,"cited_by_count":10}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
