{"id":"https://openalex.org/W2967043083","doi":"https://doi.org/10.1109/tsmc.2019.2926806","title":"Efficient Batch-Mode Reinforcement Learning Using Extreme Learning Machines","display_name":"Efficient Batch-Mode Reinforcement Learning Using Extreme Learning Machines","publication_year":2019,"publication_date":"2019-08-14","ids":{"openalex":"https://openalex.org/W2967043083","doi":"https://doi.org/10.1109/tsmc.2019.2926806","mag":"2967043083"},"language":"en","primary_location":{"id":"doi:10.1109/tsmc.2019.2926806","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2019.2926806","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102926784","display_name":"Jiahang Liu","orcid":"https://orcid.org/0009-0004-2054-2576"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiahang Liu","raw_affiliation_strings":["College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057599028","display_name":"Lei Zuo","orcid":"https://orcid.org/0000-0002-9938-7449"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Zuo","raw_affiliation_strings":["College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053112608","display_name":"Xin Xu","orcid":"https://orcid.org/0000-0003-3238-745X"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Xu","raw_affiliation_strings":["College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101668802","display_name":"Xinglong Zhang","orcid":"https://orcid.org/0000-0002-0587-2487"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinglong Zhang","raw_affiliation_strings":["College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073231890","display_name":"Junkai Ren","orcid":"https://orcid.org/0000-0002-6199-7452"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junkai Ren","raw_affiliation_strings":["College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055651722","display_name":"Qiang Fang","orcid":"https://orcid.org/0000-0002-5063-6889"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiang Fang","raw_affiliation_strings":["College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence Science and Technology, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101727888","display_name":"Xinwang Liu","orcid":"https://orcid.org/0000-0001-9066-1475"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinwang Liu","raw_affiliation_strings":["College of Computer, National University of Defense Technology, Changsha, China"],"affiliations":[{"raw_affiliation_string":"College of Computer, National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5102926784"],"corresponding_institution_ids":["https://openalex.org/I170215575"],"apc_list":null,"apc_paid":null,"fwci":0.8682,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.80972382,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"51","issue":"6","first_page":"3664","last_page":"3677"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9882000088691711,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10409","display_name":"Fuel Cells and Related Materials","score":0.986299991607666,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8348469734191895},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7660925388336182},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6829688549041748},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.611069917678833},{"id":"https://openalex.org/keywords/extreme-learning-machine","display_name":"Extreme learning machine","score":0.567510187625885},{"id":"https://openalex.org/keywords/batch-processing","display_name":"Batch processing","score":0.5321615934371948},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5299742221832275},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5235480666160583},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.47053131461143494},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.46788114309310913},{"id":"https://openalex.org/keywords/mode","display_name":"Mode (computer interface)","score":0.45569270849227905},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.43557652831077576},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.2666809558868408},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.24220877885818481},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1210198700428009}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8348469734191895},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7660925388336182},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6829688549041748},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.611069917678833},{"id":"https://openalex.org/C2780150128","wikidata":"https://www.wikidata.org/wiki/Q21948731","display_name":"Extreme learning machine","level":3,"score":0.567510187625885},{"id":"https://openalex.org/C172658912","wikidata":"https://www.wikidata.org/wiki/Q661613","display_name":"Batch processing","level":2,"score":0.5321615934371948},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5299742221832275},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5235480666160583},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.47053131461143494},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.46788114309310913},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.45569270849227905},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.43557652831077576},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.2666809558868408},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.24220877885818481},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1210198700428009},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tsmc.2019.2926806","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2019.2926806","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.46000000834465027,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G1189737475","display_name":null,"funder_award_id":"2018YFB1305105","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G5320757814","display_name":null,"funder_award_id":"U1564214","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7457541925","display_name":null,"funder_award_id":"61751311","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":62,"referenced_works":["https://openalex.org/W166862392","https://openalex.org/W1494474274","https://openalex.org/W1507222174","https://openalex.org/W1589747210","https://openalex.org/W1601081659","https://openalex.org/W1825869920","https://openalex.org/W1963523946","https://openalex.org/W1963616278","https://openalex.org/W1973433968","https://openalex.org/W1982029046","https://openalex.org/W1986278072","https://openalex.org/W1988707322","https://openalex.org/W1996640396","https://openalex.org/W1999912147","https://openalex.org/W2016355702","https://openalex.org/W2018500972","https://openalex.org/W2026131661","https://openalex.org/W2031878488","https://openalex.org/W2032378315","https://openalex.org/W2033956597","https://openalex.org/W2046513829","https://openalex.org/W2072931156","https://openalex.org/W2073384958","https://openalex.org/W2091565802","https://openalex.org/W2101133635","https://openalex.org/W2101674911","https://openalex.org/W2101786389","https://openalex.org/W2104714048","https://openalex.org/W2111072639","https://openalex.org/W2113921460","https://openalex.org/W2118556122","https://openalex.org/W2121863487","https://openalex.org/W2122040390","https://openalex.org/W2127412976","https://openalex.org/W2137983211","https://openalex.org/W2141695047","https://openalex.org/W2145339207","https://openalex.org/W2146957157","https://openalex.org/W2155910151","https://openalex.org/W2159312714","https://openalex.org/W2161795906","https://openalex.org/W2167982865","https://openalex.org/W2188644438","https://openalex.org/W2301408779","https://openalex.org/W2338719424","https://openalex.org/W2472390602","https://openalex.org/W2517537544","https://openalex.org/W2525713298","https://openalex.org/W2561849210","https://openalex.org/W2586680856","https://openalex.org/W2783311157","https://openalex.org/W2901276090","https://openalex.org/W2952108874","https://openalex.org/W3027095131","https://openalex.org/W3146803896","https://openalex.org/W4211221179","https://openalex.org/W4213251304","https://openalex.org/W4214717370","https://openalex.org/W4236439427","https://openalex.org/W4285719527","https://openalex.org/W4307347247","https://openalex.org/W6683841269"],"related_works":["https://openalex.org/W2067443264","https://openalex.org/W4400868993","https://openalex.org/W3096874164","https://openalex.org/W1985560493","https://openalex.org/W2386410636","https://openalex.org/W2357975469","https://openalex.org/W2145363145","https://openalex.org/W1626977535","https://openalex.org/W2341346307","https://openalex.org/W3168977894"],"abstract_inverted_index":{"As":[0],"a":[1,59,230],"class":[2],"of":[3,37,79,112,190,221,248],"batch-mode":[4,61,153],"reinforcement":[5],"learning":[6,81,101,115,180,253],"(RL)":[7],"methods":[8],"for":[9,49,68,132],"Markov":[10],"decision":[11,235],"problems":[12,86,182],"with":[13,64,193,257],"large":[14],"or":[15,47,208],"continuous":[16],"state":[17],"spaces,":[18],"approximate":[19],"policy":[20],"iteration":[21],"(API)":[22],"has":[23,121],"received":[24],"increasing":[25],"attention":[26],"in":[27,34,99,128,152,223,237,252],"the":[28,35,44,110,124,130,143,157,188,202,212,219,226,246,249],"past":[29],"decades.":[30],"One":[31],"open":[32],"problem":[33,236],"design":[36],"API":[38,126,191,214],"algorithms":[39,127,192],"is":[40,105,199],"how":[41],"to":[42,84,114,148,186],"construct":[43],"basis":[45],"functions":[46],"features":[48,67,131],"value":[50],"function":[51],"approximation":[52],"(VFA).":[53],"In":[54,155],"this":[55],"paper,":[56],"we":[57],"propose":[58],"novel":[60],"RL":[62,85],"approach":[63,72,120,159],"randomly":[65],"projected":[66],"VFA.":[69],"The":[70,93,118],"proposed":[71,119],"can":[73,89,134,160,205],"be":[74,90,135,146],"viewed":[75],"as":[76],"an":[77],"extension":[78,111],"extreme":[80],"machines":[82],"(ELMs)":[83],"so":[87],"it":[88],"called":[91],"ELM-API.":[92],"ELMs":[94,113],"have":[95],"been":[96],"popularly":[97],"studied":[98],"supervised":[100],"problems,":[102],"but":[103],"there":[104],"not":[106],"much":[107],"work":[108],"on":[109,177,229],"control":[116,181],"problems.":[117],"advantages":[122],"over":[123],"previous":[125,213],"that":[129,201],"VFA":[133],"quickly":[136],"generated":[137],"without":[138],"complex":[139],"parameter":[140],"selection":[141],"and":[142,163],"performance":[144,189,210],"will":[145],"adaptive":[147],"different":[149,194],"sample":[150,169],"sets":[151,170],"RL.":[154],"particular,":[156],"ELM-API":[158,203,222,250],"realize":[161],"fast":[162],"efficient":[164],"feature":[165,195],"reconstruction":[166],"when":[167],"training":[168],"are":[171,241],"relatively":[172],"small.":[173],"Comprehensive":[174],"simulation":[175,227],"studies":[176],"two":[178],"benchmark":[179],"were":[183],"carried":[184],"out":[185],"test":[187],"construction":[196],"methods.":[197],"It":[198],"shown":[200],"algorithm":[204,251],"obtain":[206],"comparable":[207],"better":[209],"than":[211],"approaches.":[215],"To":[216],"further":[217],"show":[218,245],"effectiveness":[220],"real-world":[224],"applications,":[225],"results":[228],"more":[231],"challenging":[232],"high-dimensional":[233],"lane-changing":[234,255],"dynamic":[238],"traffic":[239],"environment":[240],"also":[242],"reported,":[243],"which":[244],"capability":[247],"satisfactory":[254],"policies":[256],"high":[258],"data":[259],"efficiency.":[260]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
