{"id":"https://openalex.org/W3015302423","doi":"https://doi.org/10.1109/ijcnn48605.2020.9207098","title":"A Novel Update Mechanism for Q-Networks Based On Extreme Learning Machines","display_name":"A Novel Update Mechanism for Q-Networks Based On Extreme Learning Machines","publication_year":2020,"publication_date":"2020-07-01","ids":{"openalex":"https://openalex.org/W3015302423","doi":"https://doi.org/10.1109/ijcnn48605.2020.9207098","mag":"3015302423"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn48605.2020.9207098","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn48605.2020.9207098","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074200616","display_name":"Callum Wilson","orcid":"https://orcid.org/0000-0003-3736-1355"},"institutions":[{"id":"https://openalex.org/I181647926","display_name":"University of Strathclyde","ror":"https://ror.org/00n3w3b69","country_code":"GB","type":"education","lineage":["https://openalex.org/I181647926"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Callum Wilson","raw_affiliation_strings":["Department of Mechanical and Aerospace Engineering, University of Strathclyde, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical and Aerospace Engineering, University of Strathclyde, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I181647926"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018647644","display_name":"Annalisa Riccardi","orcid":"https://orcid.org/0000-0001-5305-9450"},"institutions":[{"id":"https://openalex.org/I181647926","display_name":"University of Strathclyde","ror":"https://ror.org/00n3w3b69","country_code":"GB","type":"education","lineage":["https://openalex.org/I181647926"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Annalisa Riccardi","raw_affiliation_strings":["Department of Mechanical and Aerospace Engineering, University of Strathclyde, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical and Aerospace Engineering, University of Strathclyde, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I181647926"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015624888","display_name":"Edmondo Minisci","orcid":"https://orcid.org/0000-0001-9951-8528"},"institutions":[{"id":"https://openalex.org/I181647926","display_name":"University of Strathclyde","ror":"https://ror.org/00n3w3b69","country_code":"GB","type":"education","lineage":["https://openalex.org/I181647926"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Edmondo Minisci","raw_affiliation_strings":["Department of Mechanical and Aerospace Engineering, University of Strathclyde, Glasgow, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Department of Mechanical and Aerospace Engineering, University of Strathclyde, Glasgow, United Kingdom","institution_ids":["https://openalex.org/I181647926"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5074200616"],"corresponding_institution_ids":["https://openalex.org/I181647926"],"apc_list":null,"apc_paid":null,"fwci":0.2651,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.6138084,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"2","issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9763000011444092,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9178593158721924},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.788425087928772},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.714110791683197},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6687750816345215},{"id":"https://openalex.org/keywords/extreme-learning-machine","display_name":"Extreme learning machine","score":0.6445397734642029},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6370616555213928},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5786816477775574},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.5560681223869324},{"id":"https://openalex.org/keywords/learning-classifier-system","display_name":"Learning classifier system","score":0.5435137748718262},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.5076361894607544},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.47610291838645935},{"id":"https://openalex.org/keywords/online-machine-learning","display_name":"Online machine learning","score":0.46964141726493835},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.45244520902633667},{"id":"https://openalex.org/keywords/instance-based-learning","display_name":"Instance-based learning","score":0.438048392534256},{"id":"https://openalex.org/keywords/function-approximation","display_name":"Function approximation","score":0.41899335384368896},{"id":"https://openalex.org/keywords/active-learning","display_name":"Active learning (machine learning)","score":0.3571244478225708},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07116013765335083}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9178593158721924},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.788425087928772},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.714110791683197},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6687750816345215},{"id":"https://openalex.org/C2780150128","wikidata":"https://www.wikidata.org/wiki/Q21948731","display_name":"Extreme learning machine","level":3,"score":0.6445397734642029},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6370616555213928},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5786816477775574},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.5560681223869324},{"id":"https://openalex.org/C199190896","wikidata":"https://www.wikidata.org/wiki/Q3509276","display_name":"Learning classifier system","level":3,"score":0.5435137748718262},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.5076361894607544},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.47610291838645935},{"id":"https://openalex.org/C115903097","wikidata":"https://www.wikidata.org/wiki/Q7094097","display_name":"Online machine learning","level":3,"score":0.46964141726493835},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.45244520902633667},{"id":"https://openalex.org/C24138899","wikidata":"https://www.wikidata.org/wiki/Q17141258","display_name":"Instance-based learning","level":3,"score":0.438048392534256},{"id":"https://openalex.org/C91873725","wikidata":"https://www.wikidata.org/wiki/Q3445816","display_name":"Function approximation","level":3,"score":0.41899335384368896},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.3571244478225708},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07116013765335083},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn48605.2020.9207098","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn48605.2020.9207098","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W46130386","https://openalex.org/W1757796397","https://openalex.org/W1914583973","https://openalex.org/W1980516134","https://openalex.org/W1985368534","https://openalex.org/W1993717606","https://openalex.org/W1994280577","https://openalex.org/W2067444778","https://openalex.org/W2091565802","https://openalex.org/W2111072639","https://openalex.org/W2113207845","https://openalex.org/W2121863487","https://openalex.org/W2124175081","https://openalex.org/W2139162305","https://openalex.org/W2139418546","https://openalex.org/W2141559645","https://openalex.org/W2145339207","https://openalex.org/W2154852616","https://openalex.org/W2155968351","https://openalex.org/W2158782408","https://openalex.org/W2257979135","https://openalex.org/W2289659279","https://openalex.org/W2301541953","https://openalex.org/W2746553466","https://openalex.org/W2754517384","https://openalex.org/W2919115771","https://openalex.org/W2963120839","https://openalex.org/W2964043796","https://openalex.org/W3011120880","https://openalex.org/W4214717370","https://openalex.org/W4298857966","https://openalex.org/W6601865881","https://openalex.org/W6637967152","https://openalex.org/W6677088747","https://openalex.org/W6678114464","https://openalex.org/W6692846177","https://openalex.org/W6696156361","https://openalex.org/W6744123322","https://openalex.org/W6775686901","https://openalex.org/W6780559895"],"related_works":["https://openalex.org/W4205569898","https://openalex.org/W3140225428","https://openalex.org/W3196155444","https://openalex.org/W2766258251","https://openalex.org/W2610686804","https://openalex.org/W4321844043","https://openalex.org/W2230868825","https://openalex.org/W2143680741","https://openalex.org/W3210156800","https://openalex.org/W2171128163"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,6,90,95,130,139],"is":[2,61,108],"a":[3,93,119,127,142],"popular":[4],"machine":[5],"paradigm":[7],"which":[8,51],"can":[9],"find":[10],"near":[11],"optimal":[12],"solutions":[13],"to":[14,31,69,87,92,118,141],"complex":[15],"problems.":[16],"Most":[17],"often,":[18],"these":[19],"procedures":[20],"involve":[21],"function":[22],"approximation":[23],"using":[24],"neural":[25,76],"networks":[26,77],"with":[27],"gradient":[28,102],"based":[29,103],"updates":[30],"optimise":[32],"weights":[33],"for":[34],"the":[35,72,98,123],"problem":[36,96,131],"being":[37],"considered.":[38],"While":[39],"this":[40],"common":[41],"approach":[42],"generally":[43],"works":[44],"well,":[45],"there":[46],"are":[47,52],"other":[48],"update":[49],"mechanisms":[50],"largely":[53],"unexplored":[54],"in":[55,97],"reinforcement":[56,94,129],"learning.":[57],"One":[58],"such":[59],"mechanism":[60],"Extreme":[62,110],"Learning":[63],"Machines.":[64],"These":[65],"were":[66],"initially":[67],"proposed":[68],"drastically":[70],"improve":[71],"training":[73],"speed":[74],"of":[75],"and":[78,133],"have":[79],"since":[80],"seen":[81],"many":[82],"applications.":[83],"Here":[84],"we":[85],"attempt":[86],"apply":[88],"extreme":[89],"machines":[91],"same":[99],"manner":[100],"as":[101],"updates.":[104],"This":[105],"new":[106],"algorithm":[107],"called":[109],"Q-Learning":[111],"Machine":[112],"(EQLM).":[113],"We":[114],"compare":[115],"its":[116],"performance":[117,140],"typical":[120],"Q-Network":[121],"on":[122],"cart-pole":[124],"task":[125],"-":[126,132],"benchmark":[128],"show":[134],"EQLM":[135],"has":[136],"similar":[137],"long-term":[138],"Q-Network.":[143]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
