{"id":"https://openalex.org/W3203618099","doi":"https://doi.org/10.1109/access.2021.3117855","title":"Evaluation of Instance-Based Learning and Q-Learning Algorithms in Dynamic Environments","display_name":"Evaluation of Instance-Based Learning and Q-Learning Algorithms in Dynamic Environments","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3203618099","doi":"https://doi.org/10.1109/access.2021.3117855","mag":"3203618099"},"language":"en","primary_location":{"id":"doi:10.1109/access.2021.3117855","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3117855","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09558862.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09558862.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014436016","display_name":"Anmol Gupta","orcid":"https://orcid.org/0000-0003-0159-8780"},"institutions":[{"id":"https://openalex.org/I154851008","display_name":"Indian Institute of Technology Roorkee","ror":"https://ror.org/00582g326","country_code":"IN","type":"education","lineage":["https://openalex.org/I154851008"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Anmol Gupta","raw_affiliation_strings":["Pattern Recognition, Image processing, And Machine Learning Lab, Indian Institute of Technology Roorkee, Haridwar, India \u2013 247667. (e-mail: agupta@cs.iitr.ac.in)","PARIMAL, Indian Institute of Technology Roorkee, Haridwar, Roorkee, India"],"raw_orcid":"https://orcid.org/0000-0003-0159-8780","affiliations":[{"raw_affiliation_string":"Pattern Recognition, Image processing, And Machine Learning Lab, Indian Institute of Technology Roorkee, Haridwar, India \u2013 247667. (e-mail: agupta@cs.iitr.ac.in)","institution_ids":["https://openalex.org/I154851008"]},{"raw_affiliation_string":"PARIMAL, Indian Institute of Technology Roorkee, Haridwar, Roorkee, India","institution_ids":["https://openalex.org/I154851008"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036208317","display_name":"Partha Pratim Roy","orcid":"https://orcid.org/0000-0002-5735-5254"},"institutions":[{"id":"https://openalex.org/I154851008","display_name":"Indian Institute of Technology Roorkee","ror":"https://ror.org/00582g326","country_code":"IN","type":"education","lineage":["https://openalex.org/I154851008"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Partha Pratim Roy","raw_affiliation_strings":["Pattern Recognition, Image processing, And Machine Learning Lab, Indian Institute of Technology Roorkee, Haridwar, India \u2013 247667","PARIMAL, Indian Institute of Technology Roorkee, Haridwar, Roorkee, India"],"raw_orcid":"https://orcid.org/0000-0002-5735-5254","affiliations":[{"raw_affiliation_string":"Pattern Recognition, Image processing, And Machine Learning Lab, Indian Institute of Technology Roorkee, Haridwar, India \u2013 247667","institution_ids":["https://openalex.org/I154851008"]},{"raw_affiliation_string":"PARIMAL, Indian Institute of Technology Roorkee, Haridwar, Roorkee, India","institution_ids":["https://openalex.org/I154851008"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010689942","display_name":"Varun Dutt","orcid":"https://orcid.org/0000-0002-2151-8314"},"institutions":[{"id":"https://openalex.org/I9579091","display_name":"Indian Institute of Technology Mandi","ror":"https://ror.org/05r9r2f34","country_code":"IN","type":"education","lineage":["https://openalex.org/I9579091"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Varun Dutt","raw_affiliation_strings":["Applied Cognitive Science Laboratory, Indian Institute of Technology Mandi, Himachal Pradesh, India \u2013 175005","Applied Cognitive Science Laboratory, Indian Institute of Technology Mandi, Kamand, Himachal Pradesh, India"],"raw_orcid":"https://orcid.org/0000-0002-2151-8314","affiliations":[{"raw_affiliation_string":"Applied Cognitive Science Laboratory, Indian Institute of Technology Mandi, Himachal Pradesh, India \u2013 175005","institution_ids":["https://openalex.org/I9579091"]},{"raw_affiliation_string":"Applied Cognitive Science Laboratory, Indian Institute of Technology Mandi, Kamand, Himachal Pradesh, India","institution_ids":["https://openalex.org/I9579091"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":1.3993,"has_fulltext":true,"cited_by_count":15,"citation_normalized_percentile":{"value":0.85174914,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":"9","issue":null,"first_page":"138775","last_page":"138790"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.996399998664856,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7721293568611145},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7534710764884949},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.677516520023346},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.6508459448814392},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6161304712295532},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5998333692550659},{"id":"https://openalex.org/keywords/unsupervised-learning","display_name":"Unsupervised learning","score":0.5745754241943359},{"id":"https://openalex.org/keywords/instance-based-learning","display_name":"Instance-based learning","score":0.437517911195755},{"id":"https://openalex.org/keywords/dynamic-programming","display_name":"Dynamic programming","score":0.43537724018096924},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.41612038016319275}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7721293568611145},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7534710764884949},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.677516520023346},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.6508459448814392},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6161304712295532},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5998333692550659},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.5745754241943359},{"id":"https://openalex.org/C24138899","wikidata":"https://www.wikidata.org/wiki/Q17141258","display_name":"Instance-based learning","level":3,"score":0.437517911195755},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.43537724018096924},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.41612038016319275},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2021.3117855","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3117855","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09558862.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:a51fb151e90f4b03941e02bedb6740bb","is_oa":true,"landing_page_url":"https://doaj.org/article/a51fb151e90f4b03941e02bedb6740bb","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 9, Pp 138775-138790 (2021)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2021.3117855","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3117855","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09558862.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3203618099.pdf","grobid_xml":"https://content.openalex.org/works/W3203618099.grobid-xml"},"referenced_works_count":63,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W49761325","https://openalex.org/W117607193","https://openalex.org/W121023703","https://openalex.org/W150117506","https://openalex.org/W1509957369","https://openalex.org/W1564229172","https://openalex.org/W1570270509","https://openalex.org/W1829811225","https://openalex.org/W1924476928","https://openalex.org/W1968394721","https://openalex.org/W1971228271","https://openalex.org/W2005566784","https://openalex.org/W2028145673","https://openalex.org/W2044690406","https://openalex.org/W2047094503","https://openalex.org/W2048317417","https://openalex.org/W2058346590","https://openalex.org/W2059841094","https://openalex.org/W2060256879","https://openalex.org/W2070483480","https://openalex.org/W2071478538","https://openalex.org/W2078969783","https://openalex.org/W2084342166","https://openalex.org/W2092919341","https://openalex.org/W2096130600","https://openalex.org/W2097482594","https://openalex.org/W2108472495","https://openalex.org/W2111840892","https://openalex.org/W2120969335","https://openalex.org/W2121863487","https://openalex.org/W2145339207","https://openalex.org/W2150468603","https://openalex.org/W2158789702","https://openalex.org/W2163569945","https://openalex.org/W2167313771","https://openalex.org/W2167425257","https://openalex.org/W2226341935","https://openalex.org/W2398220880","https://openalex.org/W2575705757","https://openalex.org/W2604382266","https://openalex.org/W2749604329","https://openalex.org/W2792586727","https://openalex.org/W2907626093","https://openalex.org/W2971565213","https://openalex.org/W3100789280","https://openalex.org/W3101940057","https://openalex.org/W3103559770","https://openalex.org/W3103780890","https://openalex.org/W3154434624","https://openalex.org/W4214560811","https://openalex.org/W4214717370","https://openalex.org/W4248808685","https://openalex.org/W6602040102","https://openalex.org/W6604793289","https://openalex.org/W6604963999","https://openalex.org/W6606062670","https://openalex.org/W6630512393","https://openalex.org/W6633940122","https://openalex.org/W6712419019","https://openalex.org/W6757677476","https://openalex.org/W6780559895","https://openalex.org/W6794469413"],"related_works":["https://openalex.org/W3203657119","https://openalex.org/W4286952720","https://openalex.org/W2534140487","https://openalex.org/W3196155444","https://openalex.org/W3183560647","https://openalex.org/W4286799911","https://openalex.org/W4321844043","https://openalex.org/W4386394212","https://openalex.org/W4310801741","https://openalex.org/W3042291365"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,5,8,30,174,200],"is":[2,9,62,69],"an":[3,33,168],"unsupervised":[4],"algorithm,":[6],"where":[7],"based":[10,176],"upon":[11],"feedback":[12],"from":[13],"the":[14,53,58,82,93,103,108,118,125,154,161,171,192],"environment.":[15,105,121,156],"Prior":[16],"research":[17],"has":[18,43],"proposed":[19,166],"cognitive":[20,59],"(e.g.,":[21],"Instance-based":[22],"Learning":[23],"or":[24],"IBL)":[25],"and":[26,57,74,77,84,96,132,203],"statistical":[27,54],"(Q-learning)":[28],"reinforcement":[29,173],"algorithms.":[31,79],"However,":[32],"evaluation":[34],"of":[35,92,102,117,185],"these":[36],"algorithms":[37,110,175],"in":[38,153,191,201],"a":[39,50,99,114],"single":[40],"dynamic":[41,178,204],"environment":[42,137],"not":[44],"been":[45],"explored.":[46],"In":[47],"this":[48],"paper,":[49],"comparison":[51],"between":[52],"Q-learning":[55,76,83],"algorithm":[56,61,127,141,163,194],"IBL":[60,78,85,126,140,162,193],"presented.":[63],"A":[64],"well-known":[65],"environment,":[66],"\"Frozen":[67],"Lake,\"":[68],"used":[70,128],"to":[71,135,145,170],"train,":[72],"generalize,":[73],"scale":[75],"For":[80,106],"generalizing,":[81],"agents":[86],"were":[87,111],"trained":[88],"on":[89,98,113,177],"one":[90],"version":[91,101,116],"Frozen":[94,119],"Lake":[95,120],"tested":[97,112],"permuted":[100],"same":[104],"scaling,":[107],"two":[109],"larger":[115,155],"Results":[122],"revealed":[123],"that":[124,160],"less":[129],"training":[130],"time":[131],"generalized":[133],"better":[134],"different":[136],"variants.":[138],"The":[139,183],"was":[142],"also":[143],"able":[144],"show":[146],"scalability":[147],"by":[148],"retaining":[149],"its":[150],"superior":[151],"performance":[152],"These":[157],"results":[158],"indicate":[159],"could":[164],"be":[165],"as":[167,181,189],"alternative":[169],"standard":[172],"programming":[179],"such":[180],"Q-learning.":[182],"inclusion":[184],"human":[186],"factors":[187],"(such":[188],"memory)":[190],"makes":[195],"it":[196],"suitable":[197],"for":[198],"robust":[199],"complex":[202],"environments.":[205]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":5}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
