{"id":"https://openalex.org/W4415239912","doi":"https://doi.org/10.48550/arxiv.2508.14536","title":"Beyond ReLU: Chebyshev-DQN for Enhanced Deep Q-Networks","display_name":"Beyond ReLU: Chebyshev-DQN for Enhanced Deep Q-Networks","publication_year":2025,"publication_date":"2025-08-20","ids":{"openalex":"https://openalex.org/W4415239912","doi":"https://doi.org/10.48550/arxiv.2508.14536"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2508.14536","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.14536","pdf_url":"https://arxiv.org/pdf/2508.14536","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2508.14536","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092536120","display_name":"Saman Yazdannik","orcid":"https://orcid.org/0009-0007-8243-3844"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yazdannik, Saman","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016811093","display_name":"Morteza Tayefi","orcid":"https://orcid.org/0000-0002-2773-2493"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tayefi, Morteza","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5120021796","display_name":"Shamim Sanisales","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sanisales, Shamim","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5092536120"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.8641999959945679,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.8641999959945679,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12676","display_name":"Machine Learning and ELM","score":0.8490999937057495,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.810699999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8070999979972839},{"id":"https://openalex.org/keywords/polynomial","display_name":"Polynomial","score":0.670799970626831},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6424999833106995},{"id":"https://openalex.org/keywords/chebyshev-polynomials","display_name":"Chebyshev polynomials","score":0.6121000051498413},{"id":"https://openalex.org/keywords/degree","display_name":"Degree (music)","score":0.5554999709129333},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.487199991941452},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.45890000462532043},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.42410001158714294}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8070999979972839},{"id":"https://openalex.org/C90119067","wikidata":"https://www.wikidata.org/wiki/Q43260","display_name":"Polynomial","level":2,"score":0.670799970626831},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6424999833106995},{"id":"https://openalex.org/C129785596","wikidata":"https://www.wikidata.org/wiki/Q619511","display_name":"Chebyshev polynomials","level":2,"score":0.6121000051498413},{"id":"https://openalex.org/C2775997480","wikidata":"https://www.wikidata.org/wiki/Q586277","display_name":"Degree (music)","level":2,"score":0.5554999709129333},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5202999711036682},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.487199991941452},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.45890000462532043},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44839999079704285},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.42410001158714294},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4018999934196472},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.38499999046325684},{"id":"https://openalex.org/C91873725","wikidata":"https://www.wikidata.org/wiki/Q3445816","display_name":"Function approximation","level":3,"score":0.38100001215934753},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.37299999594688416},{"id":"https://openalex.org/C25878781","wikidata":"https://www.wikidata.org/wiki/Q1473607","display_name":"Degree of a polynomial","level":3,"score":0.3716999888420105},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3517000079154968},{"id":"https://openalex.org/C145242015","wikidata":"https://www.wikidata.org/wiki/Q774123","display_name":"Approximation theory","level":2,"score":0.3375000059604645},{"id":"https://openalex.org/C21424316","wikidata":"https://www.wikidata.org/wiki/Q718621","display_name":"Chebyshev filter","level":2,"score":0.33219999074935913},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.320499986410141},{"id":"https://openalex.org/C5917680","wikidata":"https://www.wikidata.org/wiki/Q2621825","display_name":"Basis function","level":2,"score":0.2980000078678131},{"id":"https://openalex.org/C311688","wikidata":"https://www.wikidata.org/wiki/Q2393193","display_name":"Time complexity","level":2,"score":0.2978000044822693},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.29339998960494995},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.2727999985218048}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2508.14536","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.14536","pdf_url":"https://arxiv.org/pdf/2508.14536","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2508.14536","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2508.14536","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2508.14536","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.14536","pdf_url":"https://arxiv.org/pdf/2508.14536","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4415239912.pdf","grobid_xml":"https://content.openalex.org/works/W4415239912.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"performance":[1],"of":[2,12,78,114,146,168],"Deep":[3],"Q-Networks":[4],"(DQN)":[5],"is":[6,149],"critically":[7],"dependent":[8],"on":[9,99],"the":[10,20,35,51,61,73,84,100,120,134,144,166,180],"ability":[11],"its":[13],"underlying":[14],"neural":[15],"network":[16],"to":[17,32,64,161],"accurately":[18],"approximate":[19],"action-value":[21],"function.":[22],"Standard":[23],"function":[24,75],"approximators,":[25],"such":[26],"as":[27,153],"multi-layer":[28],"perceptrons,":[29],"may":[30],"struggle":[31],"efficiently":[33,89],"represent":[34],"complex":[36],"value":[37],"landscapes":[38],"inherent":[39],"in":[40,173,183],"many":[41],"reinforcement":[42,175],"learning":[43,176],"problems.":[44],"This":[45,163],"paper":[46],"introduces":[47],"a":[48,56,66,107,111,123,150,154],"novel":[49],"architecture,":[50],"Chebyshev-DQN":[52],"(Ch-DQN),":[53],"which":[54],"integrates":[55],"Chebyshev":[57,79],"polynomial":[58,125,147,171],"basis":[59],"into":[60],"DQN":[62,109],"framework":[63],"create":[65],"more":[67,88],"effective":[68],"feature":[69],"representation.":[70],"By":[71],"leveraging":[72],"powerful":[74],"approximation":[76],"properties":[77],"polynomials,":[80],"we":[81,140],"hypothesize":[82],"that":[83,119,143],"Ch-DQN":[85,121],"can":[86,158],"learn":[87],"and":[90,103],"achieve":[91],"higher":[92],"performance.":[93],"We":[94],"evaluate":[95],"our":[96],"proposed":[97],"model":[98,184],"CartPole-v1":[101],"benchmark":[102],"compare":[104],"it":[105],"against":[106],"standard":[108],"with":[110,122],"comparable":[112],"number":[113],"parameters.":[115],"Our":[116],"results":[117],"demonstrate":[118],"moderate":[124],"degree":[126,148,156],"(N=4)":[127],"achieves":[128],"significantly":[129],"better":[130],"asymptotic":[131],"performance,":[132],"outperforming":[133],"baseline":[135],"by":[136],"approximately":[137],"39\\%.":[138],"However,":[139],"also":[141,178],"find":[142],"choice":[145],"critical":[151],"hyperparameter,":[152],"high":[155],"(N=8)":[157],"be":[159],"detrimental":[160],"learning.":[162],"work":[164],"validates":[165],"potential":[167],"using":[169],"orthogonal":[170],"bases":[172],"deep":[174],"while":[177],"highlighting":[179],"trade-offs":[181],"involved":[182],"complexity.":[185]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-16T00:00:00"}
