{"id":"https://openalex.org/W4401725926","doi":"https://doi.org/10.1109/tiv.2024.3446823","title":"Smooth Filtering Neural Network for Reinforcement Learning","display_name":"Smooth Filtering Neural Network for Reinforcement Learning","publication_year":2024,"publication_date":"2024-08-21","ids":{"openalex":"https://openalex.org/W4401725926","doi":"https://doi.org/10.1109/tiv.2024.3446823"},"language":"en","primary_location":{"id":"doi:10.1109/tiv.2024.3446823","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tiv.2024.3446823","pdf_url":null,"source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084395808","display_name":"Wenxuan Wang","orcid":"https://orcid.org/0000-0002-0193-816X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wenxuan Wang","raw_affiliation_strings":["State Key Laboratory of Intelligent Green Vehicle and Mobility, School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-0193-816X","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Intelligent Green Vehicle and Mobility, School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067909017","display_name":"Jingliang Duan","orcid":"https://orcid.org/0000-0002-3697-1576"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingliang Duan","raw_affiliation_strings":["School of Mechanical Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3697-1576","affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109766535","display_name":"Xujie Song","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xujie Song","raw_affiliation_strings":["State Key Laboratory of Intelligent Green Vehicle and Mobility, School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-9155-3035","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Intelligent Green Vehicle and Mobility, School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028599970","display_name":"Liming Xiao","orcid":"https://orcid.org/0009-0006-4566-1103"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liming Xiao","raw_affiliation_strings":["School of Mechanical Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0006-4566-1103","affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026361465","display_name":"Liangfa Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liangfa Chen","raw_affiliation_strings":["School of Mechanical Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0002-8442-3205","affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102869516","display_name":"Yinuo Wang","orcid":"https://orcid.org/0009-0006-8117-4425"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yinuo Wang","raw_affiliation_strings":["State Key Laboratory of Intelligent Green Vehicle and Mobility, School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Intelligent Green Vehicle and Mobility, School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100640936","display_name":"Bo Cheng","orcid":"https://orcid.org/0000-0002-1753-2922"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Cheng","raw_affiliation_strings":["State Key Laboratory of Intelligent Green Vehicle and Mobility, School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-1753-2922","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Intelligent Green Vehicle and Mobility, School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100747108","display_name":"Shengbo Eben Li","orcid":"https://orcid.org/0000-0003-4923-3633"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengbo Eben Li","raw_affiliation_strings":["School of Vehicle and Mobility &amp; College of AI, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-4923-3633","affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility &amp; College of AI, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5084395808"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.9934,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.79987616,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":"10","issue":"5","first_page":"3103","last_page":"3112"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.4975999891757965,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.4975999891757965,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7595423460006714},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6020757555961609},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5668513774871826},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5173415541648865},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5164061188697815},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.17480596899986267},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.04608306288719177}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7595423460006714},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6020757555961609},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5668513774871826},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5173415541648865},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5164061188697815},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.17480596899986267},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.04608306288719177}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tiv.2024.3446823","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tiv.2024.3446823","pdf_url":null,"source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W2012451615","https://openalex.org/W2050838777","https://openalex.org/W2103285838","https://openalex.org/W2145339207","https://openalex.org/W2498017881","https://openalex.org/W2944851425","https://openalex.org/W2951360122","https://openalex.org/W2962890638","https://openalex.org/W2962949934","https://openalex.org/W3015082424","https://openalex.org/W3096541186","https://openalex.org/W3100789280","https://openalex.org/W3113349091","https://openalex.org/W3135682060","https://openalex.org/W3167264379","https://openalex.org/W3199764406","https://openalex.org/W3207657697","https://openalex.org/W4224216677","https://openalex.org/W4226176749","https://openalex.org/W4285965606","https://openalex.org/W4294719302","https://openalex.org/W4312734823","https://openalex.org/W4323897042","https://openalex.org/W4362650413","https://openalex.org/W4366158867","https://openalex.org/W4376481351","https://openalex.org/W4390422151","https://openalex.org/W4394006698","https://openalex.org/W6922480057"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,105],"(RL)":[2],"has":[3],"demonstrated":[4],"considerable":[5],"potential":[6],"in":[7,33,52,228],"addressing":[8],"intricate":[9],"control":[10,18,24,79,180,218],"and":[11,19,46,65,136,182,200],"decision":[12],"problems":[13],"such":[14],"as":[15],"vehicle":[16],"tracking":[17],"obstacle":[20,187],"avoidance.":[21],"Nonetheless,":[22],"the":[23,34,50,76,82,101,123,142,172,229],"policies":[25],"acquired":[26],"through":[27,176],"RL":[28,152,167],"often":[29,67],"lack":[30],"smoothness":[31,77,211],"even":[32,47],"presence":[35],"of":[36,78,90,122,145,174],"minor":[37],"noises":[38,215],"or":[39,62],"disturbances,":[40],"which":[41],"may":[42],"induce":[43],"oscillations,":[44],"overheating,":[45],"damage":[48],"to":[49,99,162,165,224,234],"system":[51],"real-world":[53,184],"applications.":[54],"Existing":[55],"methods":[56],"handle":[57],"this":[58],"issue":[59,103],"from":[60,81],"temporal":[61],"spatial":[63],"domains":[64],"are":[66],"tightly":[68],"coupled":[69],"with":[70,93,114,193],"specific":[71],"tasks.":[72],"This":[73],"paper":[74],"studies":[75],"policy":[80,210],"frequency":[83],"domain":[84],"perspective.":[85],"We":[86],"propose":[87],"a":[88,106,150,183,225],"class":[89],"neural":[91],"networks":[92],"low-pass":[94,120],"filtering":[95,116,121,127,143,163],"ability,":[96],"named":[97],"Smonet,":[98,146],"alleviate":[100],"non-smooth":[102],"by":[104,155],"low-frequency":[107],"representation":[108],"within":[109],"hidden":[110],"layers.":[111],"Smonet":[112,175,207],"features":[113],"serial":[115],"layers":[117],"responsible":[118],"for":[119],"input":[124],"signal.":[125],"Each":[126],"layer":[128],"contains":[129],"multiple":[130],"inertia":[131],"cells,":[132],"one":[133,137],"adaptive":[134],"cell,":[135],"activation":[138],"layer.":[139],"To":[140],"facilitate":[141],"ability":[144],"we":[147,170],"further":[148],"proposed":[149],"Smonet-based":[151],"training":[153],"method":[154],"integrating":[156],"an":[157],"extra":[158],"regularization":[159],"term":[160],"relating":[161],"factors":[164],"standard":[166],"loss.":[168],"Finally,":[169],"assess":[171],"efficacy":[173],"diverse":[177],"simulated":[178],"robot":[179,186],"tasks":[181],"mobile":[185],"avoidance":[188],"experiment,":[189],"comparing":[190],"its":[191],"performance":[192],"two":[194],"commonly":[195],"utilized":[196],"networks,":[197],"multi-layer":[198],"perceptron":[199],"gated":[201],"recurrent":[202],"unit.":[203],"Results":[204],"indicate":[205],"that":[206],"consistently":[208],"enhances":[209],"under":[212],"various":[213],"observation":[214],"without":[216],"compromising":[217],"performance.":[219],"Notably,":[220],"it":[221],"achieves":[222],"up":[223],"72.7%":[226],"reduction":[227],"action":[230],"fluctuation":[231],"ratio":[232],"compared":[233],"traditional":[235],"network":[236],"structures.":[237]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
