{"id":"https://openalex.org/W2550302514","doi":"https://doi.org/10.1109/ijcnn.2016.7727655","title":"A general adaptive dynamic programming approach with experience replay","display_name":"A general adaptive dynamic programming approach with experience replay","publication_year":2016,"publication_date":"2016-07-01","ids":{"openalex":"https://openalex.org/W2550302514","doi":"https://doi.org/10.1109/ijcnn.2016.7727655","mag":"2550302514"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn.2016.7727655","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2016.7727655","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5115604616","display_name":"Bin Wang","orcid":"https://orcid.org/0000-0002-0267-3749"},"institutions":[{"id":"https://openalex.org/I34949971","display_name":"University of Jinan","ror":"https://ror.org/02mjz6f26","country_code":"CN","type":"education","lineage":["https://openalex.org/I34949971"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Bin Wang","raw_affiliation_strings":["School of Electrical Engineering, University of Jinan, Jinan, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, University of Jinan, Jinan, China","institution_ids":["https://openalex.org/I34949971"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100624298","display_name":"Dongbin Zhao","orcid":"https://orcid.org/0000-0001-8218-9633"},"institutions":[{"id":"https://openalex.org/I4210094879","display_name":"Shandong Institute of Automation","ror":"https://ror.org/00qdtba35","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210094879","https://openalex.org/I4210142748"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongbin Zhao","raw_affiliation_strings":["The State Key Laboratory of Management and Control for Complex Systems Institute of Automation, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"The State Key Laboratory of Management and Control for Complex Systems Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210094879","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101738859","display_name":"Jin Cheng","orcid":"https://orcid.org/0000-0003-0378-0092"},"institutions":[{"id":"https://openalex.org/I34949971","display_name":"University of Jinan","ror":"https://ror.org/02mjz6f26","country_code":"CN","type":"education","lineage":["https://openalex.org/I34949971"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Cheng","raw_affiliation_strings":["School of Electrical Engineering, University of Jinan, Jinan, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, University of Jinan, Jinan, China","institution_ids":["https://openalex.org/I34949971"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068847367","display_name":"Yuan Xu","orcid":"https://orcid.org/0000-0002-5966-945X"},"institutions":[{"id":"https://openalex.org/I34949971","display_name":"University of Jinan","ror":"https://ror.org/02mjz6f26","country_code":"CN","type":"education","lineage":["https://openalex.org/I34949971"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuan Xu","raw_affiliation_strings":["School of Electrical Engineering, University of Jinan, Jinan, China"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering, University of Jinan, Jinan, China","institution_ids":["https://openalex.org/I34949971"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100617027","display_name":"Yueyang Li","orcid":"https://orcid.org/0000-0002-1614-0302"},"institutions":[{"id":"https://openalex.org/I154099455","display_name":"Shandong University","ror":"https://ror.org/0207yh398","country_code":"CN","type":"education","lineage":["https://openalex.org/I154099455"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yueyang Li","raw_affiliation_strings":["Shandong University, Jinan, Shandong, CN"],"affiliations":[{"raw_affiliation_string":"Shandong University, Jinan, Shandong, CN","institution_ids":["https://openalex.org/I154099455"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5115604616"],"corresponding_institution_ids":["https://openalex.org/I34949971"],"apc_list":null,"apc_paid":null,"fwci":1.0454,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.80615953,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"81","issue":null,"first_page":"3550","last_page":"3555"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9290000200271606,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8381880521774292},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6346591711044312},{"id":"https://openalex.org/keywords/dynamic-programming","display_name":"Dynamic programming","score":0.633311927318573},{"id":"https://openalex.org/keywords/feed-forward","display_name":"Feed forward","score":0.5566360950469971},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5410929322242737},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5131005048751831},{"id":"https://openalex.org/keywords/feedforward-neural-network","display_name":"Feedforward neural network","score":0.5049424767494202},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4890473783016205},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.4671342372894287},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.2016892433166504},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.12300765514373779},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.08293142914772034},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08131346106529236}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8381880521774292},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6346591711044312},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.633311927318573},{"id":"https://openalex.org/C38858127","wikidata":"https://www.wikidata.org/wiki/Q5441228","display_name":"Feed forward","level":2,"score":0.5566360950469971},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5410929322242737},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5131005048751831},{"id":"https://openalex.org/C47702885","wikidata":"https://www.wikidata.org/wiki/Q5441227","display_name":"Feedforward neural network","level":3,"score":0.5049424767494202},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4890473783016205},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.4671342372894287},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.2016892433166504},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.12300765514373779},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.08293142914772034},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08131346106529236},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn.2016.7727655","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2016.7727655","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1513689897","https://openalex.org/W1626155273","https://openalex.org/W1629039467","https://openalex.org/W1969959431","https://openalex.org/W1974883306","https://openalex.org/W1980620643","https://openalex.org/W1982262386","https://openalex.org/W1999035253","https://openalex.org/W2050838777","https://openalex.org/W2085194340","https://openalex.org/W2117056304","https://openalex.org/W2141559645","https://openalex.org/W2145339207","https://openalex.org/W2165501837","https://openalex.org/W2963864421","https://openalex.org/W4214717370","https://openalex.org/W6684921986"],"related_works":["https://openalex.org/W2115072676","https://openalex.org/W2357447513","https://openalex.org/W4311212821","https://openalex.org/W2045727192","https://openalex.org/W2378845890","https://openalex.org/W2102065768","https://openalex.org/W4390752998","https://openalex.org/W1529660427","https://openalex.org/W3121106353","https://openalex.org/W2158578859"],"abstract_inverted_index":{"Experience":[0],"replay":[1,26],"is":[2,28],"a":[3,55,67,77],"promising":[4],"approach":[5,22],"to":[6,33,96,120],"improve":[7],"the":[8,24,35,46,64,81,84,87,90,98,101,105,111,122,126],"learning":[9,65,123],"efficiency":[10,124],"of":[11,69,83,100,110,125],"adaptive":[12,18],"dynamic":[13,19],"programming.":[14],"A":[15],"general":[16],"model-free":[17],"programming":[20],"(ADP)":[21],"with":[23,54,59],"experience":[25],"technology":[27],"investigated":[29],"in":[30,39,76,89],"this":[31],"paper":[32],"solve":[34],"optimal":[36],"control":[37],"problems":[38],"continuous":[40],"state":[41],"and":[42,49,104,115],"action":[43,50,102],"spaces.":[44],"Both":[45],"critic":[47,106],"network":[48,51,58,103],"are":[52,74,93,113,118],"modeled":[53],"feedforward":[56],"neural":[57,85],"one":[60],"hidden":[61],"layer.":[62],"During":[63],"process,":[66],"number":[68],"recently":[70],"observed":[71],"data":[72,88],"samples":[73],"recorded":[75],"database.":[78],"When":[79],"updating":[80],"parameters":[82],"networks,":[86],"sample":[91],"database":[92],"repeatedly":[94],"used":[95],"update":[97],"weights":[99],"network.":[107],"Implementation":[108],"details":[109],"algorithm":[112],"given,":[114],"simulation":[116],"experiments":[117],"utilized":[119],"verify":[121],"proposed":[127],"approach.":[128]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
