{"id":"https://openalex.org/W2009533501","doi":"https://doi.org/10.1016/0004-3702(94)00011-o","title":"Learning to act using real-time dynamic programming","display_name":"Learning to act using real-time dynamic programming","publication_year":1995,"publication_date":"1995-01-01","ids":{"openalex":"https://openalex.org/W2009533501","doi":"https://doi.org/10.1016/0004-3702(94)00011-o","mag":"2009533501"},"language":"en","primary_location":{"id":"doi:10.1016/0004-3702(94)00011-o","is_oa":false,"landing_page_url":"https://doi.org/10.1016/0004-3702(94)00011-o","pdf_url":null,"source":{"id":"https://openalex.org/S196139623","display_name":"Artificial Intelligence","issn_l":"0004-3702","issn":["0004-3702","1872-7921"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089808068","display_name":"Andrew G. Barto","orcid":null},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Andrew G. Barto","raw_affiliation_strings":["Department of Computer Science, University of Massachusetts, Amherst, MA 01003, USA","Dept. of Computer Science, University of Massachusetts. Amherst, MA 01003, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Massachusetts, Amherst, MA 01003, USA","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"Dept. of Computer Science, University of Massachusetts. Amherst, MA 01003, USA","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081885151","display_name":"Steven J. Bradtke","orcid":null},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Steven J. Bradtke","raw_affiliation_strings":["Department of Computer Science, University of Massachusetts, Amherst, MA 01003, USA","Dept. of Computer Science, University of Massachusetts. Amherst, MA 01003, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Massachusetts, Amherst, MA 01003, USA","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"Dept. of Computer Science, University of Massachusetts. Amherst, MA 01003, USA","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065366930","display_name":"Satinder Singh","orcid":"https://orcid.org/0000-0002-2736-7641"},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Satinder P. Singh","raw_affiliation_strings":["Department of Computer Science, University of Massachusetts, Amherst, MA 01003, USA","Dept. of Computer Science, University of Massachusetts. Amherst, MA 01003, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Massachusetts, Amherst, MA 01003, USA","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"Dept. of Computer Science, University of Massachusetts. Amherst, MA 01003, USA","institution_ids":["https://openalex.org/I24603500"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5089808068"],"corresponding_institution_ids":["https://openalex.org/I24603500"],"apc_list":{"value":3670,"currency":"USD","value_usd":3670},"apc_paid":null,"fwci":75.2868,"has_fulltext":false,"cited_by_count":1109,"citation_normalized_percentile":{"value":0.99953002,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"72","issue":"1-2","first_page":"81","last_page":"138"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9869999885559082,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.76026451587677},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7192804217338562},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6013480424880981},{"id":"https://openalex.org/keywords/dynamic-programming","display_name":"Dynamic programming","score":0.597110390663147},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.5778990387916565},{"id":"https://openalex.org/keywords/asynchronous-communication","display_name":"Asynchronous communication","score":0.5746535062789917},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.5304011106491089},{"id":"https://openalex.org/keywords/temporal-difference-learning","display_name":"Temporal difference learning","score":0.47965624928474426},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.42634958028793335},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.22741085290908813}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.76026451587677},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7192804217338562},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6013480424880981},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.597110390663147},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.5778990387916565},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.5746535062789917},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.5304011106491089},{"id":"https://openalex.org/C196340769","wikidata":"https://www.wikidata.org/wiki/Q7698910","display_name":"Temporal difference learning","level":3,"score":0.47965624928474426},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.42634958028793335},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.22741085290908813},{"id":"https://openalex.org/C126322002","wikidata":"https://www.wikidata.org/wiki/Q11180","display_name":"Internal medicine","level":1,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0}],"mesh":[],"locations_count":8,"locations":[{"id":"doi:10.1016/0004-3702(94)00011-o","is_oa":false,"landing_page_url":"https://doi.org/10.1016/0004-3702(94)00011-o","pdf_url":null,"source":{"id":"https://openalex.org/S196139623","display_name":"Artificial Intelligence","issn_l":"0004-3702","issn":["0004-3702","1872-7921"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:scholarworks.umass.edu:cs_faculty_pubs-1352","is_oa":false,"landing_page_url":"https://scholarworks.umass.edu/cs_faculty_pubs/353","pdf_url":null,"source":{"id":"https://openalex.org/S4306402240","display_name":"ScholarWorks@UMassAmherst (University of Massachusetts Amherst)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I24603500","host_organization_name":"University of Massachusetts Amherst","host_organization_lineage":["https://openalex.org/I24603500"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computer Science Department Faculty Publication Series","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.117.6173","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.117.6173","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www-anw.cs.umass.edu/pubs/1995_96/barto_bs_AI95.ps.gz","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.38.7343","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.38.7343","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ftp://ftp.cis.ohio-state.edu/pub/neuroprose/barto.realtime-dp.ps.Z","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.43.6020","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.43.6020","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ftp://ftp.cs.umass.edu/pub/techrept/techreport/1993/UM-CS-1993-002.ps","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.47.9423","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.47.9423","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ftp://ftp.cs.colorado.edu/users/baveja/Papers/realtime-dp.ps.gz","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.84.3495","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.84.3495","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.ualberta.ca/~bulitko/F05/CMPUT651/papers/RTDP.pdf","raw_type":"text"},{"id":"pmh:oai:scholarworks.umass.edu:20.500.14394/10018","is_oa":false,"landing_page_url":"https://hdl.handle.net/20.500.14394/10018","pdf_url":null,"source":{"id":"https://openalex.org/S4306402057","display_name":"Scholarworks (University of Massachusetts Amherst)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I24603500","host_organization_name":"University of Massachusetts Amherst","host_organization_lineage":["https://openalex.org/I24603500"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"published","raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":149,"referenced_works":["https://openalex.org/W17303806","https://openalex.org/W20283819","https://openalex.org/W23603061","https://openalex.org/W24691574","https://openalex.org/W25062087","https://openalex.org/W32403112","https://openalex.org/W46130386","https://openalex.org/W50296447","https://openalex.org/W65193931","https://openalex.org/W111328409","https://openalex.org/W132264163","https://openalex.org/W354832773","https://openalex.org/W569156507","https://openalex.org/W640072212","https://openalex.org/W647344759","https://openalex.org/W658381347","https://openalex.org/W1491843047","https://openalex.org/W1505156375","https://openalex.org/W1522632257","https://openalex.org/W1545148916","https://openalex.org/W1551329771","https://openalex.org/W1555519929","https://openalex.org/W1557517019","https://openalex.org/W1565134770","https://openalex.org/W1569296262","https://openalex.org/W1572401739","https://openalex.org/W1573503290","https://openalex.org/W1586172133","https://openalex.org/W1586504939","https://openalex.org/W1595634327","https://openalex.org/W1596324102","https://openalex.org/W1597009674","https://openalex.org/W1597966850","https://openalex.org/W1600437712","https://openalex.org/W1603765807","https://openalex.org/W1610678877","https://openalex.org/W1612069379","https://openalex.org/W1628475528","https://openalex.org/W1640646391","https://openalex.org/W1931792391","https://openalex.org/W1964377184","https://openalex.org/W1968088166","https://openalex.org/W1969166509","https://openalex.org/W1969483458","https://openalex.org/W1971129545","https://openalex.org/W1979071892","https://openalex.org/W1982997797","https://openalex.org/W1990005421","https://openalex.org/W1997696513","https://openalex.org/W2010549090","https://openalex.org/W2020609518","https://openalex.org/W2021061679","https://openalex.org/W2024060531","https://openalex.org/W2030874472","https://openalex.org/W2035446426","https://openalex.org/W2039439610","https://openalex.org/W2040598998","https://openalex.org/W2045031658","https://openalex.org/W2045374782","https://openalex.org/W2051945694","https://openalex.org/W2054940200","https://openalex.org/W2061294832","https://openalex.org/W2064349031","https://openalex.org/W2067352298","https://openalex.org/W2082287757","https://openalex.org/W2091565802","https://openalex.org/W2100677568","https://openalex.org/W2100684997","https://openalex.org/W2102512214","https://openalex.org/W2103626435","https://openalex.org/W2106017103","https://openalex.org/W2106639887","https://openalex.org/W2112483970","https://openalex.org/W2118426468","https://openalex.org/W2119380668","https://openalex.org/W2121832485","https://openalex.org/W2122633037","https://openalex.org/W2129120309","https://openalex.org/W2135630072","https://openalex.org/W2141559645","https://openalex.org/W2149611281","https://openalex.org/W2151742051","https://openalex.org/W2155677642","https://openalex.org/W2155872498","https://openalex.org/W2158091072","https://openalex.org/W2161397207","https://openalex.org/W2161608691","https://openalex.org/W2341171179","https://openalex.org/W2341983526","https://openalex.org/W2413550626","https://openalex.org/W2540877599","https://openalex.org/W2567137345","https://openalex.org/W2914112863","https://openalex.org/W3011120880","https://openalex.org/W3015964010","https://openalex.org/W3022584652","https://openalex.org/W3041202696","https://openalex.org/W3121926921","https://openalex.org/W3183630977","https://openalex.org/W3198350258","https://openalex.org/W3213472335","https://openalex.org/W4243421009","https://openalex.org/W4247446124","https://openalex.org/W4252314834","https://openalex.org/W4285719527","https://openalex.org/W4298068217","https://openalex.org/W6600701548","https://openalex.org/W6600834042","https://openalex.org/W6600979164","https://openalex.org/W6601023721","https://openalex.org/W6601865881","https://openalex.org/W6602038105","https://openalex.org/W6602690695","https://openalex.org/W6604474294","https://openalex.org/W6608280181","https://openalex.org/W6629406372","https://openalex.org/W6630336746","https://openalex.org/W6631356907","https://openalex.org/W6633489894","https://openalex.org/W6633962305","https://openalex.org/W6634103402","https://openalex.org/W6634288218","https://openalex.org/W6634991393","https://openalex.org/W6635329781","https://openalex.org/W6635558854","https://openalex.org/W6635689168","https://openalex.org/W6635902665","https://openalex.org/W6636199354","https://openalex.org/W6636530465","https://openalex.org/W6636932949","https://openalex.org/W6642042007","https://openalex.org/W6649837222","https://openalex.org/W6675282414","https://openalex.org/W6675819118","https://openalex.org/W6675901991","https://openalex.org/W6677444215","https://openalex.org/W6678116171","https://openalex.org/W6678518843","https://openalex.org/W6679174265","https://openalex.org/W6680039697","https://openalex.org/W6681940304","https://openalex.org/W6682025713","https://openalex.org/W6683110158","https://openalex.org/W6704311137","https://openalex.org/W6775686901","https://openalex.org/W6799027959","https://openalex.org/W6804409665","https://openalex.org/W7043180619","https://openalex.org/W7054112703"],"related_works":["https://openalex.org/W2145363145","https://openalex.org/W2341346307","https://openalex.org/W2154399718","https://openalex.org/W4321463377","https://openalex.org/W1914583973","https://openalex.org/W2130711276","https://openalex.org/W4308828368","https://openalex.org/W3088331655","https://openalex.org/W1504584981","https://openalex.org/W3038962357"],"abstract_inverted_index":null,"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":17},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":20},{"year":2022,"cited_by_count":27},{"year":2021,"cited_by_count":41},{"year":2020,"cited_by_count":35},{"year":2019,"cited_by_count":35},{"year":2018,"cited_by_count":31},{"year":2017,"cited_by_count":23},{"year":2016,"cited_by_count":27},{"year":2015,"cited_by_count":34},{"year":2014,"cited_by_count":38},{"year":2013,"cited_by_count":49},{"year":2012,"cited_by_count":45}],"updated_date":"2026-04-06T07:47:59.780226","created_date":"2025-10-10T00:00:00"}
