{"id":"https://openalex.org/W2166610875","doi":"https://doi.org/10.1145/1015330.1015359","title":"Learning and discovery of predictive state representations in dynamical systems with reset","display_name":"Learning and discovery of predictive state representations in dynamical systems with reset","publication_year":2004,"publication_date":"2004-01-01","ids":{"openalex":"https://openalex.org/W2166610875","doi":"https://doi.org/10.1145/1015330.1015359","mag":"2166610875"},"language":"en","primary_location":{"id":"doi:10.1145/1015330.1015359","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1015330.1015359","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Twenty-first international conference on Machine learning  - ICML '04","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066781741","display_name":"M. R. James","orcid":"https://orcid.org/0000-0003-2821-0133"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Michael R. James","raw_affiliation_strings":["University of Michigan, Ann Arbor, MI"],"affiliations":[{"raw_affiliation_string":"University of Michigan, Ann Arbor, MI","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103117754","display_name":"Satinder Singh","orcid":"https://orcid.org/0000-0002-8215-8295"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Satinder Singh","raw_affiliation_strings":["University of Michigan, Ann Arbor, MI"],"affiliations":[{"raw_affiliation_string":"University of Michigan, Ann Arbor, MI","institution_ids":["https://openalex.org/I27837315"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5066781741"],"corresponding_institution_ids":["https://openalex.org/I27837315"],"apc_list":null,"apc_paid":null,"fwci":9.7047,"has_fulltext":false,"cited_by_count":70,"citation_normalized_percentile":{"value":0.97971786,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"53","last_page":"53"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/observable","display_name":"Observable","score":0.7383942604064941},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.642183780670166},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6275904178619385},{"id":"https://openalex.org/keywords/dynamical-systems-theory","display_name":"Dynamical systems theory","score":0.6203694343566895},{"id":"https://openalex.org/keywords/reset","display_name":"Reset (finance)","score":0.607785701751709},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.6029155850410461},{"id":"https://openalex.org/keywords/operator","display_name":"Operator (biology)","score":0.5287777185440063},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4718199670314789},{"id":"https://openalex.org/keywords/dynamical-system","display_name":"Dynamical system (definition)","score":0.4468020796775818},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.41498520970344543},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4131455421447754},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3231954872608185}],"concepts":[{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.7383942604064941},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.642183780670166},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6275904178619385},{"id":"https://openalex.org/C79379906","wikidata":"https://www.wikidata.org/wiki/Q3174497","display_name":"Dynamical systems theory","level":2,"score":0.6203694343566895},{"id":"https://openalex.org/C2779795794","wikidata":"https://www.wikidata.org/wiki/Q7315343","display_name":"Reset (finance)","level":2,"score":0.607785701751709},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.6029155850410461},{"id":"https://openalex.org/C17020691","wikidata":"https://www.wikidata.org/wiki/Q139677","display_name":"Operator (biology)","level":5,"score":0.5287777185440063},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4718199670314789},{"id":"https://openalex.org/C33962884","wikidata":"https://www.wikidata.org/wiki/Q378637","display_name":"Dynamical system (definition)","level":3,"score":0.4468020796775818},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.41498520970344543},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4131455421447754},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3231954872608185},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C158448853","wikidata":"https://www.wikidata.org/wiki/Q425218","display_name":"Repressor","level":4,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C86339819","wikidata":"https://www.wikidata.org/wiki/Q407384","display_name":"Transcription factor","level":3,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C106159729","wikidata":"https://www.wikidata.org/wiki/Q2294553","display_name":"Financial economics","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/1015330.1015359","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1015330.1015359","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Twenty-first international conference on Machine learning  - ICML '04","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.107.7820","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.107.7820","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.eecs.umich.edu/~mrjames/resetPSRsdist.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.67.5179","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.67.5179","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://kingman.cs.ualberta.ca/_banff04/icml/pages/papers/117.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W1515891729","https://openalex.org/W1540337045","https://openalex.org/W1550098664","https://openalex.org/W1984735703","https://openalex.org/W2065087844","https://openalex.org/W2123542217","https://openalex.org/W2149960632","https://openalex.org/W2158282517","https://openalex.org/W2798909945","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W4250831671","https://openalex.org/W2230606337","https://openalex.org/W2089869689","https://openalex.org/W4388681848","https://openalex.org/W2078952919","https://openalex.org/W2945666329","https://openalex.org/W2617651062","https://openalex.org/W2330535098","https://openalex.org/W2377513064","https://openalex.org/W2952544653"],"abstract_inverted_index":{"Predictive":[0],"state":[1,32,43],"representations":[2],"(PSRs)":[3],"are":[4,50],"a":[5,130,147],"recently":[6],"proposed":[7,103],"way":[8],"of":[9,18,21,64,141,154],"modeling":[10],"controlled":[11,142],"dynamical":[12,143],"systems.":[13],"PSR-based":[14,56],"models":[15,57,172],"use":[16],"predictions":[17,68],"observable":[19,170],"outcomes":[20],"tests":[22,66],"that":[23,38,77,145],"could":[24],"be":[25],"done":[26],"on":[27,89,113,118,169],"the":[28,41,65,74,79,90,95,125,138],"system":[29],"as":[30,48],"their":[31],"representation,":[33],"and":[34,52,71,116,129],"have":[35,84,146],"model":[36,75],"parameters":[37,76],"define":[39,78],"how":[40],"predictive":[42],"representation":[44],"changes":[45],"over":[46],"time":[47],"actions":[49],"taken":[51],"observations":[53],"noted.":[54],"Learning":[55],"requires":[58],"solving":[59],"two":[60],"subproblems:":[61],"1)":[62],"discovery":[63,91,127],"whose":[67],"constitute":[69],"state,":[70],"2)":[72],"learning":[73,96,132],"dynamics.":[80],"So":[81],"far,":[82],"there":[83],"been":[85,102],"no":[86],"results":[87,110],"available":[88],"subproblem":[92,97],"while":[93],"for":[94,134,137],"an":[98],"approximate-gradient":[99],"algorithm":[100,128,133],"has":[101],"(Singh":[104],"et":[105],"al.,":[106],"2003)":[107],"with":[108],"mixed":[109],"(it":[111],"works":[112],"some":[114],"domains":[115],"not":[117],"others).":[119],"In":[120],"this":[121],"paper,":[122],"we":[123,158],"provide":[124,151],"first":[126],"new":[131],"linear":[135],"PSRs":[136],"special":[139],"class":[140],"systems":[144],"reset":[148],"operation.":[149],"We":[150],"experimental":[152],"verification":[153],"our":[155,161],"algorithms.":[156],"Finally,":[157],"also":[159],"distinguish":[160],"work":[162,165],"from":[163],"prior":[164],"by":[166],"Jaeger":[167],"(2000)":[168],"operator":[171],"(OOMs).":[173]},"counts_by_year":[{"year":2023,"cited_by_count":3},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":3}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
