{"id":"https://openalex.org/W1980648727","doi":"https://doi.org/10.1109/tcyb.2014.2352038","title":"Toward Generalization of Automated Temporal Abstraction to Partially Observable Reinforcement Learning","display_name":"Toward Generalization of Automated Temporal Abstraction to Partially Observable Reinforcement Learning","publication_year":2014,"publication_date":"2014-09-09","ids":{"openalex":"https://openalex.org/W1980648727","doi":"https://doi.org/10.1109/tcyb.2014.2352038","mag":"1980648727","pmid":"https://pubmed.ncbi.nlm.nih.gov/25216494"},"language":"en","primary_location":{"id":"doi:10.1109/tcyb.2014.2352038","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2014.2352038","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5002885572","display_name":"Erk\u0456n \u00c7\u0456lden","orcid":"https://orcid.org/0000-0003-3451-7326"},"institutions":[{"id":"https://openalex.org/I201799495","display_name":"Middle East Technical University","ror":"https://ror.org/014weej12","country_code":"TR","type":"education","lineage":["https://openalex.org/I201799495"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Erkin Cilden","raw_affiliation_strings":["Department of Computer Engineering, Middle East Technical University, Ankara, Turkey","Dept. of Computer Engineering, Middle East Technical University, Ankara, Turkey#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Middle East Technical University, Ankara, Turkey","institution_ids":["https://openalex.org/I201799495"]},{"raw_affiliation_string":"Dept. of Computer Engineering, Middle East Technical University, Ankara, Turkey#TAB#","institution_ids":["https://openalex.org/I201799495"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016249943","display_name":"Faruk Polat","orcid":"https://orcid.org/0000-0003-0509-9153"},"institutions":[{"id":"https://openalex.org/I201799495","display_name":"Middle East Technical University","ror":"https://ror.org/014weej12","country_code":"TR","type":"education","lineage":["https://openalex.org/I201799495"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Faruk Polat","raw_affiliation_strings":["Department of Computer Engineering, Middle East Technical University, Ankara, Turkey","Dept. of Computer Engineering, Middle East Technical University, Ankara, Turkey#TAB#"],"affiliations":[{"raw_affiliation_string":"Department of Computer Engineering, Middle East Technical University, Ankara, Turkey","institution_ids":["https://openalex.org/I201799495"]},{"raw_affiliation_string":"Dept. of Computer Engineering, Middle East Technical University, Ankara, Turkey#TAB#","institution_ids":["https://openalex.org/I201799495"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5002885572"],"corresponding_institution_ids":["https://openalex.org/I201799495"],"apc_list":null,"apc_paid":null,"fwci":0.4243,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.73475636,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"45","issue":"8","first_page":"1414","last_page":"1425"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11975","display_name":"Evolutionary Algorithms and Applications","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9696999788284302,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.8164709806442261},{"id":"https://openalex.org/keywords/observable","display_name":"Observable","score":0.7777222394943237},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.762360692024231},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.761424720287323},{"id":"https://openalex.org/keywords/curse-of-dimensionality","display_name":"Curse of dimensionality","score":0.6762387752532959},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6184395551681519},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.6131808757781982},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5659393668174744},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.46590524911880493},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.4558012783527374},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.42269405722618103},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.41000422835350037},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3387337028980255},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11818766593933105}],"concepts":[{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.8164709806442261},{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.7777222394943237},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.762360692024231},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.761424720287323},{"id":"https://openalex.org/C111030470","wikidata":"https://www.wikidata.org/wiki/Q1430460","display_name":"Curse of dimensionality","level":2,"score":0.6762387752532959},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6184395551681519},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.6131808757781982},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5659393668174744},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.46590524911880493},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.4558012783527374},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.42269405722618103},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.41000422835350037},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3387337028980255},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11818766593933105},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/tcyb.2014.2352038","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2014.2352038","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},{"id":"pmid:25216494","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/25216494","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on cybernetics","raw_type":null},{"id":"pmh:oai:open.metu.edu.tr:11511/46018","is_oa":false,"landing_page_url":"https://hdl.handle.net/11511/46018","pdf_url":null,"source":{"id":"https://openalex.org/S4306402495","display_name":"OpenMETU (Middle East Technical University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I201799495","host_organization_name":"Middle East Technical University","host_organization_lineage":["https://openalex.org/I201799495"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Journal Article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.41999998688697815,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G4121987947","display_name":null,"funder_award_id":"113E239","funder_id":"https://openalex.org/F4320322626","funder_display_name":"T\u00fcrkiye Bilimsel ve Teknolojik Ara\u015ft\u0131rma Kurumu"}],"funders":[{"id":"https://openalex.org/F4320322626","display_name":"T\u00fcrkiye Bilimsel ve Teknolojik Ara\u015ft\u0131rma Kurumu","ror":"https://ror.org/04w9kkr77"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W131709709","https://openalex.org/W180325379","https://openalex.org/W1536990779","https://openalex.org/W1539216098","https://openalex.org/W1556824961","https://openalex.org/W1568042657","https://openalex.org/W1583380718","https://openalex.org/W1592847719","https://openalex.org/W1595483645","https://openalex.org/W1598052524","https://openalex.org/W1657674574","https://openalex.org/W1968768508","https://openalex.org/W2082973084","https://openalex.org/W2096132608","https://openalex.org/W2100677568","https://openalex.org/W2107726111","https://openalex.org/W2109910161","https://openalex.org/W2111412461","https://openalex.org/W2115356364","https://openalex.org/W2115502112","https://openalex.org/W2116753650","https://openalex.org/W2121517924","https://openalex.org/W2121863487","https://openalex.org/W2124434282","https://openalex.org/W2126566174","https://openalex.org/W2134802714","https://openalex.org/W2143435603","https://openalex.org/W2149476049","https://openalex.org/W2153947321","https://openalex.org/W2158304715","https://openalex.org/W2164397622","https://openalex.org/W2166515056","https://openalex.org/W2168359464","https://openalex.org/W2271240761","https://openalex.org/W2341171179","https://openalex.org/W2912565033","https://openalex.org/W3011120880","https://openalex.org/W3041202696","https://openalex.org/W4214717370","https://openalex.org/W4249441547","https://openalex.org/W6605390924","https://openalex.org/W6632200469","https://openalex.org/W6634137646","https://openalex.org/W6635158338","https://openalex.org/W6635465357","https://openalex.org/W6635923701","https://openalex.org/W6636922475","https://openalex.org/W6674155736","https://openalex.org/W6677133782","https://openalex.org/W6677456677","https://openalex.org/W6679977494","https://openalex.org/W6680976742","https://openalex.org/W6682802936","https://openalex.org/W6684606548","https://openalex.org/W6694098965","https://openalex.org/W6775686901"],"related_works":["https://openalex.org/W1994680671","https://openalex.org/W2000283393","https://openalex.org/W2002320543","https://openalex.org/W2040927204","https://openalex.org/W2061947244","https://openalex.org/W2150232912","https://openalex.org/W2054940838","https://openalex.org/W3106170641","https://openalex.org/W4321855183","https://openalex.org/W4296209631"],"abstract_inverted_index":{"Temporal":[0],"abstraction":[1,83,122,129],"for":[2,65,91],"reinforcement":[3],"learning":[4,9,20,61],"(RL)":[5],"aims":[6],"to":[7],"decrease":[8],"time":[10],"by":[11,59,134],"making":[12],"use":[13],"of":[14,24,41,102,126],"repeated":[15],"sub-policy":[16],"patterns":[17],"in":[18],"the":[19,39,47,50,53,60,127],"task.":[21],"Automatic":[22],"extraction":[23],"abstractions":[25,64],"during":[26],"RL":[27,68,106],"process":[28],"is":[29,56,69,131],"difficult":[30],"but":[31],"has":[32],"many":[33],"challenges":[34],"such":[35],"as":[36],"dealing":[37],"with":[38,119],"curse":[40],"dimensionality.":[42],"Various":[43],"studies":[44],"have":[45],"explored":[46,73],"subject":[48],"under":[49],"assumption":[51],"that":[52,115],"problem":[54],"domain":[55],"fully":[57,92],"observable":[58,67,93,105],"agent.":[62],"Learning":[63],"partially":[66,104],"a":[70,99],"relatively":[71],"less":[72],"area.":[74],"In":[75],"this":[76,120],"paper,":[77],"we":[78],"adapt":[79],"an":[80],"existing":[81],"automatic":[82],"method,":[84],"namely":[85],"extended":[86],"sequence":[87],"tree,":[88],"originally":[89],"designed":[90],"problems.":[94,139],"The":[95,124],"modified":[96],"method":[97,130],"covers":[98],"certain":[100],"family":[101],"model-based":[103],"settings.":[107],"We":[108],"also":[109],"introduce":[110],"belief":[111],"state":[112],"discretization":[113],"methods":[114],"can":[116],"be":[117],"used":[118],"new":[121],"mechanism.":[123],"effectiveness":[125],"proposed":[128],"shown":[132],"empirically":[133],"experimenting":[135],"on":[136],"well-known":[137],"benchmark":[138]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":2},{"year":2017,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
