{"id":"https://openalex.org/W2134911271","doi":"https://doi.org/10.1109/cdc.2005.1582142","title":"Reinforcement Learning of Optimal Supervisor Based on Language Measure","display_name":"Reinforcement Learning of Optimal Supervisor Based on Language Measure","publication_year":2006,"publication_date":"2006-10-04","ids":{"openalex":"https://openalex.org/W2134911271","doi":"https://doi.org/10.1109/cdc.2005.1582142","mag":"2134911271"},"language":"en","primary_location":{"id":"doi:10.1109/cdc.2005.1582142","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cdc.2005.1582142","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 44th IEEE Conference on Decision and Control","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101427761","display_name":"Takeshi Yamasaki","orcid":"https://orcid.org/0000-0002-6170-7945"},"institutions":[{"id":"https://openalex.org/I206011266","display_name":"Kwansei Gakuin University","ror":"https://ror.org/02qf2tx24","country_code":"JP","type":"education","lineage":["https://openalex.org/I206011266"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"T. Yamasaki","raw_affiliation_strings":["School of Science and Technology, Kwansei Gakuin University, Sanda, Hyogo, Japan","School of Science and Technology, Kwansei Gakuin Universiy, Sanda-shi, Hyogo, 669-1337 Japan tatsushi@ksc.kwansei.ac.jp"],"affiliations":[{"raw_affiliation_string":"School of Science and Technology, Kwansei Gakuin University, Sanda, Hyogo, Japan","institution_ids":["https://openalex.org/I206011266"]},{"raw_affiliation_string":"School of Science and Technology, Kwansei Gakuin Universiy, Sanda-shi, Hyogo, 669-1337 Japan tatsushi@ksc.kwansei.ac.jp","institution_ids":["https://openalex.org/I206011266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025132639","display_name":"Kazuhiro Taniguchi","orcid":"https://orcid.org/0000-0001-5774-5124"},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"Osaka University","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"K. Taniguchi","raw_affiliation_strings":["Graduate School of Engineering Science, Osaka University, Toyonaka, Osaka, Japan","Osaka University"],"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering Science, Osaka University, Toyonaka, Osaka, Japan","institution_ids":["https://openalex.org/I98285908"]},{"raw_affiliation_string":"Osaka University","institution_ids":["https://openalex.org/I98285908"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046686505","display_name":"Toshimitsu Ushio","orcid":"https://orcid.org/0000-0002-4009-270X"},"institutions":[{"id":"https://openalex.org/I98285908","display_name":"Osaka University","ror":"https://ror.org/035t8zc32","country_code":"JP","type":"education","lineage":["https://openalex.org/I98285908"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"T. Ushio","raw_affiliation_strings":["Graduate School of Engineering Science, Osaka University, Toyonaka, Osaka, Japan","Osaka University"],"affiliations":[{"raw_affiliation_string":"Graduate School of Engineering Science, Osaka University, Toyonaka, Osaka, Japan","institution_ids":["https://openalex.org/I98285908"]},{"raw_affiliation_string":"Osaka University","institution_ids":["https://openalex.org/I98285908"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101427761"],"corresponding_institution_ids":["https://openalex.org/I206011266"],"apc_list":null,"apc_paid":null,"fwci":0.6541,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.71524132,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"126","last_page":"131"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11125","display_name":"Petri Nets in System Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11125","display_name":"Petri Nets in System Modeling","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/supervisor","display_name":"Supervisor","score":0.9101543426513672},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.8103813529014587},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7897970676422119},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.735985517501831},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.6406406760215759},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48572856187820435},{"id":"https://openalex.org/keywords/formal-language","display_name":"Formal language","score":0.4161173701286316},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.357060968875885},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3285384774208069},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.23440015316009521},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.1401672065258026}],"concepts":[{"id":"https://openalex.org/C2779110517","wikidata":"https://www.wikidata.org/wiki/Q1240788","display_name":"Supervisor","level":2,"score":0.9101543426513672},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.8103813529014587},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7897970676422119},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.735985517501831},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.6406406760215759},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48572856187820435},{"id":"https://openalex.org/C146072743","wikidata":"https://www.wikidata.org/wiki/Q192161","display_name":"Formal language","level":2,"score":0.4161173701286316},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.357060968875885},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3285384774208069},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.23440015316009521},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.1401672065258026},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cdc.2005.1582142","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cdc.2005.1582142","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 44th IEEE Conference on Decision and Control","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1226734329","https://openalex.org/W1502177156","https://openalex.org/W1557517019","https://openalex.org/W1576452626","https://openalex.org/W1587663028","https://openalex.org/W1979349468","https://openalex.org/W1995131244","https://openalex.org/W2007347868","https://openalex.org/W2059057465","https://openalex.org/W2090821252","https://openalex.org/W2123274964","https://openalex.org/W2126295866","https://openalex.org/W2143990843","https://openalex.org/W2152623443","https://openalex.org/W2153400879","https://openalex.org/W2157338290","https://openalex.org/W2158941525","https://openalex.org/W2163167436","https://openalex.org/W2175973919","https://openalex.org/W2178684067","https://openalex.org/W2911283634","https://openalex.org/W2914656440","https://openalex.org/W4233708513","https://openalex.org/W4297744580","https://openalex.org/W6682402947","https://openalex.org/W6815665964"],"related_works":["https://openalex.org/W4387731985","https://openalex.org/W2755149878","https://openalex.org/W2941808082","https://openalex.org/W2468425257","https://openalex.org/W4379086698","https://openalex.org/W2528721242","https://openalex.org/W4377009725","https://openalex.org/W4320164562","https://openalex.org/W2356364326","https://openalex.org/W2127190708"],"abstract_inverted_index":{"Recently,":[0],"Wang":[1],"and":[2,48,71,108],"Ray":[3],"introduced":[4],"a":[5,13,28,44,54,72,91],"signed":[6],"real":[7],"measure":[8],"for":[9],"formal":[10],"languages,":[11],"called":[12],"language":[14,38],"measure,":[15],"to":[16],"evaluate":[17],"performance":[18,73],"of":[19,31,43,75,94,104,106,111,126],"strings":[20],"generated":[21,78],"by":[22,79,119],"discrete":[23,45,82],"event":[24,46,83],"systems.":[25,84],"They":[26],"proposed":[27,128],"synthesis":[29],"method":[30,93],"an":[32,124],"optimal":[33,96],"supervisor":[34,97],"based":[35,98],"on":[36,99],"the":[37,49,65,68,76,80,87,95,109,127],"measure.":[39],"If":[40],"exact":[41],"description":[42],"system":[47],"specification":[50],"is":[51,57],"not":[52],"available,":[53],"learning-based":[55],"approach":[56],"useful.":[58],"In":[59],"this":[60],"paper,":[61],"first,":[62],"we":[63,89,122],"clarify":[64],"relationship":[66],"between":[67],"Bellman":[69],"equation":[70],"index":[74],"languages":[77],"controlled":[81],"Next,":[85],"using":[86],"relationship,":[88],"propose":[90],"learning":[92,101],"reinforcement":[100],"where":[102],"costs":[103],"disabling":[105],"events":[107],"evaluation":[110],"reaching":[112],"states":[113],"are":[114],"taken":[115],"into":[116],"consideration.":[117],"Finally,":[118],"computer":[120],"simulation,":[121],"illustrate":[123],"efficiency":[125],"method.":[129]},"counts_by_year":[{"year":2015,"cited_by_count":2},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
