{"id":"https://openalex.org/W3214634944","doi":"https://doi.org/10.1007/978-3-030-94583-1_7","title":"Gradient-Descent for Randomized Controllers Under Partial Observability","display_name":"Gradient-Descent for Randomized Controllers Under Partial Observability","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W3214634944","doi":"https://doi.org/10.1007/978-3-030-94583-1_7","mag":"3214634944"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-030-94583-1_7","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-030-94583-1_7","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5071333506","display_name":"Linus Heck","orcid":"https://orcid.org/0000-0002-4774-7609"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Linus Heck","raw_affiliation_strings":["RWTH Aachen University, Aachen, Germany"],"raw_orcid":"https://orcid.org/0000-0002-4774-7609","affiliations":[{"raw_affiliation_string":"RWTH Aachen University, Aachen, Germany","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020384363","display_name":"Jip Spel","orcid":"https://orcid.org/0000-0002-9113-2791"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jip Spel","raw_affiliation_strings":["RWTH Aachen University, Aachen, Germany"],"raw_orcid":"https://orcid.org/0000-0002-9113-2791","affiliations":[{"raw_affiliation_string":"RWTH Aachen University, Aachen, Germany","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018941708","display_name":"Sebastian Junges","orcid":"https://orcid.org/0000-0003-0978-8466"},"institutions":[{"id":"https://openalex.org/I145872427","display_name":"Radboud University Nijmegen","ror":"https://ror.org/016xsfp80","country_code":"NL","type":"education","lineage":["https://openalex.org/I145872427"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Sebastian Junges","raw_affiliation_strings":["Radboud University, Nijmegen, The Netherlands"],"raw_orcid":"https://orcid.org/0000-0003-0978-8466","affiliations":[{"raw_affiliation_string":"Radboud University, Nijmegen, The Netherlands","institution_ids":["https://openalex.org/I145872427"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058957702","display_name":"Joshua Moerman","orcid":"https://orcid.org/0000-0001-9819-8374"},"institutions":[{"id":"https://openalex.org/I7876267","display_name":"Open University of the Netherlands","ror":"https://ror.org/018dfmf50","country_code":"NL","type":"education","lineage":["https://openalex.org/I7876267"]},{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE","NL"],"is_corresponding":false,"raw_author_name":"Joshua Moerman","raw_affiliation_strings":["Open University of the Netherlands, Heerlen, The Netherlands","RWTH Aachen University, Aachen, Germany"],"raw_orcid":"https://orcid.org/0000-0001-9819-8374","affiliations":[{"raw_affiliation_string":"Open University of the Netherlands, Heerlen, The Netherlands","institution_ids":["https://openalex.org/I7876267"]},{"raw_affiliation_string":"RWTH Aachen University, Aachen, Germany","institution_ids":["https://openalex.org/I887968799"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090819329","display_name":"Joost-Pieter Katoen","orcid":"https://orcid.org/0000-0002-6143-1926"},"institutions":[{"id":"https://openalex.org/I887968799","display_name":"RWTH Aachen University","ror":"https://ror.org/04xfq0f34","country_code":"DE","type":"education","lineage":["https://openalex.org/I887968799"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Joost-Pieter Katoen","raw_affiliation_strings":["RWTH Aachen University, Aachen, Germany"],"raw_orcid":"https://orcid.org/0000-0002-6143-1926","affiliations":[{"raw_affiliation_string":"RWTH Aachen University, Aachen, Germany","institution_ids":["https://openalex.org/I887968799"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5071333506"],"corresponding_institution_ids":["https://openalex.org/I887968799"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":4.4507,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.95270694,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"127","last_page":"150"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12056","display_name":"Markov Chains and Monte Carlo Methods","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/observability","display_name":"Observability","score":0.9160088300704956},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7855302095413208},{"id":"https://openalex.org/keywords/parametric-statistics","display_name":"Parametric statistics","score":0.6256141066551208},{"id":"https://openalex.org/keywords/gradient-descent","display_name":"Gradient descent","score":0.6063434481620789},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.5392033457756042},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.46306198835372925},{"id":"https://openalex.org/keywords/stochastic-gradient-descent","display_name":"Stochastic gradient descent","score":0.44671958684921265},{"id":"https://openalex.org/keywords/observable","display_name":"Observable","score":0.42767611145973206},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.4261242747306824},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4150926470756531},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.409812331199646},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.3799765408039093},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2665034234523773},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.1996745467185974},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.18719187378883362},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.14366933703422546},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.12454724311828613},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.08361920714378357}],"concepts":[{"id":"https://openalex.org/C36299963","wikidata":"https://www.wikidata.org/wiki/Q1369844","display_name":"Observability","level":2,"score":0.9160088300704956},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7855302095413208},{"id":"https://openalex.org/C117251300","wikidata":"https://www.wikidata.org/wiki/Q1849855","display_name":"Parametric statistics","level":2,"score":0.6256141066551208},{"id":"https://openalex.org/C153258448","wikidata":"https://www.wikidata.org/wiki/Q1199743","display_name":"Gradient descent","level":3,"score":0.6063434481620789},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.5392033457756042},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.46306198835372925},{"id":"https://openalex.org/C206688291","wikidata":"https://www.wikidata.org/wiki/Q7617819","display_name":"Stochastic gradient descent","level":3,"score":0.44671958684921265},{"id":"https://openalex.org/C32848918","wikidata":"https://www.wikidata.org/wiki/Q845789","display_name":"Observable","level":2,"score":0.42767611145973206},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4261242747306824},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4150926470756531},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.409812331199646},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.3799765408039093},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2665034234523773},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.1996745467185974},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.18719187378883362},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.14366933703422546},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.12454724311828613},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.08361920714378357},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1007/978-3-030-94583-1_7","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-030-94583-1_7","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},{"id":"pmh:oai:publications.rwth-aachen.de:841719","is_oa":false,"landing_page_url":"https://publications.rwth-aachen.de/record/841719","pdf_url":null,"source":{"id":"https://openalex.org/S4306401033","display_name":"RWTH Publications (RWTH Aachen)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887968799","host_organization_name":"RWTH Aachen University","host_organization_lineage":["https://openalex.org/I887968799"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Verification, Model Checking, and Abstract Interpretation : 23rd International Conference, VMCAI 2022, Philadelphia, PA, USA, January 16\u201318, 2022, Proceedings / edited by Bernd Finkbeiner, Thomas Wies<br/>23. International Conference on Verification, Model Checking, and Abstract Interpretation, VMCAI 2022, Philadelphia, PA, USA, 2022-01-16 - 2022-01-18","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:repository.ubn.ru.nl:2066/250748","is_oa":false,"landing_page_url":"https://repository.ubn.ru.nl/handle/2066/250748","pdf_url":null,"source":{"id":"https://openalex.org/S4306401067","display_name":"Radboud Repository (Radboud University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I145872427","host_organization_name":"Radboud University Nijmegen","host_organization_lineage":["https://openalex.org/I145872427"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article in monograph or in proceedings"},{"id":"pmh:ou:oai:research.ou.nl:publications/ea797d31-e998-4ced-ace8-806ea680b42b","is_oa":false,"landing_page_url":"https://research.ou.nl/en/publications/ea797d31-e998-4ced-ace8-806ea680b42b","pdf_url":null,"source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Verification, model Checking, and Abstract Interpretation: 23rd International Conference, VMCAI 2022 Philadelphia, PA, USA, January 16\u201318, 2022 Proceedings, 127 - 150","raw_type":"info:eu-repo/semantics/conferencepaper"},{"id":"pmh:ru:oai:repository.ubn.ru.nl:2066/250748","is_oa":false,"landing_page_url":"http://hdl.handle.net/2066/250748","pdf_url":null,"source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Finkbeiner, B. (ed.), Verification, Model Checking, and Abstract Interpretation: 23rd International Conference, VMCAI 2022, Philadelphia, PA, USA, January 16\u201318, 2022, Proceedings, 127 - 150. Cham : Springer International Publishing","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Climate action","id":"https://metadata.un.org/sdg/13","score":0.4300000071525574}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W754964377","https://openalex.org/W1176136657","https://openalex.org/W1498432697","https://openalex.org/W1532041863","https://openalex.org/W1559540003","https://openalex.org/W1574505635","https://openalex.org/W1600556058","https://openalex.org/W1622676895","https://openalex.org/W1643571618","https://openalex.org/W1851152565","https://openalex.org/W1862398452","https://openalex.org/W1880436303","https://openalex.org/W1892040981","https://openalex.org/W1977070092","https://openalex.org/W2000865099","https://openalex.org/W2010875998","https://openalex.org/W2111765806","https://openalex.org/W2114879646","https://openalex.org/W2135776689","https://openalex.org/W2149476049","https://openalex.org/W2158907787","https://openalex.org/W2168359464","https://openalex.org/W2284340808","https://openalex.org/W2336416123","https://openalex.org/W2587263590","https://openalex.org/W2594789366","https://openalex.org/W2604176721","https://openalex.org/W2803246896","https://openalex.org/W2808100232","https://openalex.org/W2809011908","https://openalex.org/W2930056168","https://openalex.org/W2932972683","https://openalex.org/W2938736712","https://openalex.org/W2962989424","https://openalex.org/W2963307044","https://openalex.org/W2982115117","https://openalex.org/W2995644129","https://openalex.org/W3019187101","https://openalex.org/W3034246012","https://openalex.org/W3081134170","https://openalex.org/W3097686825","https://openalex.org/W3109856706","https://openalex.org/W3134410578","https://openalex.org/W3142023506","https://openalex.org/W3162128423","https://openalex.org/W3179132544","https://openalex.org/W3214634944","https://openalex.org/W4253020087","https://openalex.org/W6629794996","https://openalex.org/W6637967152","https://openalex.org/W6674236629","https://openalex.org/W6767164110"],"related_works":["https://openalex.org/W11481024","https://openalex.org/W2895097035","https://openalex.org/W4206903459","https://openalex.org/W2754816816","https://openalex.org/W4366280654","https://openalex.org/W3160167280","https://openalex.org/W4362706668","https://openalex.org/W4231621013","https://openalex.org/W3171021120","https://openalex.org/W3008318776"],"abstract_inverted_index":null,"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
