{"id":"https://openalex.org/W2889269551","doi":"https://doi.org/10.1007/978-3-319-99978-4_17","title":"Bounded Rational Decision-Making with Adaptive Neural Network Priors","display_name":"Bounded Rational Decision-Making with Adaptive Neural Network Priors","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2889269551","doi":"https://doi.org/10.1007/978-3-319-99978-4_17","mag":"2889269551"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-319-99978-4_17","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-319-99978-4_17","pdf_url":"https://link.springer.com/content/pdf/10.1007%2F978-3-319-99978-4_17.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007%2F978-3-319-99978-4_17.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5078338213","display_name":"Heinke Hihn","orcid":"https://orcid.org/0000-0002-3244-3661"},"institutions":[{"id":"https://openalex.org/I196349391","display_name":"Universit\u00e4t Ulm","ror":"https://ror.org/032000t02","country_code":"DE","type":"education","lineage":["https://openalex.org/I196349391"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Heinke Hihn","raw_affiliation_strings":["Faculty of Engineering, Computer Science, and Psychology, Institute for Neural Information Processing, Ulm University, Ulm, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, Computer Science, and Psychology, Institute for Neural Information Processing, Ulm University, Ulm, Germany","institution_ids":["https://openalex.org/I196349391"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085415063","display_name":"Sebastian Gottwald","orcid":"https://orcid.org/0000-0003-2906-3577"},"institutions":[{"id":"https://openalex.org/I196349391","display_name":"Universit\u00e4t Ulm","ror":"https://ror.org/032000t02","country_code":"DE","type":"education","lineage":["https://openalex.org/I196349391"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Sebastian Gottwald","raw_affiliation_strings":["Faculty of Engineering, Computer Science, and Psychology, Institute for Neural Information Processing, Ulm University, Ulm, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, Computer Science, and Psychology, Institute for Neural Information Processing, Ulm University, Ulm, Germany","institution_ids":["https://openalex.org/I196349391"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036520551","display_name":"Daniel Braun","orcid":"https://orcid.org/0000-0001-8120-3368"},"institutions":[{"id":"https://openalex.org/I196349391","display_name":"Universit\u00e4t Ulm","ror":"https://ror.org/032000t02","country_code":"DE","type":"education","lineage":["https://openalex.org/I196349391"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Daniel A. Braun","raw_affiliation_strings":["Faculty of Engineering, Computer Science, and Psychology, Institute for Neural Information Processing, Ulm University, Ulm, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, Computer Science, and Psychology, Institute for Neural Information Processing, Ulm University, Ulm, Germany","institution_ids":["https://openalex.org/I196349391"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5078338213"],"corresponding_institution_ids":["https://openalex.org/I196349391"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":{"value":5000,"currency":"EUR","value_usd":5392},"fwci":2.4436,"has_fulltext":true,"cited_by_count":11,"citation_normalized_percentile":{"value":0.91776864,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"213","last_page":"225"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.9868999719619751,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7909131646156311},{"id":"https://openalex.org/keywords/bounded-rationality","display_name":"Bounded rationality","score":0.7278411388397217},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.6663782596588135},{"id":"https://openalex.org/keywords/markov-chain-monte-carlo","display_name":"Markov chain Monte Carlo","score":0.5548930764198303},{"id":"https://openalex.org/keywords/divergence","display_name":"Divergence (linguistics)","score":0.5466681718826294},{"id":"https://openalex.org/keywords/kullback\u2013leibler-divergence","display_name":"Kullback\u2013Leibler divergence","score":0.5298642516136169},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.5225248336791992},{"id":"https://openalex.org/keywords/bounded-function","display_name":"Bounded function","score":0.4936562478542328},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47295185923576355},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4717065989971161},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.46127864718437195},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.4419032633304596},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.41991251707077026},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.3685157895088196},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.1984218955039978},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14179858565330505}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7909131646156311},{"id":"https://openalex.org/C58694771","wikidata":"https://www.wikidata.org/wiki/Q814385","display_name":"Bounded rationality","level":2,"score":0.7278411388397217},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.6663782596588135},{"id":"https://openalex.org/C111350023","wikidata":"https://www.wikidata.org/wiki/Q1191869","display_name":"Markov chain Monte Carlo","level":3,"score":0.5548930764198303},{"id":"https://openalex.org/C207390915","wikidata":"https://www.wikidata.org/wiki/Q1230525","display_name":"Divergence (linguistics)","level":2,"score":0.5466681718826294},{"id":"https://openalex.org/C171752962","wikidata":"https://www.wikidata.org/wiki/Q255166","display_name":"Kullback\u2013Leibler divergence","level":2,"score":0.5298642516136169},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.5225248336791992},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.4936562478542328},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47295185923576355},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4717065989971161},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.46127864718437195},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4419032633304596},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.41991251707077026},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.3685157895088196},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.1984218955039978},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14179858565330505},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1007/978-3-319-99978-4_17","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-319-99978-4_17","pdf_url":"https://link.springer.com/content/pdf/10.1007%2F978-3-319-99978-4_17.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},{"id":"pmh:oai:arXiv.org:1809.01575","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1809.01575","pdf_url":"https://arxiv.org/pdf/1809.01575","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:oparu.uni-ulm.de:123456789/10240","is_oa":true,"landing_page_url":"http://nbn-resolving.de/urn:nbn:de:bsz:289-oparu-10240-7","pdf_url":null,"source":{"id":"https://openalex.org/S4306400353","display_name":"OPen Access Repositorium der Universit\u00e4t Ulm (OPARU) (Ulm University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I196349391","host_organization_name":"Universit\u00e4t Ulm","host_organization_lineage":["https://openalex.org/I196349391"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/conferenceObject"},{"id":"doi:10.18725/oparu-10183","is_oa":true,"landing_page_url":"https://doi.org/10.18725/oparu-10183","pdf_url":null,"source":{"id":"https://openalex.org/S7407052964","display_name":"Universit\u00e4t Ulm, Kommunikations- und Informationszentrum (kiz)","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.1007/978-3-319-99978-4_17","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-319-99978-4_17","pdf_url":"https://link.springer.com/content/pdf/10.1007%2F978-3-319-99978-4_17.pdf","source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.7300000190734863,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2889269551.pdf","grobid_xml":"https://content.openalex.org/works/W2889269551.grobid-xml"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W1487708124","https://openalex.org/W1489119587","https://openalex.org/W1824523713","https://openalex.org/W1959608418","https://openalex.org/W2068238590","https://openalex.org/W2093524643","https://openalex.org/W2097815751","https://openalex.org/W2101692583","https://openalex.org/W2121813011","https://openalex.org/W2128909582","https://openalex.org/W2157201325","https://openalex.org/W2163119409","https://openalex.org/W2163230106","https://openalex.org/W2211766770","https://openalex.org/W2239029832","https://openalex.org/W2250513429","https://openalex.org/W2257979135","https://openalex.org/W2289746565","https://openalex.org/W2569616450","https://openalex.org/W2744355733","https://openalex.org/W2768578623","https://openalex.org/W2951570923","https://openalex.org/W2962887178","https://openalex.org/W2963133245","https://openalex.org/W2963817734","https://openalex.org/W2964177217","https://openalex.org/W4298404235","https://openalex.org/W6604466195"],"related_works":["https://openalex.org/W2580650124","https://openalex.org/W4386190339","https://openalex.org/W2968424575","https://openalex.org/W3142333283","https://openalex.org/W3122088529","https://openalex.org/W3041320102","https://openalex.org/W2111669074","https://openalex.org/W2085259108","https://openalex.org/W3123087812","https://openalex.org/W4283770175"],"abstract_inverted_index":{"Abstract":[0],"Bounded":[1],"rationality":[2,15],"investigates":[3],"utility-optimizing":[4],"decision-makers":[5],"with":[6,128],"limited":[7],"information-processing":[8],"power.":[9],"In":[10,114],"particular,":[11],"information":[12],"theoretic":[13],"bounded":[14],"models":[16,89],"formalize":[17],"resource":[18],"constraints":[19],"abstractly":[20],"in":[21],"terms":[22],"of":[23,54,83,95],"relative":[24],"Shannon":[25],"information,":[26],"namely":[27],"the":[28,32,55,81,93,100],"Kullback-Leibler":[29],"Divergence":[30],"between":[31],"agents\u2019":[33],"prior":[34,39,72,101,109],"and":[35,40,73],"posterior":[36,41],"policy.":[37],"Between":[38],"lies":[42],"an":[43],"anytime":[44,129],"deliberation":[45],"process":[46],"that":[47,97,107,124],"can":[48,74],"be":[49],"instantiated":[50],"by":[51],"sample-based":[52,130],"evaluations":[53],"utility":[56],"function":[57],"through":[58],"Markov":[59],"Chain":[60],"Monte":[61],"Carlo":[62],"(MCMC)":[63],"optimization.":[64],"The":[65],"most":[66],"simple":[67],"model":[68],"assumes":[69],"a":[70],"fixed":[71],"relate":[75],"abstract":[76],"information-theoretic":[77],"processing":[78],"costs":[79],"to":[80],"number":[82],"sample":[84],"evaluations.":[85],"However,":[86],"more":[87,112],"advanced":[88],"would":[90],"also":[91],"address":[92],"question":[94],"learning,":[96],"is":[98,102],"how":[99],"adapted":[103],"over":[104],"time":[105],"such":[106,133],"generated":[108],"proposals":[110],"become":[111],"efficient.":[113],"this":[115,138],"work":[116],"we":[117],"investigate":[118],"generative":[119],"neural":[120],"networks":[121],"as":[122,134],"priors":[123],"are":[125],"optimized":[126],"concurrently":[127],"decision-making":[131],"processes":[132],"MCMC.":[135],"We":[136],"evaluate":[137],"approach":[139],"on":[140],"toy":[141],"examples.":[142]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":3}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
