{"id":"https://openalex.org/W4213455538","doi":"https://doi.org/10.1109/tac.2022.3153278","title":"Expedited Online Learning With Spatial Side Information","display_name":"Expedited Online Learning With Spatial Side Information","publication_year":2022,"publication_date":"2022-02-24","ids":{"openalex":"https://openalex.org/W4213455538","doi":"https://doi.org/10.1109/tac.2022.3153278"},"language":"en","primary_location":{"id":"doi:10.1109/tac.2022.3153278","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tac.2022.3153278","pdf_url":null,"source":{"id":"https://openalex.org/S184954342","display_name":"IEEE Transactions on Automatic Control","issn_l":"0018-9286","issn":["0018-9286","1558-2523","2334-3303"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automatic Control","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023184269","display_name":"Pranay Thangeda","orcid":"https://orcid.org/0000-0002-0680-6334"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pranay Thangeda","raw_affiliation_strings":["Department of Aerospace Engineering and the Coordinated Science Laboratory, University of Illinois at Urbana-Champaign, Urbana, USA"],"raw_orcid":"https://orcid.org/0000-0002-0680-6334","affiliations":[{"raw_affiliation_string":"Department of Aerospace Engineering and the Coordinated Science Laboratory, University of Illinois at Urbana-Champaign, Urbana, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070897457","display_name":"Melkior Ornik","orcid":"https://orcid.org/0000-0002-8510-8787"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Melkior Ornik","raw_affiliation_strings":["Department of Aerospace Engineering and the Coordinated Science Laboratory, University of Illinois at Urbana-Champaign, Urbana, USA"],"raw_orcid":"https://orcid.org/0000-0002-8510-8787","affiliations":[{"raw_affiliation_string":"Department of Aerospace Engineering and the Coordinated Science Laboratory, University of Illinois at Urbana-Champaign, Urbana, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5068441112","display_name":"Ufuk Topcu","orcid":"https://orcid.org/0000-0003-0819-9985"},"institutions":[{"id":"https://openalex.org/I86519309","display_name":"The University of Texas at Austin","ror":"https://ror.org/00hj54h04","country_code":"US","type":"education","lineage":["https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ufuk Topcu","raw_affiliation_strings":["Department of Aerospace Engineering and Engineering Mechanics, and the Oden Institute for Computational Engineering and Sciences, The University of Texas at Austin, Austin, USA"],"raw_orcid":"https://orcid.org/0000-0003-0819-9985","affiliations":[{"raw_affiliation_string":"Department of Aerospace Engineering and Engineering Mechanics, and the Oden Institute for Computational Engineering and Sciences, The University of Texas at Austin, Austin, USA","institution_ids":["https://openalex.org/I86519309"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.5549,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.70838859,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"68","issue":"3","first_page":"1479","last_page":"1491"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12288","display_name":"Optimization and Search Problems","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.9954000115394592,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7517244815826416},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7141676545143127},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5386170744895935},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5308055877685547},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5271567702293396},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5180611610412598},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.517760694026947},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.4205777645111084},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.324496865272522}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7517244815826416},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7141676545143127},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5386170744895935},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5308055877685547},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5271567702293396},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5180611610412598},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.517760694026947},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.4205777645111084},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.324496865272522},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tac.2022.3153278","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tac.2022.3153278","pdf_url":null,"source":{"id":"https://openalex.org/S184954342","display_name":"IEEE Transactions on Automatic Control","issn_l":"0018-9286","issn":["0018-9286","1558-2523","2334-3303"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automatic Control","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306101","display_name":"National Aeronautics and Space Administration","ror":"https://ror.org/027ka1x80"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W325088472","https://openalex.org/W1505831061","https://openalex.org/W1588797187","https://openalex.org/W1975867865","https://openalex.org/W1980516134","https://openalex.org/W1988526405","https://openalex.org/W2003048154","https://openalex.org/W2006501475","https://openalex.org/W2115356364","https://openalex.org/W2123447947","https://openalex.org/W2124352385","https://openalex.org/W2125710232","https://openalex.org/W2137351138","https://openalex.org/W2236244207","https://openalex.org/W2334782222","https://openalex.org/W2489939061","https://openalex.org/W2863106311","https://openalex.org/W2890278535","https://openalex.org/W2914335791","https://openalex.org/W2963778636","https://openalex.org/W3046018659","https://openalex.org/W4213251304","https://openalex.org/W4214587036","https://openalex.org/W4233413206","https://openalex.org/W4251942419","https://openalex.org/W4287726780","https://openalex.org/W4297780563","https://openalex.org/W6678481081","https://openalex.org/W6678635437","https://openalex.org/W6680367670","https://openalex.org/W6682367392","https://openalex.org/W6780575690"],"related_works":["https://openalex.org/W2964604098","https://openalex.org/W2374820792","https://openalex.org/W2997512100","https://openalex.org/W4319083788","https://openalex.org/W3022038857","https://openalex.org/W1874176344","https://openalex.org/W4379255972","https://openalex.org/W2098964857","https://openalex.org/W4289490967","https://openalex.org/W2893605337"],"abstract_inverted_index":{"The":[0],"applicability":[1],"of":[2,14,26,67,88,90,184,202,212,219],"model-based":[3,115],"online":[4],"reinforcement":[5,116],"learning":[6,18,52,117],"algorithms":[7,118,215],"is":[8,35],"often":[9],"limited":[10],"by":[11,95,119,151],"the":[12,19,23,48,53,65,70,79,91,100,121,144,168,176,182,185,191,203,206,210,213,235],"amount":[13],"exploration":[15,159],"required":[16],"for":[17,51,142],"environment":[20],"model":[21],"to":[22,31,36,62,109,155],"desired":[24],"level":[25],"accuracy.":[27],"A":[28],"promising":[29],"approach":[30],"addressing":[32],"this":[33,83],"issue":[34],"exploit":[37],"side":[38,111,153,236],"information,":[39],"available":[40],"either":[41],"<italic":[42],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[43],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">a":[44],"priori</i>":[45],"or":[46],"during":[47,187],"agent\u2019s":[49],"mission,":[50],"unknown":[54,149],"dynamics.":[55,136],"Side":[56],"information":[57,63,84,112,129,154],"in":[58,64,78,148,175,194,200,216],"our":[59],"context":[60],"refers":[61],"form":[66],"bounds":[68],"on":[69],"differences":[71],"between":[72,158],"transition":[73],"probabilities":[74],"at":[75,102,125],"different":[76,103],"states":[77,126,133],"environment.":[80],"We":[81,105,162,189,208],"use":[82],"as":[85,234],"a":[86,107,172,217,220,229],"measure":[87],"reusability":[89],"direct":[92],"experience":[93],"gained":[94],"performing":[96],"actions":[97],"and":[98,160,228],"observing":[99],"outcomes":[101],"states.":[104],"propose":[106,139],"framework":[108],"integrate":[110],"into":[113],"existing":[114],"complementing":[120],"samples":[122],"obtained":[123,130],"directly":[124],"with":[127,134,165,223],"second-hand":[128],"from":[131,225],"other":[132],"similar":[135],"Additionally,":[137],"we":[138],"an":[140],"algorithm":[141,170],"synthesizing":[143],"optimal":[145],"control":[146],"strategy":[147],"environments":[150],"using":[152],"effectively":[156],"balance":[157],"exploitation.":[161],"prove":[163],"that,":[164],"high":[166],"probability,":[167],"proposed":[169,214],"yields":[171],"near-optimal":[173,192],"policy":[174,193],"Bayesian":[177],"sense,":[178],"while":[179],"also":[180],"guaranteeing":[181],"safety":[183],"agent":[186],"exploration.":[188],"obtain":[190],"time":[195],"steps":[196],"that":[197],"are":[198],"polynomial":[199],"terms":[201],"parameters":[204],"describing":[205],"model.":[207],"illustrate":[209],"utility":[211],"setting":[218],"Mars":[221],"rover,":[222],"data":[224],"onboard":[226],"sensors":[227],"companion":[230],"aerial":[231],"vehicle":[232],"acting":[233],"information.":[237]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
