{"id":"https://openalex.org/W2140219596","doi":"https://doi.org/10.1109/iros.2004.1389903","title":"Reinforcement learning for sensing strategies","display_name":"Reinforcement learning for sensing strategies","publication_year":2005,"publication_date":"2005-04-12","ids":{"openalex":"https://openalex.org/W2140219596","doi":"https://doi.org/10.1109/iros.2004.1389903","mag":"2140219596"},"language":"en","primary_location":{"id":"doi:10.1109/iros.2004.1389903","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros.2004.1389903","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2004 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS) (IEEE Cat. No.04CH37566)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111310852","display_name":"Chin Yuen Kwok","orcid":null},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"C. Kwok","raw_affiliation_strings":["Computer Science & Engineering, University of Washington, Seattle, WA, USA","Dept. of Comput. Sci. & Eng., Washington Univ., Seattle, WA, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Computer Science & Engineering, University of Washington, Seattle, WA, USA","institution_ids":["https://openalex.org/I201448701"]},{"raw_affiliation_string":"Dept. of Comput. Sci. & Eng., Washington Univ., Seattle, WA, USA#TAB#","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108302275","display_name":"D. Fox","orcid":"https://orcid.org/0009-0004-7622-7196"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"D. Fox","raw_affiliation_strings":["Computer Science & Engineering, University of Washington, Seattle, WA, USA","Dept. of Comput. Sci. & Eng., Washington Univ., Seattle, WA, USA#TAB#"],"affiliations":[{"raw_affiliation_string":"Computer Science & Engineering, University of Washington, Seattle, WA, USA","institution_ids":["https://openalex.org/I201448701"]},{"raw_affiliation_string":"Dept. of Comput. Sci. & Eng., Washington Univ., Seattle, WA, USA#TAB#","institution_ids":["https://openalex.org/I201448701"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5111310852"],"corresponding_institution_ids":["https://openalex.org/I201448701"],"apc_list":null,"apc_paid":null,"fwci":5.0236,"has_fulltext":false,"cited_by_count":61,"citation_normalized_percentile":{"value":0.95208765,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"4","issue":null,"first_page":"3158","last_page":"3163"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12784","display_name":"Modular Robots and Swarm Intelligence","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8738906383514404},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7315879464149475},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.7111815810203552},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.6969770193099976},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5922380685806274},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.4796041250228882},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.47128409147262573},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4438351094722748},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.4238147735595703},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.41377922892570496},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.15613001585006714},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07561087608337402}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8738906383514404},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7315879464149475},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.7111815810203552},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.6969770193099976},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5922380685806274},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.4796041250228882},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.47128409147262573},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4438351094722748},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.4238147735595703},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.41377922892570496},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.15613001585006714},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07561087608337402},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iros.2004.1389903","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros.2004.1389903","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2004 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS) (IEEE Cat. No.04CH37566)","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.107.6261","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.107.6261","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.utexas.edu/users/AustinVilla/legged/papers/active-sensing.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.97.4710","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.97.4710","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.washington.edu/homes/fox/postscripts/active-sensing-iros-04.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1531532259","https://openalex.org/W1546266526","https://openalex.org/W1582069131","https://openalex.org/W1597303641","https://openalex.org/W2032097519","https://openalex.org/W2099833070","https://openalex.org/W2102621601","https://openalex.org/W2104207191","https://openalex.org/W2106237563","https://openalex.org/W2115853680","https://openalex.org/W2120712855","https://openalex.org/W2121863487","https://openalex.org/W2137633880","https://openalex.org/W2144691386","https://openalex.org/W2154727088","https://openalex.org/W2155791599","https://openalex.org/W2155971774","https://openalex.org/W4214717370","https://openalex.org/W6635120896","https://openalex.org/W6635767209","https://openalex.org/W6675086535","https://openalex.org/W6675657953","https://openalex.org/W6682864419"],"related_works":["https://openalex.org/W2122871747","https://openalex.org/W3114279067","https://openalex.org/W2930863966","https://openalex.org/W2126211886","https://openalex.org/W3153786280","https://openalex.org/W3127551068","https://openalex.org/W2643884694","https://openalex.org/W2165180011","https://openalex.org/W4220829754","https://openalex.org/W3165944253"],"abstract_inverted_index":{"Since":[0],"sensors":[1],"have":[2,10,85],"limited":[3],"range":[4],"and":[5,69,98,121,138],"coverage,":[6],"mobile":[7],"robots":[8],"often":[9],"to":[11,16,27,39,84,92,96,99,115,134,155],"make":[12,100],"decisions":[13],"on":[14],"where":[15,130],"point":[17],"their":[18],"sensors.":[19],"A":[20],"good":[21],"sensing":[22,42,88,159],"strategy":[23],"allows":[24],"a":[25,53,109,136],"robot":[26,76,81,132],"collect":[28],"information":[29],"that":[30,47,149],"is":[31,153],"useful":[32],"for":[33],"its":[34],"tasks.":[35],"Most":[36],"existing":[37],"solutions":[38],"this":[40,105,117],"active":[41],"problem":[43,60],"choose":[44],"the":[45,50,72,75,101,123,127,131,143],"direction":[46],"maximally":[48],"reduces":[49],"uncertainty":[51],"in":[52,65,77,90,126],"single":[54],"state":[55,67],"variable.":[56],"In":[57,104],"more":[58,86],"complex":[59],"domains,":[61],"however,":[62],"uncertainties":[63,95],"exist":[64],"multiple":[66],"variables,":[68],"they":[70],"affect":[71],"performance":[73],"of":[74],"different":[78],"ways.":[79],"The":[80],"thus":[82],"needs":[83],"sophisticated":[87],"strategies":[89],"order":[91],"decide":[93],"which":[94],"reduce,":[97],"correct":[102],"trade-offs.":[103],"work,":[106],"we":[107],"apply":[108],"least":[110],"squares":[111],"reinforcement":[112],"learning":[113,124],"method":[114],"solve":[116],"problem.":[118],"We":[119,145],"implemented":[120],"tested":[122],"approach":[125,152],"RoboCup":[128],"domain,":[129],"attempts":[133],"reach":[135],"ball":[137],"accurately":[139],"kick":[140],"it":[141],"into":[142],"goal.":[144],"present":[146],"experimental":[147],"results":[148],"suggest":[150],"our":[151],"able":[154],"learn":[156],"highly":[157],"effective":[158],"strategies.":[160]},"counts_by_year":[{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":5},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":6},{"year":2012,"cited_by_count":6}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
