{"id":"https://openalex.org/W2139636730","doi":"https://doi.org/10.1109/irds.2002.1041507","title":"Learning optimal switching policies for path tracking tasks on a mobile robot","display_name":"Learning optimal switching policies for path tracking tasks on a mobile robot","publication_year":2003,"publication_date":"2003-06-25","ids":{"openalex":"https://openalex.org/W2139636730","doi":"https://doi.org/10.1109/irds.2002.1041507","mag":"2139636730"},"language":"en","primary_location":{"id":"doi:10.1109/irds.2002.1041507","is_oa":false,"landing_page_url":"https://doi.org/10.1109/irds.2002.1041507","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/RSJ International Conference on Intelligent Robots and System","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110817778","display_name":"Yunqing Wang","orcid":"https://orcid.org/0000-0002-2164-0766"},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yunqing Wang","raw_affiliation_strings":["Laboratory for Perceptual Robotics, Department of Computer Science, University of Massachusetts, Amherst, USA","Dept. of Comput. Sci., Massachusetts Univ., Amherst, MA, USA"],"affiliations":[{"raw_affiliation_string":"Laboratory for Perceptual Robotics, Department of Computer Science, University of Massachusetts, Amherst, USA","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"Dept. of Comput. Sci., Massachusetts Univ., Amherst, MA, USA","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053037033","display_name":"Bryan J. Thibodeau","orcid":null},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"B. Thibodeau","raw_affiliation_strings":["Laboratory for Perceptual Robotics, Department of Computer Science, University of Massachusetts, Amherst, USA","Dept. of Comput. Sci., Massachusetts Univ., Amherst, MA, USA"],"affiliations":[{"raw_affiliation_string":"Laboratory for Perceptual Robotics, Department of Computer Science, University of Massachusetts, Amherst, USA","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"Dept. of Comput. Sci., Massachusetts Univ., Amherst, MA, USA","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046874645","display_name":"Andrew H. Fagg","orcid":"https://orcid.org/0000-0002-5636-9697"},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"A.H. Fagg","raw_affiliation_strings":["Laboratory for Perceptual Robotics, Department of Computer Science, University of Massachusetts, Amherst, USA","Dept. of Comput. Sci., Massachusetts Univ., Amherst, MA, USA"],"affiliations":[{"raw_affiliation_string":"Laboratory for Perceptual Robotics, Department of Computer Science, University of Massachusetts, Amherst, USA","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"Dept. of Comput. Sci., Massachusetts Univ., Amherst, MA, USA","institution_ids":["https://openalex.org/I24603500"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111628193","display_name":"Roderic A. Grupen","orcid":null},"institutions":[{"id":"https://openalex.org/I24603500","display_name":"University of Massachusetts Amherst","ror":"https://ror.org/0072zz521","country_code":"US","type":"education","lineage":["https://openalex.org/I24603500"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"R.A. Grupen","raw_affiliation_strings":["Laboratory for Perceptual Robotics, Department of Computer Science, University of Massachusetts, Amherst, USA","Dept. of Comput. Sci., Massachusetts Univ., Amherst, MA, USA"],"affiliations":[{"raw_affiliation_string":"Laboratory for Perceptual Robotics, Department of Computer Science, University of Massachusetts, Amherst, USA","institution_ids":["https://openalex.org/I24603500"]},{"raw_affiliation_string":"Dept. of Comput. Sci., Massachusetts Univ., Amherst, MA, USA","institution_ids":["https://openalex.org/I24603500"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5110817778"],"corresponding_institution_ids":["https://openalex.org/I24603500"],"apc_list":null,"apc_paid":null,"fwci":0.8178,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.80522344,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"1","issue":null,"first_page":"915","last_page":"920"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8388127684593201},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7219499945640564},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.6895489692687988},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.6552730798721313},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.5503928661346436},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5175173282623291},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.513582706451416},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5109123587608337},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.5048559308052063},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4638504981994629},{"id":"https://openalex.org/keywords/impedance-control","display_name":"Impedance control","score":0.45748841762542725},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.4432127773761749},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.4052774906158447},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3828886151313782},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.37036240100860596},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.21476799249649048}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8388127684593201},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7219499945640564},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.6895489692687988},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.6552730798721313},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.5503928661346436},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5175173282623291},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.513582706451416},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5109123587608337},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.5048559308052063},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4638504981994629},{"id":"https://openalex.org/C2777984285","wikidata":"https://www.wikidata.org/wiki/Q17098134","display_name":"Impedance control","level":3,"score":0.45748841762542725},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.4432127773761749},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4052774906158447},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3828886151313782},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.37036240100860596},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.21476799249649048},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/irds.2002.1041507","is_oa":false,"landing_page_url":"https://doi.org/10.1109/irds.2002.1041507","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/RSJ International Conference on Intelligent Robots and System","raw_type":"proceedings-article"},{"id":"pmh:oai:scholarworks.umass.edu:cs_faculty_pubs-1536","is_oa":false,"landing_page_url":"https://scholarworks.umass.edu/cs_faculty_pubs/537","pdf_url":null,"source":{"id":"https://openalex.org/S4306402240","display_name":"ScholarWorks@UMassAmherst (University of Massachusetts Amherst)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I24603500","host_organization_name":"University of Massachusetts Amherst","host_organization_lineage":["https://openalex.org/I24603500"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computer Science Department Faculty Publication Series","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.12.4264","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.12.4264","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www-robotics.cs.umass.edu/Papers/iros02learning.ps","raw_type":"text"},{"id":"pmh:oai:scholarworks.umass.edu:20.500.14394/10161","is_oa":false,"landing_page_url":"https://hdl.handle.net/20.500.14394/10161","pdf_url":null,"source":{"id":"https://openalex.org/S4306402240","display_name":"ScholarWorks@UMassAmherst (University of Massachusetts Amherst)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I24603500","host_organization_name":"University of Massachusetts Amherst","host_organization_lineage":["https://openalex.org/I24603500"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"published","raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7300000190734863,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W1556694669","https://openalex.org/W1890116610","https://openalex.org/W1978023077","https://openalex.org/W2016482167","https://openalex.org/W2058927747","https://openalex.org/W2063138845","https://openalex.org/W2142573751","https://openalex.org/W2911283634","https://openalex.org/W2914656440","https://openalex.org/W6644756748","https://openalex.org/W6665205786"],"related_works":["https://openalex.org/W3096874164","https://openalex.org/W4376605461","https://openalex.org/W2357975469","https://openalex.org/W2136202932","https://openalex.org/W3087814763","https://openalex.org/W2892507673","https://openalex.org/W2361647908","https://openalex.org/W2937181779","https://openalex.org/W2537866915","https://openalex.org/W2089415692"],"abstract_inverted_index":{"A":[0],"set":[1],"of":[2,25,28],"impedance":[3,29],"controllers":[4,30],"is":[5,20,33],"used":[6,46],"for":[7],"both":[8],"state":[9],"estimation":[10,19],"and":[11,31],"tracking":[12,32,59],"control":[13],"on":[14,22],"a":[15,26,36,57],"mobile":[16],"robot.":[17],"State":[18],"based":[21],"the":[23],"states":[24],"family":[27],"implemented":[34],"through":[35],"single":[37],"controller":[38],"from":[39],"this":[40],"set.":[41],"Reinforcement":[42],"learning":[43],"techniques":[44],"are":[45],"to":[47],"create":[48],"switching":[49],"policies":[50],"that":[51],"optimize":[52],"time":[53],"or":[54],"energy":[55],"in":[56],"path":[58],"task.":[60]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
