{"id":"https://openalex.org/W3144576563","doi":"https://doi.org/10.1109/ccwc51732.2021.9375906","title":"Improving Reward Functions in Robots Playing Capture the Flag Using Q-Learning","display_name":"Improving Reward Functions in Robots Playing Capture the Flag Using Q-Learning","publication_year":2021,"publication_date":"2021-01-27","ids":{"openalex":"https://openalex.org/W3144576563","doi":"https://doi.org/10.1109/ccwc51732.2021.9375906","mag":"3144576563"},"language":"en","primary_location":{"id":"doi:10.1109/ccwc51732.2021.9375906","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ccwc51732.2021.9375906","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE 11th Annual Computing and Communication Workshop and Conference (CCWC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080439215","display_name":"Trevor Powers","orcid":null},"institutions":[{"id":"https://openalex.org/I192545095","display_name":"United States Military Academy","ror":"https://ror.org/01jepya76","country_code":"US","type":"education","lineage":["https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I192545095","https://openalex.org/I4210088792"]},{"id":"https://openalex.org/I4210116723","display_name":"Robotics Research (United States)","ror":"https://ror.org/020w2fr77","country_code":"US","type":"company","lineage":["https://openalex.org/I4210116723"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Trevor Powers","raw_affiliation_strings":["Robotics Research Center, United States Military Academy,West Point,NY","Robotics Research Center, United States Military Academy, West Point, NY"],"affiliations":[{"raw_affiliation_string":"Robotics Research Center, United States Military Academy,West Point,NY","institution_ids":["https://openalex.org/I192545095"]},{"raw_affiliation_string":"Robotics Research Center, United States Military Academy, West Point, NY","institution_ids":["https://openalex.org/I192545095","https://openalex.org/I4210116723"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041735888","display_name":"Michael Novitzky","orcid":"https://orcid.org/0000-0002-8760-651X"},"institutions":[{"id":"https://openalex.org/I4210116723","display_name":"Robotics Research (United States)","ror":"https://ror.org/020w2fr77","country_code":"US","type":"company","lineage":["https://openalex.org/I4210116723"]},{"id":"https://openalex.org/I192545095","display_name":"United States Military Academy","ror":"https://ror.org/01jepya76","country_code":"US","type":"education","lineage":["https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I192545095","https://openalex.org/I4210088792"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael Novitzky","raw_affiliation_strings":["Robotics Research Center, United States Military Academy,West Point,NY","Robotics Research Center, United States Military Academy, West Point, NY"],"affiliations":[{"raw_affiliation_string":"Robotics Research Center, United States Military Academy,West Point,NY","institution_ids":["https://openalex.org/I192545095"]},{"raw_affiliation_string":"Robotics Research Center, United States Military Academy, West Point, NY","institution_ids":["https://openalex.org/I192545095","https://openalex.org/I4210116723"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5029166980","display_name":"Christopher Korpela","orcid":"https://orcid.org/0000-0001-6643-5291"},"institutions":[{"id":"https://openalex.org/I192545095","display_name":"United States Military Academy","ror":"https://ror.org/01jepya76","country_code":"US","type":"education","lineage":["https://openalex.org/I1304082316","https://openalex.org/I1330347796","https://openalex.org/I192545095","https://openalex.org/I4210088792"]},{"id":"https://openalex.org/I4210116723","display_name":"Robotics Research (United States)","ror":"https://ror.org/020w2fr77","country_code":"US","type":"company","lineage":["https://openalex.org/I4210116723"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christopher Korpela","raw_affiliation_strings":["Robotics Research Center, United States Military Academy,West Point,NY","Robotics Research Center, United States Military Academy, West Point, NY"],"affiliations":[{"raw_affiliation_string":"Robotics Research Center, United States Military Academy,West Point,NY","institution_ids":["https://openalex.org/I192545095"]},{"raw_affiliation_string":"Robotics Research Center, United States Military Academy, West Point, NY","institution_ids":["https://openalex.org/I192545095","https://openalex.org/I4210116723"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5080439215"],"corresponding_institution_ids":["https://openalex.org/I192545095","https://openalex.org/I4210116723"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.03983493,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"0426","last_page":"0431"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9689000248908997,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9682999849319458,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/flag","display_name":"Flag (linear algebra)","score":0.8796324729919434},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.8098798990249634},{"id":"https://openalex.org/keywords/adversary","display_name":"Adversary","score":0.7169489860534668},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5687355995178223},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5685065984725952},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.5491676926612854},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.501096248626709},{"id":"https://openalex.org/keywords/heading","display_name":"Heading (navigation)","score":0.4754495322704315},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4126773774623871},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.3508220314979553},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3467264175415039},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.26219362020492554},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.1619565486907959},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14552971720695496},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.05528557300567627}],"concepts":[{"id":"https://openalex.org/C2776730729","wikidata":"https://www.wikidata.org/wiki/Q1392130","display_name":"Flag (linear algebra)","level":3,"score":0.8796324729919434},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.8098798990249634},{"id":"https://openalex.org/C41065033","wikidata":"https://www.wikidata.org/wiki/Q2825412","display_name":"Adversary","level":2,"score":0.7169489860534668},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5687355995178223},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5685065984725952},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.5491676926612854},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.501096248626709},{"id":"https://openalex.org/C2776937971","wikidata":"https://www.wikidata.org/wiki/Q4384217","display_name":"Heading (navigation)","level":2,"score":0.4754495322704315},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4126773774623871},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.3508220314979553},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3467264175415039},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.26219362020492554},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.1619565486907959},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14552971720695496},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.05528557300567627},{"id":"https://openalex.org/C136119220","wikidata":"https://www.wikidata.org/wiki/Q1000660","display_name":"Algebra over a field","level":2,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ccwc51732.2021.9375906","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ccwc51732.2021.9375906","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE 11th Annual Computing and Communication Workshop and Conference (CCWC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Life below water","id":"https://metadata.un.org/sdg/14","score":0.5099999904632568}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1965569281","https://openalex.org/W2013798700","https://openalex.org/W2164576815","https://openalex.org/W2581869884","https://openalex.org/W2728420778","https://openalex.org/W2782624333","https://openalex.org/W2796281591","https://openalex.org/W2808470116","https://openalex.org/W2911121076","https://openalex.org/W4232866525"],"related_works":["https://openalex.org/W2324035390","https://openalex.org/W2963151310","https://openalex.org/W3175137310","https://openalex.org/W2583526987","https://openalex.org/W3034984450","https://openalex.org/W2695311495","https://openalex.org/W3139271019","https://openalex.org/W2098156551","https://openalex.org/W2122871747","https://openalex.org/W3114279067"],"abstract_inverted_index":{"This":[0,24,71,120,190],"paper":[1,25,72,121,191],"builds":[2],"on":[3,28,78,99,216],"previous":[4,156,172],"work":[5,181,213],"that":[6],"used":[7],"Q-Learning":[8],"to":[9,14,34,47,58,65,85,103,111,132,151,179,182,203,220],"teach":[10],"simulated":[11],"marine":[12],"robots":[13],"play":[15],"capture":[16,134,164,221],"the":[17,29,39,48,52,59,66,79,82,86,100,104,108,112,117,135,139,152,155,159,165,171,175,187,205,208,222],"flag":[18,106,136,153,166,223],"against":[19],"an":[20,225],"unintelligent":[21],"enemy":[22,91,105],"robot.":[23,141],"will":[26,192,214],"focus":[27,215],"improvement":[30],"of":[31,55,128,138,197,207],"reward":[32,74,129,201],"functions":[33,202],"achieve":[35,183],"two":[36,95],"goals:":[37],"make":[38],"attacking":[40,53,67,83,140,160,209],"robot":[41,54,68,84,161],"more":[42,148,199],"tactical":[43],"in":[44,146,195],"its":[45,56],"approach":[46],"flag,":[49],"and":[50,90,93,107],"rid":[51],"indifference":[57],"enemy's":[60,113],"location":[61],"(which":[62],"often":[63],"leads":[64],"being":[69],"captured).":[70],"alters":[73],"function":[75,130],"components":[76,97,131],"(dependent":[77,98],"distance":[80],"from":[81,224],"nearest":[87],"boundary,":[88],"enemy,":[89],"flag)":[92],"contributes":[94],"new":[96],"robot's":[101,109,210],"angle":[102,110],"heading,":[114],"known":[115],"as":[116,167,170],"deviation":[118],"angle).":[119],"then":[122],"trains":[123],"four":[124],"models":[125,143],"with":[126],"variations":[127],"improve":[133],"behavior":[137],"The":[142],"were":[144],"successful":[145],"finding":[147,198],"efficient":[149,200],"approaches":[150],"than":[154,186],"project,":[157],"although":[158],"did":[162],"not":[163],"many":[168],"times":[169],"project.":[173,189],"However,":[174],"findings":[176],"give":[177],"potential":[178],"follow-on":[180],"better":[184],"results":[185],"parent":[188],"be":[193],"continued":[194],"hopes":[196],"increase":[204],"intelligence":[206],"approach.":[211],"Future":[212],"teaching":[217],"multi-robot":[218],"teams":[219],"intelligent":[226],"adversary.":[227]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
