{"id":"https://openalex.org/W3132589907","doi":"https://doi.org/10.1109/tetci.2021.3132365","title":"Annotating Motion Primitives for Simplifying Action Search in Reinforcement Learning","display_name":"Annotating Motion Primitives for Simplifying Action Search in Reinforcement Learning","publication_year":2022,"publication_date":"2022-01-07","ids":{"openalex":"https://openalex.org/W3132589907","doi":"https://doi.org/10.1109/tetci.2021.3132365","mag":"3132589907"},"language":"en","primary_location":{"id":"doi:10.1109/tetci.2021.3132365","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tetci.2021.3132365","pdf_url":null,"source":{"id":"https://openalex.org/S4210210251","display_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","issn_l":"2471-285X","issn":["2471-285X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049310005","display_name":"Isaac J. Sledge","orcid":"https://orcid.org/0000-0002-7755-5886"},"institutions":[{"id":"https://openalex.org/I1320354487","display_name":"Target (United States)","ror":"https://ror.org/05mkyac79","country_code":"US","type":"company","lineage":["https://openalex.org/I1320354487"]},{"id":"https://openalex.org/I2802287952","display_name":"Naval Surface Warfare Center","ror":"https://ror.org/03d4ecn10","country_code":"US","type":"facility","lineage":["https://openalex.org/I1328969757","https://openalex.org/I1330347796","https://openalex.org/I2802287952","https://openalex.org/I3130687028"]},{"id":"https://openalex.org/I4210121626","display_name":"Signal Processing (United States)","ror":"https://ror.org/021gzyw51","country_code":"US","type":"company","lineage":["https://openalex.org/I4210121626"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Isaac J. Sledge","raw_affiliation_strings":["Advanced Signal Processing and Automated Target Recognition Branch, Naval Surface Warfare Center, Panama City, FL, USA"],"affiliations":[{"raw_affiliation_string":"Advanced Signal Processing and Automated Target Recognition Branch, Naval Surface Warfare Center, Panama City, FL, USA","institution_ids":["https://openalex.org/I2802287952","https://openalex.org/I4210121626","https://openalex.org/I1320354487"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085463907","display_name":"Darshan Bryner","orcid":"https://orcid.org/0000-0003-4987-9274"},"institutions":[{"id":"https://openalex.org/I1320354487","display_name":"Target (United States)","ror":"https://ror.org/05mkyac79","country_code":"US","type":"company","lineage":["https://openalex.org/I1320354487"]},{"id":"https://openalex.org/I2802287952","display_name":"Naval Surface Warfare Center","ror":"https://ror.org/03d4ecn10","country_code":"US","type":"facility","lineage":["https://openalex.org/I1328969757","https://openalex.org/I1330347796","https://openalex.org/I2802287952","https://openalex.org/I3130687028"]},{"id":"https://openalex.org/I4210121626","display_name":"Signal Processing (United States)","ror":"https://ror.org/021gzyw51","country_code":"US","type":"company","lineage":["https://openalex.org/I4210121626"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Darshan W. Bryner","raw_affiliation_strings":["Advanced Signal Processing and Automated Target Recognition Branch, Naval Surface Warfare Center, Panama City, FL, USA"],"affiliations":[{"raw_affiliation_string":"Advanced Signal Processing and Automated Target Recognition Branch, Naval Surface Warfare Center, Panama City, FL, USA","institution_ids":["https://openalex.org/I2802287952","https://openalex.org/I4210121626","https://openalex.org/I1320354487"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019504861","display_name":"Jos\u00e9 C. Pr\u0131\u0301ncipe","orcid":"https://orcid.org/0000-0002-3449-3531"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jose C. Principe","raw_affiliation_strings":["Department of Electrical and Computer Engineering, and the Department of Biomedical Engineering, University of Florida, Gainesville, FL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, and the Department of Biomedical Engineering, University of Florida, Gainesville, FL, USA","institution_ids":["https://openalex.org/I33213144"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5049310005"],"corresponding_institution_ids":["https://openalex.org/I1320354487","https://openalex.org/I2802287952","https://openalex.org/I4210121626"],"apc_list":null,"apc_paid":null,"fwci":0.5104,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.61855086,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"6","issue":"5","first_page":"1137","last_page":"1156"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8035507202148438},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7999874949455261},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6997202634811401},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6391144394874573},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5818435549736023},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5203582644462585},{"id":"https://openalex.org/keywords/kinematics","display_name":"Kinematics","score":0.4776819348335266},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.46951907873153687},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4531635344028473},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.419574111700058}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8035507202148438},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7999874949455261},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6997202634811401},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6391144394874573},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5818435549736023},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5203582644462585},{"id":"https://openalex.org/C39920418","wikidata":"https://www.wikidata.org/wiki/Q11476","display_name":"Kinematics","level":2,"score":0.4776819348335266},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.46951907873153687},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4531635344028473},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.419574111700058},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tetci.2021.3132365","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tetci.2021.3132365","pdf_url":null,"source":{"id":"https://openalex.org/S4210210251","display_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","issn_l":"2471-285X","issn":["2471-285X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.46000000834465027,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G1713947010","display_name":null,"funder_award_id":"N00014-19-WX-00636","funder_id":"https://openalex.org/F4320337345","funder_display_name":"Office of Naval Research"}],"funders":[{"id":"https://openalex.org/F4320337345","display_name":"Office of Naval Research","ror":"https://ror.org/00rk2pe57"},{"id":"https://openalex.org/F4320337644","display_name":"Naval Sea Systems Command","ror":"https://ror.org/03dm1p143"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":100,"referenced_works":["https://openalex.org/W45528431","https://openalex.org/W157898781","https://openalex.org/W1487322600","https://openalex.org/W1539716820","https://openalex.org/W1592847719","https://openalex.org/W1814494663","https://openalex.org/W1950788856","https://openalex.org/W1965524806","https://openalex.org/W1976126972","https://openalex.org/W1983364832","https://openalex.org/W1985415289","https://openalex.org/W1994529670","https://openalex.org/W2004030284","https://openalex.org/W2007206727","https://openalex.org/W2008775992","https://openalex.org/W2010399676","https://openalex.org/W2015186727","https://openalex.org/W2017611213","https://openalex.org/W2022760091","https://openalex.org/W2025415230","https://openalex.org/W2025632878","https://openalex.org/W2036930518","https://openalex.org/W2037694098","https://openalex.org/W2062429977","https://openalex.org/W2063346060","https://openalex.org/W2078765782","https://openalex.org/W2079247031","https://openalex.org/W2089619576","https://openalex.org/W2091791686","https://openalex.org/W2096691069","https://openalex.org/W2097412577","https://openalex.org/W2098339052","https://openalex.org/W2100657858","https://openalex.org/W2106996050","https://openalex.org/W2108535023","https://openalex.org/W2111693792","https://openalex.org/W2114451917","https://openalex.org/W2116931983","https://openalex.org/W2118686230","https://openalex.org/W2121863487","https://openalex.org/W2122319321","https://openalex.org/W2123513798","https://openalex.org/W2124017786","https://openalex.org/W2125074935","https://openalex.org/W2125340118","https://openalex.org/W2129418188","https://openalex.org/W2134042548","https://openalex.org/W2134197408","https://openalex.org/W2135658380","https://openalex.org/W2135997697","https://openalex.org/W2136853139","https://openalex.org/W2136917337","https://openalex.org/W2137766593","https://openalex.org/W2141494606","https://openalex.org/W2141559645","https://openalex.org/W2142194269","https://openalex.org/W2142203883","https://openalex.org/W2150147323","https://openalex.org/W2150555551","https://openalex.org/W2153947321","https://openalex.org/W2155027007","https://openalex.org/W2156094778","https://openalex.org/W2157286417","https://openalex.org/W2164276476","https://openalex.org/W2172131460","https://openalex.org/W2172207578","https://openalex.org/W2173758409","https://openalex.org/W2594564328","https://openalex.org/W2749028154","https://openalex.org/W2765699677","https://openalex.org/W2787471386","https://openalex.org/W2896405912","https://openalex.org/W2962717849","https://openalex.org/W2963021451","https://openalex.org/W2963199420","https://openalex.org/W2963611966","https://openalex.org/W2963876278","https://openalex.org/W2963935758","https://openalex.org/W3009585715","https://openalex.org/W3101477643","https://openalex.org/W3105659172","https://openalex.org/W3142970622","https://openalex.org/W4214717370","https://openalex.org/W4312108234","https://openalex.org/W6676557315","https://openalex.org/W6676772908","https://openalex.org/W6677826109","https://openalex.org/W6678545291","https://openalex.org/W6680171673","https://openalex.org/W6680235470","https://openalex.org/W6680307681","https://openalex.org/W6680313055","https://openalex.org/W6682802936","https://openalex.org/W6683204974","https://openalex.org/W6684863604","https://openalex.org/W6718190810","https://openalex.org/W6740879895","https://openalex.org/W6741977017","https://openalex.org/W6847727672","https://openalex.org/W7075606714"],"related_works":["https://openalex.org/W2468279273","https://openalex.org/W2354198838","https://openalex.org/W1989130879","https://openalex.org/W2103419012","https://openalex.org/W2988126442","https://openalex.org/W1974414866","https://openalex.org/W2789522126","https://openalex.org/W2066693961","https://openalex.org/W2063982682","https://openalex.org/W2768698792"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,174,188],"in":[2,17,120,131],"large-scale":[3],"environments":[4],"is":[5,191,211],"challenging":[6],"due":[7],"to":[8,137,180,204,219],"the":[9,32,36,64,73,99,116,139,202,217,232],"many":[10],"possible":[11],"actions":[12,47,69],"that":[13,62,172,206,224],"can":[14,75,215],"be":[15,76],"taken":[16,48],"specific":[18],"situations.":[19],"We":[20,104,127,169],"have":[21,60],"previously":[22],"developed":[23],"a":[24,50,54,90,108,134,142],"means":[25,95],"of":[26,38,45,56,96,118,145],"constraining,":[27],"and":[28,68,93,102,155,200],"hence":[29],"speeding":[30],"up,":[31],"search":[33,74],"process":[34],"through":[35,107],"use":[37,128],"motion":[39,41,65,81,122,154,194],"primitives;":[40],"primitives":[42,82,140,161,195],"are":[43,70],"sequences":[44,123],"pre-specified":[46],"across":[49],"state":[51],"series.":[52],"As":[53],"byproduct":[55],"this":[57,106,129],"work,":[58],"we":[59,88,151],"found":[61],"if":[63],"primitives\u2019":[66],"motions":[67,101],"labeled,":[71],"then":[72],"sped":[77],"up":[78],"further.":[79],"Since":[80],"may":[83],"initially":[84],"lack":[85],"such":[86],"details,":[87],"propose":[89],"theoretically":[91],"viewpoint-insensitive":[92],"speed-insensitive":[94],"automatically":[97],"annotating":[98],"underlying":[100],"actions.":[103],"do":[105,225],"differential-geometric,":[109],"spatio-temporal":[110],"kinematics":[111],"descriptor,":[112],"which":[113],"analyzes":[114],"how":[115],"poses":[117],"entities":[119],"two":[121],"change":[124],"over":[125],"time.":[126],"descriptor":[130],"conjunction":[132],"with":[133,162],"weighted-nearest-neighbor":[135],"classifier":[136],"label":[138],"using":[141,175],"limited":[143],"set":[144],"training":[146,167],"examples.":[147],"In":[148],"our":[149],"experiments,":[150],"achieve":[152],"high":[153],"action":[156,222,233],"annotation":[157],"rates":[158],"for":[159],"human-action-derived":[160],"as":[163,165],"few":[164],"one":[166],"sample.":[168],"also":[170,212],"demonstrate":[171],"reinforcement":[173,187],"accurately":[176],"labeled":[177],"trajectories":[178],"leads":[179],"high-performing":[181],"policies":[182],"more":[183],"quickly":[184],"than":[185],"standard":[186],"techniques.":[189],"This":[190],"partly":[192],"because":[193,213],"encode":[196],"prior":[197],"domain":[198],"knowledge":[199,207],"preempt":[201],"need":[203],"re-discover":[205],"during":[208],"training.":[209],"It":[210],"agents":[214],"leverage":[216],"labels":[218],"systematically":[220],"ignore":[221],"classes":[223],"not":[226],"facilitate":[227],"task":[228],"objectives,":[229],"thereby":[230],"reducing":[231],"space.":[234]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
