{"id":"https://openalex.org/W4414972673","doi":"https://doi.org/10.48550/arxiv.2510.04901","title":"Focused Skill Discovery: Learning to Control Specific State Variables while Minimizing Side Effects","display_name":"Focused Skill Discovery: Learning to Control Specific State Variables while Minimizing Side Effects","publication_year":2025,"publication_date":"2025-10-06","ids":{"openalex":"https://openalex.org/W4414972673","doi":"https://doi.org/10.48550/arxiv.2510.04901"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2510.04901","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.04901","pdf_url":"https://arxiv.org/pdf/2510.04901","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2510.04901","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Carr, Jonathan Cola\u00e7o","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Carr, Jonathan Cola\u00e7o","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Sun, Qinyi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Qinyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5061301686","display_name":"Cameron Allen","orcid":"https://orcid.org/0000-0001-9954-6684"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Allen, Cameron","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.980400025844574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.980400025844574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12884","display_name":"Educational Assessment and Pedagogy","score":0.9350000023841858,"subfield":{"id":"https://openalex.org/subfields/3304","display_name":"Education"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T14025","display_name":"Educational Technology and Assessment","score":0.907800018787384,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.6421999931335449},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6388000249862671},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.5248000025749207},{"id":"https://openalex.org/keywords/state-space","display_name":"State space","score":0.4884999990463257},{"id":"https://openalex.org/keywords/downstream","display_name":"Downstream (manufacturing)","score":0.42739999294281006},{"id":"https://openalex.org/keywords/meaning","display_name":"Meaning (existential)","score":0.35989999771118164},{"id":"https://openalex.org/keywords/transferable-skills-analysis","display_name":"Transferable skills analysis","score":0.3319999873638153}],"concepts":[{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.6421999931335449},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6388000249862671},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6097999811172485},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.5248000025749207},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5081999897956848},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.4884999990463257},{"id":"https://openalex.org/C2776207758","wikidata":"https://www.wikidata.org/wiki/Q5303302","display_name":"Downstream (manufacturing)","level":2,"score":0.42739999294281006},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40290001034736633},{"id":"https://openalex.org/C2780876879","wikidata":"https://www.wikidata.org/wiki/Q3054749","display_name":"Meaning (existential)","level":2,"score":0.35989999771118164},{"id":"https://openalex.org/C20574239","wikidata":"https://www.wikidata.org/wiki/Q7834033","display_name":"Transferable skills analysis","level":3,"score":0.3319999873638153},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.2978000044822693},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.2978000044822693},{"id":"https://openalex.org/C47932503","wikidata":"https://www.wikidata.org/wiki/Q5395689","display_name":"Error-driven learning","level":3,"score":0.295199990272522},{"id":"https://openalex.org/C182365436","wikidata":"https://www.wikidata.org/wiki/Q50701","display_name":"Variable (mathematics)","level":2,"score":0.29190000891685486},{"id":"https://openalex.org/C97082442","wikidata":"https://www.wikidata.org/wiki/Q1934361","display_name":"Skills management","level":2,"score":0.26980000734329224},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.2639999985694885},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.2547000050544739}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2510.04901","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.04901","pdf_url":"https://arxiv.org/pdf/2510.04901","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2510.04901","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.04901","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2510.04901","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.04901","pdf_url":"https://arxiv.org/pdf/2510.04901","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4414972673.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Skills":[0],"are":[1],"essential":[2],"for":[3],"unlocking":[4],"higher":[5],"levels":[6],"of":[7,58,122],"problem":[8],"solving.":[9],"A":[10],"common":[11],"approach":[12,114],"to":[13,18,30,72,77,100],"discovering":[14],"these":[15,96],"skills":[16,55,69,103,105],"is":[17,87],"learn":[19,73,101],"ones":[20],"that":[21,52,94,106],"reliably":[22],"reach":[23],"different":[24],"states,":[25],"thus":[26],"empowering":[27],"the":[28,41,53,85],"agent":[29],"control":[31,57,109],"its":[32],"environment.":[33],"However,":[34],"existing":[35],"skill":[36,97],"discovery":[37,98],"algorithms":[38,99],"often":[39],"overlook":[40],"natural":[42],"state":[43,60,111,116],"variables":[44],"present":[45],"in":[46,81,134],"many":[47],"reinforcement":[48],"learning":[49,126],"problems,":[50],"meaning":[51],"discovered":[54],"lack":[56],"specific":[59,110],"variables.":[61,112],"This":[62],"can":[63],"significantly":[64],"hamper":[65],"exploration":[66],"efficiency,":[67],"make":[68],"more":[70],"challenging":[71],"with,":[74],"and":[75,108,128],"lead":[76],"negative":[78,131],"side":[79,132],"effects":[80,133],"downstream":[82,135],"tasks":[83],"when":[84],"goal":[86],"under-specified.":[88],"We":[89],"introduce":[90],"a":[91,120],"general":[92],"method":[93],"enables":[95],"focused":[102],"--":[104],"target":[107],"Our":[113],"improves":[115],"space":[117],"coverage":[118],"by":[119],"factor":[121],"three,":[123],"unlocks":[124],"new":[125],"capabilities,":[127],"automatically":[129],"avoids":[130],"tasks.":[136]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-09T00:00:00"}
