{"id":"https://openalex.org/W4385488822","doi":"https://doi.org/10.1109/ijcnn54540.2023.10191536","title":"T3S: Improving Multi-Task Reinforcement Learning with Task-Specific Feature Selector and Scheduler","display_name":"T3S: Improving Multi-Task Reinforcement Learning with Task-Specific Feature Selector and Scheduler","publication_year":2023,"publication_date":"2023-06-18","ids":{"openalex":"https://openalex.org/W4385488822","doi":"https://doi.org/10.1109/ijcnn54540.2023.10191536"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn54540.2023.10191536","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn54540.2023.10191536","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013972839","display_name":"Yuanqiang Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuanqiang Yu","raw_affiliation_strings":["College of Intelligence and Computing, Tianjin University,Tianjin,China","College of Intelligence and Computing, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University,Tianjin,China","institution_ids":["https://openalex.org/I162868743"]},{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101619771","display_name":"Tianpei Yang","orcid":"https://orcid.org/0000-0002-5497-7146"},"institutions":[{"id":"https://openalex.org/I154425047","display_name":"University of Alberta","ror":"https://ror.org/0160cpw27","country_code":"CA","type":"education","lineage":["https://openalex.org/I154425047"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Tianpei Yang","raw_affiliation_strings":["University of Alberta and Alberta Machine Intelligence Institute,Department of Computing Science,Edmonton,Canada","Department of Computing Science, University of Alberta and Alberta Machine Intelligence Institute, Edmonton, Canada"],"affiliations":[{"raw_affiliation_string":"University of Alberta and Alberta Machine Intelligence Institute,Department of Computing Science,Edmonton,Canada","institution_ids":["https://openalex.org/I154425047"]},{"raw_affiliation_string":"Department of Computing Science, University of Alberta and Alberta Machine Intelligence Institute, Edmonton, Canada","institution_ids":["https://openalex.org/I154425047"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110922112","display_name":"Yongliang Lv","orcid":null},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongliang Lv","raw_affiliation_strings":["College of Intelligence and Computing, Tianjin University,Tianjin,China","College of Intelligence and Computing, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University,Tianjin,China","institution_ids":["https://openalex.org/I162868743"]},{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084937471","display_name":"Yan Zheng","orcid":"https://orcid.org/0000-0003-2741-058X"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yan Zheng","raw_affiliation_strings":["College of Intelligence and Computing, Tianjin University,Tianjin,China","College of Intelligence and Computing, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University,Tianjin,China","institution_ids":["https://openalex.org/I162868743"]},{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045895968","display_name":"Jianye Hao","orcid":null},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianye Hao","raw_affiliation_strings":["College of Intelligence and Computing, Tianjin University,Tianjin,China","College of Intelligence and Computing, Tianjin University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University,Tianjin,China","institution_ids":["https://openalex.org/I162868743"]},{"raw_affiliation_string":"College of Intelligence and Computing, Tianjin University, Tianjin, China","institution_ids":["https://openalex.org/I162868743"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5013972839"],"corresponding_institution_ids":["https://openalex.org/I162868743"],"apc_list":null,"apc_paid":null,"fwci":0.3491,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.644883,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9811999797821045,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8454984426498413},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7947734594345093},{"id":"https://openalex.org/keywords/multi-task-learning","display_name":"Multi-task learning","score":0.6641893982887268},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.652426540851593},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6190688014030457},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5851610898971558},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.572917640209198},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.47938990592956543},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.47653278708457947},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.4609909653663635},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07571050524711609}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8454984426498413},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7947734594345093},{"id":"https://openalex.org/C28006648","wikidata":"https://www.wikidata.org/wiki/Q6934509","display_name":"Multi-task learning","level":3,"score":0.6641893982887268},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.652426540851593},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6190688014030457},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5851610898971558},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.572917640209198},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.47938990592956543},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.47653278708457947},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.4609909653663635},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07571050524711609},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn54540.2023.10191536","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn54540.2023.10191536","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W2089217417","https://openalex.org/W2145339207","https://openalex.org/W2166519220","https://openalex.org/W2187089797","https://openalex.org/W2257979135","https://openalex.org/W2296073425","https://openalex.org/W2583993537","https://openalex.org/W2809290718","https://openalex.org/W2904246096","https://openalex.org/W2963072899","https://openalex.org/W2963430933","https://openalex.org/W2963877604","https://openalex.org/W2981344907","https://openalex.org/W2991309414","https://openalex.org/W2996037775","https://openalex.org/W3000499753","https://openalex.org/W3013821552","https://openalex.org/W3087549734","https://openalex.org/W3087931390","https://openalex.org/W3093298238","https://openalex.org/W3100944043","https://openalex.org/W3106539628","https://openalex.org/W3121095832","https://openalex.org/W3126321819","https://openalex.org/W3127561923","https://openalex.org/W3176624977","https://openalex.org/W3205279237","https://openalex.org/W3209406073","https://openalex.org/W3212494843","https://openalex.org/W3213112773","https://openalex.org/W4287120375","https://openalex.org/W4293579911","https://openalex.org/W4297730607","https://openalex.org/W4298174377","https://openalex.org/W6685726866","https://openalex.org/W6703533685","https://openalex.org/W6732837357","https://openalex.org/W6740072298","https://openalex.org/W6757592117","https://openalex.org/W6769596995","https://openalex.org/W6770205404","https://openalex.org/W6771876938","https://openalex.org/W6773319185","https://openalex.org/W6775647304","https://openalex.org/W6783566936","https://openalex.org/W6796764164","https://openalex.org/W6802584362","https://openalex.org/W6802732210","https://openalex.org/W6803156713","https://openalex.org/W6864424756"],"related_works":["https://openalex.org/W2237537322","https://openalex.org/W2950678851","https://openalex.org/W4301248618","https://openalex.org/W2165343651","https://openalex.org/W2242427765","https://openalex.org/W2075830955","https://openalex.org/W2343790552","https://openalex.org/W3111398917","https://openalex.org/W4385507578","https://openalex.org/W2949157572"],"abstract_inverted_index":{"Multi-task":[0],"reinforcement":[1],"learning":[2,51,111,130],"(MTRL)":[3],"is":[4,46,119],"a":[5,17,59,75,79],"technique":[6],"to":[7,20,88,101,122],"train":[8,16],"multiple":[9],"tasks":[10,23,45,109],"simultaneously,":[11],"where":[12,115],"previous":[13],"works":[14],"usually":[15],"single":[18],"model":[19],"solve":[21,54],"different":[22],"by":[24,97],"sharing":[25],"parameters":[26,40],"across":[27,44],"various":[28,144],"tasks.":[29,147],"However,":[30],"these":[31,55],"methods":[32],"are":[33],"faced":[34],"with":[35],"inter-task":[36],"interference":[37],"since":[38],"what":[39],"should":[41],"be":[42,95],"shared":[43,99],"not":[47],"addressed,":[48],"dramatically":[49],"reducing":[50],"efficiency.":[52],"To":[53],"problems,":[56],"we":[57],"propose":[58],"novel":[60],"MTRL":[61,141],"framework":[62],"called":[63],"Task-Specific":[64],"feature":[65,76,84],"Selector":[66],"and":[67,78,128],"Scheduler":[68],"(T3S),":[69],"which":[70,93],"consists":[71],"of":[72],"two":[73,113],"components:":[74],"selector":[77],"task":[80,106,123,129],"scheduler.":[81],"Specifically,":[82],"the":[83,116,139],"selectors":[85],"employ":[86],"hypernetworks":[87],"construct":[89,102],"task-specific":[90,103],"soft":[91],"masks,":[92],"can":[94],"applied":[96],"globally":[98],"representation":[100],"features.":[104],"The":[105],"scheduler":[107],"selects":[108],"for":[110],"through":[112],"metrics,":[114],"selection":[117],"probability":[118],"inversely":[120],"proportional":[121],"progress":[124],"(e.g.,":[125],"success":[126],"rate)":[127],"speed.":[131],"Experimental":[132],"results":[133],"show":[134],"that":[135],"T3S":[136],"consistently":[137],"outperforms":[138],"state-of-the-art":[140],"algorithms":[142],"on":[143],"robotics":[145],"manipulation":[146]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
