{"id":"https://openalex.org/W4401806183","doi":"https://doi.org/10.1109/access.2024.3449072","title":"Multi-Task Reinforcement Learning Based on Parallel Recombination Networks","display_name":"Multi-Task Reinforcement Learning Based on Parallel Recombination Networks","publication_year":2024,"publication_date":"2024-08-23","ids":{"openalex":"https://openalex.org/W4401806183","doi":"https://doi.org/10.1109/access.2024.3449072"},"language":"en","primary_location":{"id":"doi:10.1109/access.2024.3449072","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3449072","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2024.3449072","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083012464","display_name":"Manlu Liu","orcid":"https://orcid.org/0000-0003-2503-8817"},"institutions":[{"id":"https://openalex.org/I1297991670","display_name":"Southwest University of Science and Technology","ror":"https://ror.org/04d996474","country_code":"CN","type":"education","lineage":["https://openalex.org/I1297991670"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Manlu Liu","raw_affiliation_strings":["School of Information Engineering, Southwest University of Science and Technology, Mianyang, China","chool of Information Engineering, Southwest University of Science and Technology, Mian Yang, China"],"raw_orcid":"https://orcid.org/0000-0003-2503-8817","affiliations":[{"raw_affiliation_string":"School of Information Engineering, Southwest University of Science and Technology, Mianyang, China","institution_ids":["https://openalex.org/I1297991670"]},{"raw_affiliation_string":"chool of Information Engineering, Southwest University of Science and Technology, Mian Yang, China","institution_ids":["https://openalex.org/I1297991670"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102903790","display_name":"Qingbo Zhang","orcid":"https://orcid.org/0000-0002-7751-4443"},"institutions":[{"id":"https://openalex.org/I1297991670","display_name":"Southwest University of Science and Technology","ror":"https://ror.org/04d996474","country_code":"CN","type":"education","lineage":["https://openalex.org/I1297991670"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingbo Zhang","raw_affiliation_strings":["School of Information Engineering, Southwest University of Science and Technology, Mianyang, China","chool of Information Engineering, Southwest University of Science and Technology, Mian Yang, China"],"raw_orcid":"https://orcid.org/0000-0002-7751-4443","affiliations":[{"raw_affiliation_string":"School of Information Engineering, Southwest University of Science and Technology, Mianyang, China","institution_ids":["https://openalex.org/I1297991670"]},{"raw_affiliation_string":"chool of Information Engineering, Southwest University of Science and Technology, Mian Yang, China","institution_ids":["https://openalex.org/I1297991670"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035459203","display_name":"Weimin Qian","orcid":null},"institutions":[{"id":"https://openalex.org/I1297991670","display_name":"Southwest University of Science and Technology","ror":"https://ror.org/04d996474","country_code":"CN","type":"education","lineage":["https://openalex.org/I1297991670"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weimin Qian","raw_affiliation_strings":["School of Information Engineering, Southwest University of Science and Technology, Mianyang, China","chool of Information Engineering, Southwest University of Science and Technology, Mian Yang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Information Engineering, Southwest University of Science and Technology, Mianyang, China","institution_ids":["https://openalex.org/I1297991670"]},{"raw_affiliation_string":"chool of Information Engineering, Southwest University of Science and Technology, Mian Yang, China","institution_ids":["https://openalex.org/I1297991670"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5083012464"],"corresponding_institution_ids":["https://openalex.org/I1297991670"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14189319,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"13","issue":null,"first_page":"80113","last_page":"80122"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T14225","display_name":"Advanced Sensor and Control Systems","score":0.7587000131607056,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T14225","display_name":"Advanced Sensor and Control Systems","score":0.7587000131607056,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13832","display_name":"Advanced Decision-Making Techniques","score":0.6675000190734863,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14474","display_name":"Industrial Technology and Control Systems","score":0.6401000022888184,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.779992401599884},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6737989783287048},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5817073583602905},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.47583794593811035},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32377296686172485},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.12413892149925232},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09443780779838562}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.779992401599884},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6737989783287048},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5817073583602905},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.47583794593811035},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32377296686172485},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.12413892149925232},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09443780779838562},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2024.3449072","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3449072","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:9c67e8b4169047d58e68c821685a3653","is_oa":true,"landing_page_url":"https://doaj.org/article/9c67e8b4169047d58e68c821685a3653","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 13, Pp 80113-80122 (2025)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2024.3449072","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3449072","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4228831696","display_name":null,"funder_award_id":"24ycx2019","funder_id":"https://openalex.org/F4320322559","funder_display_name":"Southwest University of Science and Technology"},{"id":"https://openalex.org/G5041081093","display_name":null,"funder_award_id":"22zx7164","funder_id":"https://openalex.org/F4320322559","funder_display_name":"Southwest University of Science and Technology"}],"funders":[{"id":"https://openalex.org/F4320322559","display_name":"Southwest University of Science and Technology","ror":"https://ror.org/04d996474"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W2158782408","https://openalex.org/W2910668273","https://openalex.org/W2913340405","https://openalex.org/W2963216850","https://openalex.org/W2967167513","https://openalex.org/W2973262547","https://openalex.org/W3038822267","https://openalex.org/W3100789280","https://openalex.org/W3141797743","https://openalex.org/W3165566836","https://openalex.org/W3210258147","https://openalex.org/W4293566197","https://openalex.org/W4323338424","https://openalex.org/W4362650413","https://openalex.org/W4376269829","https://openalex.org/W4386285856","https://openalex.org/W4387358066","https://openalex.org/W4391093797","https://openalex.org/W4391770177","https://openalex.org/W4394911033","https://openalex.org/W4394937440","https://openalex.org/W4399074796","https://openalex.org/W4399928162","https://openalex.org/W6684921986","https://openalex.org/W6740879895","https://openalex.org/W6747473740","https://openalex.org/W6748648269","https://openalex.org/W6749966379","https://openalex.org/W6754610480","https://openalex.org/W6762717864","https://openalex.org/W6769596995","https://openalex.org/W6770205404","https://openalex.org/W6771876938","https://openalex.org/W6775647304","https://openalex.org/W6778826543","https://openalex.org/W6779247072","https://openalex.org/W6790190981"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588"],"abstract_inverted_index":{"Multi-task":[0],"Reinforcement":[1],"learning":[2,28,94],"is":[3,24,120,178],"a":[4,20,59,117,159,162],"key":[5],"current":[6,171,176],"trend":[7],"in":[8,29,49,95,104,185,228],"the":[9,39,50,82,87,90,105,125,133,145,155,166,170,175,182,188,194,202,210,215,220],"field":[10],"of":[11,41,86,92,135,230],"reinforcement":[12],"learning.":[13],"It":[14],"can":[15,66],"accomplish":[16],"multiple":[17],"tasks":[18,48,102,148],"using":[19],"single":[21],"network,":[22],"which":[23,65,122,180],"superior":[25],"to":[26,43,76],"single-task":[27],"integrating":[30],"information":[31,69,83],"from":[32,149],"different":[33],"tasks.":[34],"However,":[35],"uncertainty":[36],"remains":[37],"on":[38,209],"issue":[40],"how":[42],"effectively":[44],"share":[45,67],"parameters":[46],"across":[47,70],"network.":[51,88,164,191],"To":[52],"address":[53],"this":[54,56,96],"problem,":[55],"paper":[57,97],"proposes":[58],"\u2019soft":[60],"parallel":[61,150,189],"recombination":[62,151,190],"network\u2019":[63],"approach,":[64],"task":[68,130,160],"network":[71,119],"layers":[72],"without":[73],"being":[74,138],"limited":[75],"between":[77,147,169],"adjacent":[78],"layers,":[79],"thus":[80],"enhancing":[81],"sharing":[84],"capability":[85],"Specifically,":[89],"types":[91],"multi-task":[93,212],"include":[98],"various":[99],"manipulator":[100],"control":[101],"executed":[103],"Meta-world":[106,211],"environment,":[107],"such":[108],"as":[109],"pick-and-place,":[110],"push,":[111],"and":[112,131,153,174,206,233],"stacking.":[113],"For":[114],"optimal":[115,126,156],"performance,":[116],"weight":[118,163,167],"introduced":[121],"automatically":[123],"determines":[124,154],"path":[127,157],"for":[128,158],"each":[129,136],"outputs":[132],"probability":[134],"module":[137],"selected.":[139],"The":[140],"proposed":[141,195,221],"method":[142,200,222],"efficiently":[143],"learns":[144],"relationships":[146],"networks":[152],"through":[161],"Further,":[165],"relationship":[168],"training":[172,183,213],"samples":[173],"strategy":[177],"found,":[179],"improves":[181],"efficiency":[184,232],"combination":[186],"with":[187,201],"By":[192],"combining":[193],"\u2019Soft":[196],"Parallel":[197],"Recombination":[198],"Network\u2019":[199],"SAC":[203],"algorithm":[204],"(PRSAC)":[205],"validating":[207],"it":[208],"platform,":[214],"experimental":[216],"results":[217],"demonstrate":[218],"that":[219],"significantly":[223],"outperforms":[224],"existing":[225],"baseline":[226],"algorithms":[227],"terms":[229],"sample":[231],"performance.":[234]},"counts_by_year":[],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
