{"id":"https://openalex.org/W4402351687","doi":"https://doi.org/10.1109/ijcnn60899.2024.10651270","title":"Task-agnostic Decision Transformer for Multi-type Agent Control with Federated Split Training","display_name":"Task-agnostic Decision Transformer for Multi-type Agent Control with Federated Split Training","publication_year":2024,"publication_date":"2024-06-30","ids":{"openalex":"https://openalex.org/W4402351687","doi":"https://doi.org/10.1109/ijcnn60899.2024.10651270"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn60899.2024.10651270","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10651270","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5115596884","display_name":"Zhiyuan Wang","orcid":"https://orcid.org/0009-0004-1401-4654"},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhiyuan Wang","raw_affiliation_strings":["Tsinghua University,Tsinghua Shenzhen International Graduate School,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Tsinghua Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084153521","display_name":"Bokui Chen","orcid":"https://orcid.org/0000-0002-4947-5619"},"institutions":[{"id":"https://openalex.org/I4210114105","display_name":"Tsinghua\u2013Berkeley Shenzhen Institute","ror":"https://ror.org/02hhwwz98","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210114105","https://openalex.org/I95457486","https://openalex.org/I99065089"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bokui Chen","raw_affiliation_strings":["Tsinghua University,Tsinghua Shenzhen International Graduate School,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Tsinghua Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101586244","display_name":"Xiaoyang Qu","orcid":"https://orcid.org/0000-0001-8353-4064"},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]},{"id":"https://openalex.org/I4401726822","display_name":"Ping An (China)","ror":"https://ror.org/004yv2z91","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726822"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyang Qu","raw_affiliation_strings":["Ping An Technology (Shenzhen) Co., Ltd.,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Ping An Technology (Shenzhen) Co., Ltd.,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380","https://openalex.org/I4401726822"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022252099","display_name":"Zhenhou Hong","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726822","display_name":"Ping An (China)","ror":"https://ror.org/004yv2z91","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726822"]},{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenhou Hong","raw_affiliation_strings":["Ping An Technology (Shenzhen) Co., Ltd.,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Ping An Technology (Shenzhen) Co., Ltd.,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380","https://openalex.org/I4401726822"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101623807","display_name":"Jing Xiao","orcid":"https://orcid.org/0000-0002-0833-5679"},"institutions":[{"id":"https://openalex.org/I4401726822","display_name":"Ping An (China)","ror":"https://ror.org/004yv2z91","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726822"]},{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Xiao","raw_affiliation_strings":["Ping An Technology (Shenzhen) Co., Ltd.,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Ping An Technology (Shenzhen) Co., Ltd.,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380","https://openalex.org/I4401726822"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5074472751","display_name":"Jianzong Wang","orcid":"https://orcid.org/0000-0002-9237-4231"},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]},{"id":"https://openalex.org/I4401726822","display_name":"Ping An (China)","ror":"https://ror.org/004yv2z91","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726822"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianzong Wang","raw_affiliation_strings":["Ping An Technology (Shenzhen) Co., Ltd.,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Ping An Technology (Shenzhen) Co., Ltd.,Shenzhen,China","institution_ids":["https://openalex.org/I4210152380","https://openalex.org/I4401726822"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5115596884"],"corresponding_institution_ids":["https://openalex.org/I4210114105","https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.12887544,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"34","issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9837999939918518,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9837999939918518,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12879","display_name":"Distributed Sensor Networks and Detection Algorithms","score":0.9661999940872192,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10791","display_name":"Advanced Control Systems Optimization","score":0.955299973487854,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7977001070976257},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.632082998752594},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5679396390914917},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.45402365922927856},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.4488334357738495},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3872980773448944},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3254232108592987},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09885945916175842},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.09489774703979492},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.08247730135917664},{"id":"https://openalex.org/keywords/systems-engineering","display_name":"Systems engineering","score":0.06579574942588806}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7977001070976257},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.632082998752594},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5679396390914917},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.45402365922927856},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.4488334357738495},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3872980773448944},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3254232108592987},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09885945916175842},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.09489774703979492},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.08247730135917664},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.06579574942588806}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn60899.2024.10651270","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/ijcnn60899.2024.10651270","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.6399999856948853,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320337986","display_name":"Tsinghua Shenzhen International Graduate School","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W2155130498","https://openalex.org/W2947150733","https://openalex.org/W2978455699","https://openalex.org/W2991355586","https://openalex.org/W3018102029","https://openalex.org/W3033324992","https://openalex.org/W3099314130","https://openalex.org/W3102626224","https://openalex.org/W3157503981","https://openalex.org/W3169291081","https://openalex.org/W3214419470","https://openalex.org/W4281663178","https://openalex.org/W4289147263","https://openalex.org/W4300427714","https://openalex.org/W4307974632","https://openalex.org/W4311607213","https://openalex.org/W4312352414","https://openalex.org/W4318619660","https://openalex.org/W4318812474","https://openalex.org/W4319778953","https://openalex.org/W4385245566","https://openalex.org/W4385644834","https://openalex.org/W4385767986","https://openalex.org/W4392902663","https://openalex.org/W6728757088","https://openalex.org/W6738383168","https://openalex.org/W6747473740","https://openalex.org/W6756436328","https://openalex.org/W6759226220","https://openalex.org/W6759238902","https://openalex.org/W6761704562","https://openalex.org/W6763704811","https://openalex.org/W6771270455","https://openalex.org/W6779265984","https://openalex.org/W6784336702","https://openalex.org/W6796289742","https://openalex.org/W6803981037","https://openalex.org/W6810745647","https://openalex.org/W6838779861","https://openalex.org/W6838931476","https://openalex.org/W6839142035","https://openalex.org/W6852609763"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4224009465","https://openalex.org/W4306674287","https://openalex.org/W4286629047","https://openalex.org/W4389443772","https://openalex.org/W4205958290","https://openalex.org/W4384212932","https://openalex.org/W2169395074","https://openalex.org/W4391019359","https://openalex.org/W3098003361"],"abstract_inverted_index":{"With":[0],"the":[1,7,19,46,68,105,111,116,168,171],"rapid":[2],"advancements":[3],"in":[4,22,122,133,157,174],"artificial":[5],"intelligence,":[6],"development":[8],"of":[9,70,119,170],"knowledgeable":[10],"and":[11,25,92,98,135,153],"personalized":[12,29,71,127],"agents":[13,30,72,97],"has":[14],"become":[15],"increasingly":[16],"prevalent.":[17],"However,":[18],"inherent":[20],"variability":[21],"state":[23],"variables":[24],"action":[26],"spaces":[27],"among":[28],"poses":[31],"significant":[32,131],"aggregation":[33],"challenges":[34],"for":[35,57,77,126,150],"traditional":[36,140],"federated":[37,123],"learning":[38,125,156,180],"algorithms.":[39],"To":[40],"tackle":[41],"these":[42],"challenges,":[43],"we":[44],"introduce":[45],"Federated":[47],"Split":[48],"Decision":[49],"Transformer":[50],"(FSDT),":[51],"an":[52],"innovative":[53],"framework":[54,64,146,173],"designed":[55],"explicitly":[56],"AI":[58],"agent":[59,186],"decision":[60,163,187],"tasks.":[61],"The":[62,144],"FSDT":[63,145,172],"excels":[65],"at":[66],"navigating":[67],"intricacies":[69],"by":[73],"harnessing":[74],"distributed":[75,177],"data":[76,81,181],"training":[78,87,142],"while":[79],"preserving":[80],"privacy.":[82],"It":[83],"employs":[84],"a":[85,99],"two-stage":[86],"process,":[88],"with":[89,130],"local":[90],"embedding":[91],"prediction":[93],"models":[94],"on":[95,104],"client":[96],"global":[100],"transformer":[101],"decoder":[102],"model":[103],"server.":[106],"Our":[107,165],"comprehensive":[108],"evaluation":[109],"using":[110],"benchmark":[112],"D4RL":[113],"dataset":[114],"highlights":[115],"superior":[117],"performance":[118],"our":[120],"algorithm":[121],"split":[124],"agents,":[128],"coupled":[129],"reductions":[132],"communication":[134],"computational":[136],"overhead":[137],"compared":[138],"to":[139,182],"centralized":[141],"approaches.":[143],"demonstrates":[147],"strong":[148],"potential":[149],"enabling":[151],"efficient":[152],"privacy-preserving":[154],"collaborative":[155],"applications":[158],"such":[159],"as":[160],"autonomous":[161],"driving":[162],"systems.":[164,188],"findings":[166],"underscore":[167],"efficacy":[169],"effectively":[175],"leveraging":[176],"offline":[178],"reinforcement":[179],"enable":[183],"powerful":[184],"multi-type":[185]},"counts_by_year":[],"updated_date":"2025-12-23T23:11:35.936235","created_date":"2025-10-10T00:00:00"}
