{"id":"https://openalex.org/W4394923534","doi":"https://doi.org/10.1145/3627703.3650083","title":"ScheMoE: An Extensible Mixture-of-Experts Distributed Training System with Tasks Scheduling","display_name":"ScheMoE: An Extensible Mixture-of-Experts Distributed Training System with Tasks Scheduling","publication_year":2024,"publication_date":"2024-04-18","ids":{"openalex":"https://openalex.org/W4394923534","doi":"https://doi.org/10.1145/3627703.3650083"},"language":"en","primary_location":{"id":"doi:10.1145/3627703.3650083","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3627703.3650083","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Nineteenth European Conference on Computer Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016836702","display_name":"Shaohuai Shi","orcid":"https://orcid.org/0000-0002-1418-5160"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shaohuai Shi","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016665007","display_name":"Xinglin Pan","orcid":"https://orcid.org/0000-0002-1172-9935"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xinglin Pan","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou)"],"affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou)","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018867983","display_name":"Qiang Wang","orcid":"https://orcid.org/0000-0002-2986-967X"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiang Wang","raw_affiliation_strings":["Harbin Institute of Technology, Shenzhen"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology, Shenzhen","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027626597","display_name":"Chengjian Liu","orcid":"https://orcid.org/0000-0002-0103-4670"},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengjian Liu","raw_affiliation_strings":["Shenzhen Technology University"],"affiliations":[{"raw_affiliation_string":"Shenzhen Technology University","institution_ids":["https://openalex.org/I4210152380"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079912837","display_name":"Xiaozhe Ren","orcid":"https://orcid.org/0000-0002-0432-5510"},"institutions":[{"id":"https://openalex.org/I4210108585","display_name":"Central Research Institute","ror":"https://ror.org/01wnfae18","country_code":"IN","type":"facility","lineage":["https://openalex.org/I4210108585"]},{"id":"https://openalex.org/I4210160618","display_name":"Huawei Technologies (United Kingdom)","ror":"https://ror.org/056gzgs71","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210160618"]}],"countries":["GB","IN"],"is_corresponding":false,"raw_author_name":"Xiaozhe Ren","raw_affiliation_strings":["Huawei Central Research Institute, Huawei Technologies"],"affiliations":[{"raw_affiliation_string":"Huawei Central Research Institute, Huawei Technologies","institution_ids":["https://openalex.org/I4210160618","https://openalex.org/I4210108585"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075481740","display_name":"Zhongzhe Hu","orcid":"https://orcid.org/0000-0002-6708-3942"},"institutions":[{"id":"https://openalex.org/I4210108585","display_name":"Central Research Institute","ror":"https://ror.org/01wnfae18","country_code":"IN","type":"facility","lineage":["https://openalex.org/I4210108585"]},{"id":"https://openalex.org/I4210160618","display_name":"Huawei Technologies (United Kingdom)","ror":"https://ror.org/056gzgs71","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210160618"]}],"countries":["GB","IN"],"is_corresponding":false,"raw_author_name":"Zhongzhe Hu","raw_affiliation_strings":["Huawei Central Research Institute, Huawei Technologies"],"affiliations":[{"raw_affiliation_string":"Huawei Central Research Institute, Huawei Technologies","institution_ids":["https://openalex.org/I4210160618","https://openalex.org/I4210108585"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095771100","display_name":"Yu Yang","orcid":"https://orcid.org/0009-0001-1544-956X"},"institutions":[{"id":"https://openalex.org/I4210108585","display_name":"Central Research Institute","ror":"https://ror.org/01wnfae18","country_code":"IN","type":"facility","lineage":["https://openalex.org/I4210108585"]},{"id":"https://openalex.org/I4210160618","display_name":"Huawei Technologies (United Kingdom)","ror":"https://ror.org/056gzgs71","country_code":"GB","type":"company","lineage":["https://openalex.org/I2250955327","https://openalex.org/I4210160618"]}],"countries":["GB","IN"],"is_corresponding":false,"raw_author_name":"Yu Yang","raw_affiliation_strings":["Huawei Central Research Institute, Huawei Technologies"],"affiliations":[{"raw_affiliation_string":"Huawei Central Research Institute, Huawei Technologies","institution_ids":["https://openalex.org/I4210160618","https://openalex.org/I4210108585"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060171629","display_name":"Bo Li","orcid":"https://orcid.org/0000-0003-2955-750X"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Bo Li","raw_affiliation_strings":["The Hong Kong University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100730785","display_name":"Xiaowen Chu","orcid":"https://orcid.org/0000-0001-9745-4372"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Xiaowen Chu","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou) and The Hong Kong University of Science and Technology"],"affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou) and The Hong Kong University of Science and Technology","institution_ids":["https://openalex.org/I200769079"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5016836702"],"corresponding_institution_ids":["https://openalex.org/I204983213"],"apc_list":null,"apc_paid":null,"fwci":4.9857,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.9627061,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"236","last_page":"249"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9865000247955322,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10444","display_name":"Context-Aware Activity Recognition Systems","score":0.9793000221252441,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8514467477798462},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.6631209850311279},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.5459094047546387},{"id":"https://openalex.org/keywords/extensibility","display_name":"Extensibility","score":0.49737098813056946},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.4869907796382904},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1424953043460846},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.10664153099060059}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8514467477798462},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.6631209850311279},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.5459094047546387},{"id":"https://openalex.org/C32833848","wikidata":"https://www.wikidata.org/wiki/Q4115054","display_name":"Extensibility","level":2,"score":0.49737098813056946},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4869907796382904},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1424953043460846},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.10664153099060059},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3627703.3650083","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3627703.3650083","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Nineteenth European Conference on Computer Systems","raw_type":"proceedings-article"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-138573","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-138573","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Conference paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W1566289585","https://openalex.org/W2018346931","https://openalex.org/W2052440657","https://openalex.org/W2257408573","https://openalex.org/W2595551253","https://openalex.org/W2734941459","https://openalex.org/W2963786636","https://openalex.org/W2969388332","https://openalex.org/W2975712713","https://openalex.org/W3043278179","https://openalex.org/W3081168214","https://openalex.org/W3119866685","https://openalex.org/W3193250980","https://openalex.org/W3204998121","https://openalex.org/W3214578629","https://openalex.org/W4220838824","https://openalex.org/W4220967350","https://openalex.org/W4226079124","https://openalex.org/W4287121196","https://openalex.org/W4287391717","https://openalex.org/W4310282800","https://openalex.org/W4318541692","https://openalex.org/W4321636575","https://openalex.org/W4364382874","https://openalex.org/W4376652719","https://openalex.org/W4386260498","https://openalex.org/W4386396242","https://openalex.org/W6796487566","https://openalex.org/W6810737565"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W1948607442","https://openalex.org/W3004004161","https://openalex.org/W2044615423","https://openalex.org/W4247766898","https://openalex.org/W4244765761","https://openalex.org/W2361584951","https://openalex.org/W2364420803"],"abstract_inverted_index":{"In":[0,76],"recent":[1],"years,":[2],"large-scale":[3],"models":[4,112],"can":[5],"be":[6,41,114],"easily":[7],"scaled":[8],"to":[9,40,44,113],"trillions":[10],"of":[11,57,140],"parameters":[12],"with":[13,92],"sparsely":[14],"activated":[15],"mixture-of-experts":[16],"(MoE),":[17],"which":[18,89,128],"significantly":[19],"improves":[20],"the":[21,37,67,104,162],"model":[22],"quality":[23],"while":[24,148],"only":[25],"requiring":[26],"a":[27,45,98,158],"sub-linear":[28],"increase":[29],"in":[30,64,109,116],"computational":[31],"costs.":[32],"However,":[33],"MoE":[34,65,85,111,170],"layers":[35],"require":[36],"input":[38],"data":[39,58,145],"dynamically":[42],"routed":[43],"particular":[46],"GPU":[47,74],"for":[48],"computing":[49],"during":[50],"distributed":[51],"training.":[52],"The":[53],"highly":[54],"dynamic":[55],"property":[56],"routing":[59],"and":[60,83,106,132,144,161,173],"high":[61],"communication":[62,105],"costs":[63],"make":[66],"training":[68,86,110],"system":[69],"low":[70],"scaling":[71],"efficiency":[72],"on":[73,157],"clusters.":[75],"this":[77],"work,":[78],"we":[79],"propose":[80],"an":[81,117],"extensible":[82],"efficient":[84],"system,":[87],"ScheMoE,":[88],"is":[90],"equipped":[91],"several":[93],"features.":[94],"1)":[95],"ScheMoE":[96,121,136,166],"provides":[97],"generic":[99],"scheduling":[100,151],"framework":[101],"that":[102,165],"allows":[103],"computation":[107],"tasks":[108],"scheduled":[115],"optimal":[118],"way.":[119],"2)":[120],"integrates":[122],"our":[123,150],"proposed":[124],"novel":[125],"all-to-all":[126,142],"collective":[127],"better":[129],"utilizes":[130],"intra-":[131],"inter-connect":[133],"bandwidths.":[134],"3)":[135],"supports":[137],"easy":[138],"extensions":[139],"customized":[141],"collectives":[143],"compression":[146],"approaches":[147],"enjoying":[149],"algorithm.":[152],"Extensive":[153],"experiments":[154],"are":[155],"conducted":[156],"32-GPU":[159],"cluster":[160],"results":[163],"show":[164],"outperforms":[167],"existing":[168],"state-of-the-art":[169],"systems,":[171],"Tutel":[172],"Faster-MoE,":[174],"by":[175],"9%-30%.":[176]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":16},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
