{"id":"https://openalex.org/W7154139261","doi":"https://doi.org/10.1109/ojcoms.2026.3683080","title":"OMLSched: Computation-Driven Flow Scheduling for Optical Machine Learning Training Clusters","display_name":"OMLSched: Computation-Driven Flow Scheduling for Optical Machine Learning Training Clusters","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7154139261","doi":"https://doi.org/10.1109/ojcoms.2026.3683080"},"language":"en","primary_location":{"id":"doi:10.1109/ojcoms.2026.3683080","is_oa":true,"landing_page_url":"https://doi.org/10.1109/ojcoms.2026.3683080","pdf_url":null,"source":{"id":"https://openalex.org/S4210202420","display_name":"IEEE Open Journal of the Communications Society","issn_l":"2644-125X","issn":["2644-125X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310316002","host_organization_name":"IEEE Communications Society","host_organization_lineage":["https://openalex.org/P4310316002","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Communications Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Open Journal of the Communications Society","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/ojcoms.2026.3683080","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001549734","display_name":"Qiaojun Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qiaojun Hu","raw_affiliation_strings":["School of Electronic Engineering, Beijing University of Posts and Telecommunications (BUPT), Beijing, China"],"raw_orcid":"https://orcid.org/0009-0008-3723-2186","affiliations":[{"raw_affiliation_string":"School of Electronic Engineering, Beijing University of Posts and Telecommunications (BUPT), Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Wei Wang","orcid":"https://orcid.org/0000-0002-0503-2816"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Wang","raw_affiliation_strings":["School of Electronic Engineering, Beijing University of Posts and Telecommunications (BUPT), Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-0503-2816","affiliations":[{"raw_affiliation_string":"School of Electronic Engineering, Beijing University of Posts and Telecommunications (BUPT), Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133548401","display_name":"Xiaoyu Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210130112","display_name":"China Academy of Information and Communications Technology","ror":"https://ror.org/038dte259","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210130112","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyu Wang","raw_affiliation_strings":["CTTL, China Academy of Information and Communications Technology, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"CTTL, China Academy of Information and Communications Technology, Beijing, China","institution_ids":["https://openalex.org/I4210130112"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yajie Li","orcid":"https://orcid.org/0000-0002-8751-7947"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yajie Li","raw_affiliation_strings":["School of Electronic Engineering, Beijing University of Posts and Telecommunications (BUPT), Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-8751-7947","affiliations":[{"raw_affiliation_string":"School of Electronic Engineering, Beijing University of Posts and Telecommunications (BUPT), Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yongli Zhao","orcid":"https://orcid.org/0000-0003-3716-8248"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongli Zhao","raw_affiliation_strings":["School of Electronic Engineering, Beijing University of Posts and Telecommunications (BUPT), Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-3716-8248","affiliations":[{"raw_affiliation_string":"School of Electronic Engineering, Beijing University of Posts and Telecommunications (BUPT), Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101500619","display_name":"Yanxia Tan","orcid":"https://orcid.org/0000-0003-0541-5275"},"institutions":[{"id":"https://openalex.org/I6507939","display_name":"China United Network Communications Group (China)","ror":"https://ror.org/028w99c90","country_code":"CN","type":"company","lineage":["https://openalex.org/I6507939"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanxia Tan","raw_affiliation_strings":["Broadband Network Research Laboratory, China Unicom Research Institute, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Broadband Network Research Laboratory, China Unicom Research Institute, Beijing, China","institution_ids":["https://openalex.org/I6507939"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5133486405","display_name":"Jie Zhang","orcid":"https://orcid.org/0000-0001-7750-2197"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Zhang","raw_affiliation_strings":["School of Electronic Engineering, Beijing University of Posts and Telecommunications (BUPT), Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-7750-2197","affiliations":[{"raw_affiliation_string":"School of Electronic Engineering, Beijing University of Posts and Telecommunications (BUPT), Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5001549734"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":{"value":1750,"currency":"USD","value_usd":1750},"apc_paid":{"value":1750,"currency":"USD","value_usd":1750},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.76532464,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"7","issue":null,"first_page":"4100","last_page":"4111"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.2289000004529953,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12611","display_name":"Neural Networks and Reservoir Computing","score":0.2289000004529953,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.19439999759197235,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.061500001698732376,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.5340999960899353},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.49309998750686646},{"id":"https://openalex.org/keywords/optical-flow","display_name":"Optical flow","score":0.3521000146865845},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.32089999318122864},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.28999999165534973}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6509000062942505},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5382999777793884},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.5340999960899353},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.49309998750686646},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45509999990463257},{"id":"https://openalex.org/C155542232","wikidata":"https://www.wikidata.org/wiki/Q736111","display_name":"Optical flow","level":3,"score":0.3521000146865845},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.32089999318122864},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.28999999165534973},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.27059999108314514},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.26010000705718994}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/ojcoms.2026.3683080","is_oa":true,"landing_page_url":"https://doi.org/10.1109/ojcoms.2026.3683080","pdf_url":null,"source":{"id":"https://openalex.org/S4210202420","display_name":"IEEE Open Journal of the Communications Society","issn_l":"2644-125X","issn":["2644-125X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310316002","host_organization_name":"IEEE Communications Society","host_organization_lineage":["https://openalex.org/P4310316002","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Communications Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Open Journal of the Communications Society","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:1b17f48bcc3c435ea4c6935181dc1bc9","is_oa":true,"landing_page_url":"https://doaj.org/article/1b17f48bcc3c435ea4c6935181dc1bc9","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Open Journal of the Communications Society, Vol 7, Pp 4100-4111 (2026)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/ojcoms.2026.3683080","is_oa":true,"landing_page_url":"https://doi.org/10.1109/ojcoms.2026.3683080","pdf_url":null,"source":{"id":"https://openalex.org/S4210202420","display_name":"IEEE Open Journal of the Communications Society","issn_l":"2644-125X","issn":["2644-125X"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310316002","host_organization_name":"IEEE Communications Society","host_organization_lineage":["https://openalex.org/P4310316002","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Communications Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Open Journal of the Communications Society","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5162505927","display_name":null,"funder_award_id":"2023YFF0612901","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0,166],"AI":[1],"model":[2,109],"size":[3],"and":[4,48,72,130,158,181],"the":[5,14,35,39,45,110,139,144,154],"amount":[6],"of":[7,17,37,156,176],"training":[8,46,179],"data":[9],"have":[10],"increased":[11],"dramatically,":[12],"causing":[13],"computing":[15,31],"power":[16,32],"one":[18],"single":[19],"GPU":[20,76,111,184],"to":[21,56,60,100,137],"be":[22],"insufficient.":[23],"Although":[24],"distributed":[25],"machine":[26],"learning":[27],"(DML)":[28],"can":[29,172],"enhance":[30],"by":[33],"increasing":[34],"number":[36],"GPUs,":[38],"communication":[40],"overhead":[41],"between":[42],"GPUs":[43],"limits":[44],"speed":[47,180],"utilization.":[49],"Optical":[50],"circuit":[51],"switches":[52],"(OCSes)":[53],"are":[54,65,98],"used":[55],"construct":[57],"ML":[58,83,116,149],"clusters":[59],"speedup":[61],"DML,":[62],"but":[63],"there":[64],"also":[66],"problems":[67],"such":[68],"as":[69],"port":[70],"constraints":[71],"reconfiguration":[73],"delay.":[74],"While":[75],"utilization":[77,112,185],"remains":[78],"a":[79],"critical":[80],"metric":[81],"for":[82,91,147],"service":[84],"providers,":[85],"existing":[86,161],"schedulers":[87],"lack":[88],"explicit":[89],"optimization":[90,113],"this":[92,105],"objective.":[93],"Therefore,":[94],"refined":[95],"scheduling":[96,162],"strategies":[97],"required":[99],"overcome":[101],"hardware":[102],"limitations.":[103],"In":[104],"paper,":[106],"we":[107,152],"formally":[108],"problem":[114],"in":[115,164,178,183],"clusters,":[117],"establish":[118],"its":[119],"relationship":[120],"with":[121],"job":[122],"scheduling.":[123],"We":[124],"propose":[125],"both":[126],"ILP-based":[127],"optimal":[128],"solutions":[129],"practical":[131],"heuristic-based":[132],"online":[133],"scheduler":[134],"called":[135],"OMLSched":[136,157,171],"schedule":[138],"DML":[140],"jobs":[141],"while":[142],"minimizing":[143],"inter-job":[145],"contention":[146],"optical":[148],"clusters.":[150],"Finally,":[151],"evaluate":[153],"performance":[155,174],"several":[159],"other":[160],"methods":[163],"simulations.":[165],"simulation":[167],"results":[168],"show":[169],"that":[170],"achieve":[173],"improvements":[175],"48%":[177],"28%":[182],"respectively.":[186]},"counts_by_year":[],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2026-04-14T00:00:00"}
