{"id":"https://openalex.org/W4411725354","doi":"https://doi.org/10.1109/iscas56072.2025.11044158","title":"LLM Training Workload IO Characteristics","display_name":"LLM Training Workload IO Characteristics","publication_year":2025,"publication_date":"2025-05-25","ids":{"openalex":"https://openalex.org/W4411725354","doi":"https://doi.org/10.1109/iscas56072.2025.11044158"},"language":"en","primary_location":{"id":"doi:10.1109/iscas56072.2025.11044158","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscas56072.2025.11044158","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Symposium on Circuits and Systems (ISCAS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5081338858","display_name":"Kiran Gunnam","orcid":"https://orcid.org/0000-0001-7219-7234"},"institutions":[{"id":"https://openalex.org/I11912373","display_name":"Micron (United States)","ror":"https://ror.org/02fv52296","country_code":"US","type":"company","lineage":["https://openalex.org/I11912373"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kiran Gunnam","raw_affiliation_strings":["Micron Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Micron Technology","institution_ids":["https://openalex.org/I11912373"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5118664044","display_name":"Alex Mohandas","orcid":null},"institutions":[{"id":"https://openalex.org/I11912373","display_name":"Micron (United States)","ror":"https://ror.org/02fv52296","country_code":"US","type":"company","lineage":["https://openalex.org/I11912373"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alex Mohandas","raw_affiliation_strings":["Micron Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Micron Technology","institution_ids":["https://openalex.org/I11912373"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5118664045","display_name":"Mahesh Kumar Dhote","orcid":null},"institutions":[{"id":"https://openalex.org/I11912373","display_name":"Micron (United States)","ror":"https://ror.org/02fv52296","country_code":"US","type":"company","lineage":["https://openalex.org/I11912373"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mahesh Kumar Dhote","raw_affiliation_strings":["Micron Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Micron Technology","institution_ids":["https://openalex.org/I11912373"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Rajesh Bhagwat","orcid":null},"institutions":[{"id":"https://openalex.org/I11912373","display_name":"Micron (United States)","ror":"https://ror.org/02fv52296","country_code":"US","type":"company","lineage":["https://openalex.org/I11912373"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rajesh Bhagwat","raw_affiliation_strings":["Micron Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Micron Technology","institution_ids":["https://openalex.org/I11912373"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020446417","display_name":"Ponna Darshan","orcid":null},"institutions":[{"id":"https://openalex.org/I11912373","display_name":"Micron (United States)","ror":"https://ror.org/02fv52296","country_code":"US","type":"company","lineage":["https://openalex.org/I11912373"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Darshan P","raw_affiliation_strings":["Micron Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Micron Technology","institution_ids":["https://openalex.org/I11912373"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5118664046","display_name":"Kanaiah Kothalikar","orcid":null},"institutions":[{"id":"https://openalex.org/I11912373","display_name":"Micron (United States)","ror":"https://ror.org/02fv52296","country_code":"US","type":"company","lineage":["https://openalex.org/I11912373"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kanaiah Kothalikar","raw_affiliation_strings":["Micron Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Micron Technology","institution_ids":["https://openalex.org/I11912373"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.14804633,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.6233000159263611,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13382","display_name":"Robotics and Automated Systems","score":0.6233000159263611,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.7893591523170471},{"id":"https://openalex.org/keywords/workload","display_name":"Workload","score":0.7798734307289124},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6938685178756714},{"id":"https://openalex.org/keywords/aeronautics","display_name":"Aeronautics","score":0.35050496459007263},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.19291162490844727},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.121641606092453},{"id":"https://openalex.org/keywords/meteorology","display_name":"Meteorology","score":0.06507563591003418}],"concepts":[{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.7893591523170471},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.7798734307289124},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6938685178756714},{"id":"https://openalex.org/C178802073","wikidata":"https://www.wikidata.org/wiki/Q8421","display_name":"Aeronautics","level":1,"score":0.35050496459007263},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.19291162490844727},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.121641606092453},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.06507563591003418},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iscas56072.2025.11044158","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscas56072.2025.11044158","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Symposium on Circuits and Systems (ISCAS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W2150230714","https://openalex.org/W2961595369","https://openalex.org/W3037960858","https://openalex.org/W3155243801","https://openalex.org/W3173778203","https://openalex.org/W4283363061","https://openalex.org/W4321636578","https://openalex.org/W4389519530","https://openalex.org/W4390579167","https://openalex.org/W4399794472","https://openalex.org/W4400772129","https://openalex.org/W4402494106"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2000785801","https://openalex.org/W986318368","https://openalex.org/W2384410913","https://openalex.org/W2352878646","https://openalex.org/W2004734601","https://openalex.org/W2287264064","https://openalex.org/W2130149817"],"abstract_inverted_index":{"Deep":[0],"learning":[1],"models,":[2,59],"especially":[3],"large":[4],"language":[5],"models":[6],"(LLMs),":[7],"demand":[8],"significant":[9],"computational":[10],"resources":[11],"for":[12,81,167,181,189,210,216],"training.":[13],"To":[14],"optimize":[15],"performance":[16],"and":[17,23,50,57,63,75,79,85,91,159,172,192,194],"resource":[18],"allocation,":[19],"understanding":[20],"memory":[21,83],"utilization":[22],"I/O":[24,140],"characteristics":[25,161],"during":[26,162],"LLM":[27,164],"training":[28,44,120,131,214],"is":[29,179],"essential.":[30],"In":[31],"our":[32,52],"study,":[33],"we":[34,108,195],"explore":[35],"the":[36,43,110,148,152,163,173,208,211],"impact":[37,111,130],"of":[38,45,112,144,151,155,175],"SSD":[39,158],"storage":[40],"technologies":[41],"on":[42,65,119],"a":[46,66,168],"BERT":[47],"(Encoder-Based)":[48],"model":[49,77],"extend":[51],"findings":[53],"to":[54,73,104,128,138,157,202],"other":[55],"encoder":[56],"decoder-based":[58],"including":[60],"GPT-Falcon,":[61],"RoBERTa,":[62],"GPT-2,":[64],"GPU":[67,170],"setup.":[68,183],"We":[69],"utilize":[70],"regular":[71,100],"checkpoints":[72],"analyzing":[74],"saving":[76],"state":[78],"parameters":[80],"accessing":[82],"usage":[84],"assess":[86],"write":[87],"bandwidth":[88,93],"(for":[89,94],"checkpointing)":[90],"read":[92],"restore":[95],"operation":[96],"as":[97,99],"well":[98],"traffic":[101,156],"data":[102],"ingestion)":[103],"identify":[105],"bottlenecks.":[106],"Additionally,":[107],"investigated":[109],"different":[113,153],"Logical":[114],"Block":[115],"Addressing":[116],"(LBA)":[117],"sizes":[118],"characteristics.":[121],"The":[122,142],"synchronous":[123],"checkpointing":[124],"process":[125],"was":[126],"found":[127],"significantly":[129],"time,":[132],"particularly":[133],"with":[134],"smaller":[135],"sizes,":[136],"due":[137],"frequent":[139],"operations.":[141],"contribution":[143],"this":[145,177,198],"paper":[146],"includes":[147],"systematic":[149],"study":[150,178,185,199],"types":[154],"their":[160],"pre-training":[165],"phase":[166],"single":[169],"setup":[171],"analysis":[174],"how":[176],"applicable":[180],"multi-GPU":[182],"This":[184],"offers":[186],"valuable":[187],"insights":[188],"both":[190],"practitioners":[191],"researchers,":[193],"hope":[196],"that":[197],"will":[200],"lead":[201],"additional":[203],"future":[204],"work":[205],"in":[206],"improving":[207],"SSDs":[209],"large-scale":[212],"distributed":[213],"systems":[215],"LLMs.":[217]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
