{"id":"https://openalex.org/W7154458894","doi":"https://doi.org/10.48550/arxiv.2604.12599","title":"Beyond Pre-Training: The Full Lifecycle of Foundation Models on HPC Systems","display_name":"Beyond Pre-Training: The Full Lifecycle of Foundation Models on HPC Systems","publication_year":2026,"publication_date":"2026-04-14","ids":{"openalex":"https://openalex.org/W7154458894","doi":"https://doi.org/10.48550/arxiv.2604.12599"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.12599","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.12599","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.12599","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044457525","display_name":"D. Conciatore","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Conciatore, Dino","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057354993","display_name":"Elia Oggian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oggian, Elia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133682010","display_name":"Federico Da Forno","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Da Forno, Federico","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120403539","display_name":"Stefano Schuppli","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schuppli, Stefano","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133715423","display_name":"Jerome Tissieres","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tissieres, Jerome","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046896923","display_name":"Joost VandeVondele","orcid":"https://orcid.org/0000-0002-0902-5111"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"VandeVondele, Joost","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5040455527","display_name":"Maxime Martinasso","orcid":"https://orcid.org/0000-0003-1849-1621"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Martinasso, Maxime","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.5925999879837036,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.5925999879837036,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.09539999812841415,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.05350000038743019,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.7789999842643738},{"id":"https://openalex.org/keywords/blueprint","display_name":"Blueprint","score":0.6841999888420105},{"id":"https://openalex.org/keywords/bespoke","display_name":"Bespoke","score":0.5217000246047974},{"id":"https://openalex.org/keywords/service","display_name":"Service (business)","score":0.49320000410079956},{"id":"https://openalex.org/keywords/operationalization","display_name":"Operationalization","score":0.4846999943256378},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.43470001220703125},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.4287000000476837},{"id":"https://openalex.org/keywords/commodity","display_name":"Commodity","score":0.4108000099658966}],"concepts":[{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.7789999842643738},{"id":"https://openalex.org/C155911762","wikidata":"https://www.wikidata.org/wiki/Q422321","display_name":"Blueprint","level":2,"score":0.6841999888420105},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6502000093460083},{"id":"https://openalex.org/C44210515","wikidata":"https://www.wikidata.org/wiki/Q16968978","display_name":"Bespoke","level":2,"score":0.5217000246047974},{"id":"https://openalex.org/C2780378061","wikidata":"https://www.wikidata.org/wiki/Q25351891","display_name":"Service (business)","level":2,"score":0.49320000410079956},{"id":"https://openalex.org/C9354725","wikidata":"https://www.wikidata.org/wiki/Q286017","display_name":"Operationalization","level":2,"score":0.4846999943256378},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.47620001435279846},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.43470001220703125},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.4287000000476837},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.4165000021457672},{"id":"https://openalex.org/C2779439359","wikidata":"https://www.wikidata.org/wiki/Q317088","display_name":"Commodity","level":2,"score":0.4108000099658966},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.37540000677108765},{"id":"https://openalex.org/C2776397876","wikidata":"https://www.wikidata.org/wiki/Q1450531","display_name":"Cyberinfrastructure","level":2,"score":0.32710000872612},{"id":"https://openalex.org/C57041688","wikidata":"https://www.wikidata.org/wiki/Q220644","display_name":"Service-oriented architecture","level":3,"score":0.32670000195503235},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.31869998574256897},{"id":"https://openalex.org/C35280785","wikidata":"https://www.wikidata.org/wiki/Q559486","display_name":"System lifecycle","level":4,"score":0.29420000314712524},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.29159998893737793},{"id":"https://openalex.org/C110354214","wikidata":"https://www.wikidata.org/wiki/Q6314146","display_name":"Engineering management","level":1,"score":0.29100000858306885},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.2872999906539917},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.2777000069618225},{"id":"https://openalex.org/C2778837361","wikidata":"https://www.wikidata.org/wiki/Q2450880","display_name":"Exascale computing","level":3,"score":0.27129998803138733},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.2635999917984009},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.2565999925136566}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.12599","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.12599","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.12599","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.12599","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.6379385590553284}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large-scale":[0],"pre-training":[1,44],"of":[2,33,42,51,55,100,110],"Foundational":[3],"Models":[4],"(FM)":[5],"constitutes":[6],"a":[7,112,117,123,192],"computationally":[8,81],"intensive":[9],"first":[10,22],"phase":[11,23],"for":[12,194],"enabling":[13,195],"AI":[14,57,114,205],"across":[15],"diverse":[16],"scientific":[17,209],"and":[18,64,107,129,165,176,202,210],"societal":[19],"applications.":[20],"This":[21,102],"has":[24],"positioned":[25],"High-Performance":[26],"Computing":[27],"(HPC)":[28],"facilities":[29],"as":[30,62],"indispensable":[31],"backbones":[32],"\"Sovereign":[34],"AI\"":[35],"initiatives.":[36],"While":[37],"the":[38,47,56,105,132,159,182],"massive":[39],"throughput":[40],"requirements":[41],"FM":[43],"align":[45],"with":[46,72,147],"traditional":[48],"capability-oriented":[49],"mission":[50],"HPC,":[52],"subsequent":[53],"phases":[54,78],"lifecycle,":[58],"typically":[59],"referred":[60],"to":[61,197],"fine-tuning":[63,174],"inference,":[65],"introduce":[66],"operational":[67],"paradigms":[68],"that":[69,95,138],"can":[70],"conflict":[71],"established":[73],"batch-processing":[74],"environments.":[75],"Moreover,":[76],"these":[77],"are":[79],"not":[80],"trivial:":[82],"they":[83],"often":[84],"require":[85],"substantial":[86],"high-end":[87],"compute":[88,145],"resources":[89],"while":[90,185],"exhibiting":[91],"hardware":[92],"utilization":[93],"patterns":[94],"differ":[96],"significantly":[97],"from":[98],"those":[99],"pre-training.":[101],"paper":[103],"addresses":[104],"architectural":[106],"strategic":[108],"challenges":[109],"operationalizing":[111],"complete":[113],"lifecycle":[115],"within":[116],"national":[118],"supercomputing":[119],"facility.":[120],"We":[121,168],"present":[122],"hybrid":[124],"cloud-native":[125],"platform":[126],"being":[127],"developed":[128],"deployed":[130],"at":[131],"Swiss":[133],"National":[134],"Supercomputing":[135],"Centre":[136],"(CSCS)":[137],"combines":[139],"diskless":[140],"GPU-enabled":[141],"HPE":[142],"Cray":[143],"EX":[144],"nodes":[146],"virtualized":[148],"commodity":[149],"infrastructure.":[150],"Orchestrated":[151],"by":[152],"Kubernetes,":[153],"this":[154],"novel":[155],"service":[156],"architecture":[157],"bridges":[158],"gap":[160],"between":[161],"HPC":[162],"batch":[163],"processing":[164],"service-oriented":[166],"workflows.":[167],"report":[169],"our":[170],"initial":[171],"investigations":[172],"into":[173,207],"pipelines":[175],"highly":[177],"available":[178],"inference":[179],"services,":[180],"analyzing":[181],"associated":[183],"trade-offs":[184],"improving":[186],"user":[187],"productivity.":[188],"Our":[189],"findings":[190],"offer":[191],"blueprint":[193],"supercomputers":[196],"integrate":[198],"\"AI":[199],"Factories\"":[200],"services":[201],"workflows,":[203],"supporting":[204],"innovations":[206],"end-to-end":[208],"industrial":[211],"use":[212],"cases.":[213]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-16T00:00:00"}
