{"id":"https://openalex.org/W7139942511","doi":"https://doi.org/10.48550/arxiv.2603.18383","title":"From Servers to Sites: Compositional Power Trace Generation of LLM Inference for Infrastructure Planning","display_name":"From Servers to Sites: Compositional Power Trace Generation of LLM Inference for Infrastructure Planning","publication_year":2026,"publication_date":"2026-03-19","ids":{"openalex":"https://openalex.org/W7139942511","doi":"https://doi.org/10.48550/arxiv.2603.18383"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.18383","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.18383","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.18383","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5087148095","display_name":"Grant Wilkins","orcid":"https://orcid.org/0000-0001-9126-0673"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wilkins, Grant","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005485274","display_name":"Fiodar Kazhamiaka","orcid":"https://orcid.org/0000-0002-0798-5151"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kazhamiaka, Fiodar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130246753","display_name":"Ram Rajagopal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rajagopal, Ram","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.6495000123977661,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.6495000123977661,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.14990000426769257,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.04699999839067459,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.7175999879837036},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.7001000046730042},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6161999702453613},{"id":"https://openalex.org/keywords/trace","display_name":"TRACE (psycholinguistics)","score":0.6050999760627747},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.5073999762535095},{"id":"https://openalex.org/keywords/capacity-planning","display_name":"Capacity planning","score":0.4916999936103821},{"id":"https://openalex.org/keywords/idle","display_name":"Idle","score":0.40880000591278076},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.4034999907016754},{"id":"https://openalex.org/keywords/data-center","display_name":"Data center","score":0.3898000121116638}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7229999899864197},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.7175999879837036},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.7001000046730042},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6161999702453613},{"id":"https://openalex.org/C75291252","wikidata":"https://www.wikidata.org/wiki/Q1315756","display_name":"TRACE (psycholinguistics)","level":2,"score":0.6050999760627747},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.5232999920845032},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.5073999762535095},{"id":"https://openalex.org/C2781007418","wikidata":"https://www.wikidata.org/wiki/Q1456934","display_name":"Capacity planning","level":2,"score":0.4916999936103821},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.45669999718666077},{"id":"https://openalex.org/C16320812","wikidata":"https://www.wikidata.org/wiki/Q1812200","display_name":"Idle","level":2,"score":0.40880000591278076},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.4034999907016754},{"id":"https://openalex.org/C153740404","wikidata":"https://www.wikidata.org/wiki/Q671224","display_name":"Data center","level":2,"score":0.3898000121116638},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.35499998927116394},{"id":"https://openalex.org/C5297727","wikidata":"https://www.wikidata.org/wiki/Q786970","display_name":"Autocorrelation","level":2,"score":0.3499999940395355},{"id":"https://openalex.org/C423512","wikidata":"https://www.wikidata.org/wiki/Q383973","display_name":"Electricity generation","level":3,"score":0.3116999864578247},{"id":"https://openalex.org/C123745756","wikidata":"https://www.wikidata.org/wiki/Q1665949","display_name":"Interconnection","level":2,"score":0.3009999990463257},{"id":"https://openalex.org/C2780898871","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Performance metric","level":2,"score":0.289000004529953},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.2863999903202057},{"id":"https://openalex.org/C180591934","wikidata":"https://www.wikidata.org/wiki/Q1253369","display_name":"Downtime","level":2,"score":0.2831999957561493},{"id":"https://openalex.org/C29852176","wikidata":"https://www.wikidata.org/wiki/Q373338","display_name":"Critical infrastructure","level":2,"score":0.26260000467300415},{"id":"https://openalex.org/C45872418","wikidata":"https://www.wikidata.org/wiki/Q5318966","display_name":"Dynamic demand","level":3,"score":0.26179999113082886},{"id":"https://openalex.org/C186370098","wikidata":"https://www.wikidata.org/wiki/Q442787","display_name":"Energy (signal processing)","level":2,"score":0.2581999897956848},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.2547000050544739},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.25380000472068787},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.25189998745918274},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.2515000104904175}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.18383","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.18383","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.18383","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.18383","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.6433407068252563,"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Datacenter":[0],"operators":[1],"and":[2,21,31,54,57,66,89,110,118,130,147,177,188],"electrical":[3],"utilities":[4,24],"rely":[5],"on":[6,61,97],"power":[7,36,76,91,112,175],"traces":[8,16,109,122,169],"at":[9,134],"different":[10],"spatiotemporal":[11],"scales.":[12],"Operators":[13],"use":[14,25],"fine-grained":[15],"for":[17,29,114,159],"provisioning,":[18],"facility":[19,58],"management,":[20],"scheduling,":[22],"while":[23,162],"site-level":[26],"load":[27,132,179],"profiles":[28,113,133],"capacity":[30],"interconnection":[32],"planning.":[33],"Existing":[34],"datacenter":[35],"models":[37],"do":[38],"not":[39],"capture":[40],"LLM":[41,74],"inference":[42,75],"workloads,":[43],"in":[44],"which":[45],"GPUs":[46],"shift":[47],"rapidly":[48],"among":[49,86],"compute-intensive":[50],"prefill,":[51],"lower-power":[52],"decode,":[53],"idle":[55],"states,":[56],"demand":[59],"depends":[60],"how":[62],"these":[63],"states":[64,88],"evolve":[65],"synchronize":[67],"across":[68],"many":[69],"devices.":[70],"We":[71],"show":[72],"that":[73,105,184],"can":[77],"be":[78],"represented":[79],"compositionally":[80],"through":[81],"two":[82],"components:":[83],"workload-driven":[84],"transitions":[85],"operating":[87],"configuration-specific":[90],"distributions":[92],"within":[93],"those":[94],"states.":[95],"Building":[96],"this":[98],"observation,":[99],"we":[100],"develop":[101],"a":[102],"trace-generation":[103],"framework":[104,151],"learns":[106],"from":[107,124],"measured":[108],"synthesizes":[111],"new":[115],"traffic":[116],"conditions":[117],"serving":[119],"configurations.":[120],"These":[121],"aggregate":[123],"GPU":[125,148],"servers":[126],"to":[127],"rack-,":[128],"row-,":[129],"facility-scale":[131],"the":[135,140],"temporal":[136,164],"granularity":[137],"required":[138],"by":[139],"study.":[141],"Across":[142],"multiple":[143],"LLMs,":[144],"tensor-parallel":[145],"settings,":[146],"generations,":[149],"our":[150],"achieves":[152],"median":[153],"absolute":[154],"energy":[155],"error":[156],"below":[157],"5%":[158],"most":[160],"configurations":[161],"preserving":[163],"autocorrelation":[165],"structure.":[166],"The":[167],"resulting":[168],"support":[170],"downstream":[171],"analyses":[172],"including":[173],"oversubscription,":[174],"modulation,":[176],"utility-facing":[178],"characterization,":[180],"enabling":[181],"infrastructure":[182],"evaluations":[183],"flat":[185],"nameplate":[186],"assumptions":[187],"static":[189],"trace":[190],"replay":[191],"cannot":[192],"support.":[193]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-21T00:00:00"}
