{"id":"https://openalex.org/W7125179025","doi":"https://doi.org/10.48550/arxiv.2601.11935","title":"Big Data Workload Profiling for Energy-Aware Cloud Resource Management","display_name":"Big Data Workload Profiling for Energy-Aware Cloud Resource Management","publication_year":2026,"publication_date":"2026-01-17","ids":{"openalex":"https://openalex.org/W7125179025","doi":"https://doi.org/10.48550/arxiv.2601.11935"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.11935","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.11935","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.11935","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123528531","display_name":"Milan Parikh","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Parikh, Milan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040634542","display_name":"Arun Soni","orcid":"https://orcid.org/0000-0001-8593-3229"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Soni, Aniket Abhishek","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123489547","display_name":"Sneja Mitinbhai Shah","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shah, Sneja Mitinbhai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5123473935","display_name":"Ayush Raj Jha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jha, Ayush Raj","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5123528531"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9750999808311462,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9750999808311462,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.006800000090152025,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.002199999988079071,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.8177000284194946},{"id":"https://openalex.org/keywords/workload","display_name":"Workload","score":0.7703999876976013},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.7231000065803528},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.6552000045776367},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.630299985408783},{"id":"https://openalex.org/keywords/energy-consumption","display_name":"Energy consumption","score":0.5830000042915344},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.54830002784729},{"id":"https://openalex.org/keywords/service-level-agreement","display_name":"Service-level agreement","score":0.5099999904632568}],"concepts":[{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.8177000284194946},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.7703999876976013},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7592999935150146},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.7231000065803528},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.6552000045776367},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.630299985408783},{"id":"https://openalex.org/C2780165032","wikidata":"https://www.wikidata.org/wiki/Q16869822","display_name":"Energy consumption","level":2,"score":0.5830000042915344},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.54830002784729},{"id":"https://openalex.org/C2778160497","wikidata":"https://www.wikidata.org/wiki/Q869830","display_name":"Service-level agreement","level":3,"score":0.5099999904632568},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.4749000072479248},{"id":"https://openalex.org/C25344961","wikidata":"https://www.wikidata.org/wiki/Q192726","display_name":"Virtual machine","level":2,"score":0.4569000005722046},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.45190000534057617},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.4481000006198883},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.4350999891757965},{"id":"https://openalex.org/C153740404","wikidata":"https://www.wikidata.org/wiki/Q671224","display_name":"Data center","level":2,"score":0.42899999022483826},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.39469999074935913},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3817000091075897},{"id":"https://openalex.org/C142355369","wikidata":"https://www.wikidata.org/wiki/Q7698919","display_name":"Temporal isolation among virtual machines","level":4,"score":0.34150001406669617},{"id":"https://openalex.org/C138827492","wikidata":"https://www.wikidata.org/wiki/Q6661985","display_name":"Data processing","level":2,"score":0.3131999969482422},{"id":"https://openalex.org/C181889124","wikidata":"https://www.wikidata.org/wiki/Q380204","display_name":"Service level","level":2,"score":0.2962000072002411},{"id":"https://openalex.org/C1668388","wikidata":"https://www.wikidata.org/wiki/Q1149776","display_name":"Data management","level":2,"score":0.2892000079154968},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.28290000557899475},{"id":"https://openalex.org/C175801342","wikidata":"https://www.wikidata.org/wiki/Q1988917","display_name":"Data analysis","level":2,"score":0.27810001373291016},{"id":"https://openalex.org/C520301825","wikidata":"https://www.wikidata.org/wiki/Q380170","display_name":"Energy conservation","level":2,"score":0.26269999146461487},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.26190000772476196}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.11935","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.11935","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.11935","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.11935","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.5581563115119934}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Cloud":[0],"data":[1,13,139],"centers":[2],"face":[3],"increasing":[4],"pressure":[5],"to":[6,16,43,108,112],"reduce":[7],"operational":[8],"energy":[9,29,63,104],"consumption":[10],"as":[11,125],"big":[12,138],"workloads":[14,92],"continue":[15],"grow":[17],"in":[18],"scale":[19],"and":[20,28,39,64,70,90,128],"complexity.":[21],"This":[22],"paper":[23],"presents":[24],"a":[25,95,113,126],"workload":[26,123],"aware":[27],"efficient":[30],"scheduling":[31],"framework":[32,81],"that":[33],"profiles":[34],"CPU":[35],"utilization,":[36],"memory":[37],"demand,":[38],"storage":[40],"IO":[41],"behavior":[42],"guide":[44],"virtual":[45],"machine":[46],"placement":[47],"decisions.":[48],"By":[49],"combining":[50],"historical":[51],"execution":[52],"logs":[53],"with":[54,116],"real":[55],"time":[56],"telemetry,":[57],"the":[58,62,133],"proposed":[59],"system":[60],"predicts":[61],"performance":[65,118],"impact":[66],"of":[67,106,135],"candidate":[68],"placements":[69],"enables":[71],"adaptive":[72],"consolidation":[73],"while":[74],"preserving":[75],"service":[76],"level":[77],"agreement":[78],"compliance.":[79],"The":[80],"is":[82],"evaluated":[83],"using":[84],"representative":[85],"Hadoop":[86],"MapReduce,":[87],"Spark":[88],"MLlib,":[89],"ETL":[91],"deployed":[93],"on":[94],"multi":[96],"node":[97],"cloud":[98,136],"testbed.":[99],"Experimental":[100],"results":[101],"demonstrate":[102],"consistent":[103],"savings":[105],"15":[107],"20":[109],"percent":[110],"compared":[111],"baseline":[114],"scheduler,":[115],"negligible":[117],"degradation.":[119],"These":[120],"findings":[121],"highlight":[122],"profiling":[124],"practical":[127],"scalable":[129],"strategy":[130],"for":[131],"improving":[132],"sustainability":[134],"based":[137],"processing":[140],"environments.":[141]},"counts_by_year":[],"updated_date":"2026-01-22T23:33:04.759266","created_date":"2026-01-22T00:00:00"}
