{"id":"https://openalex.org/W2763493608","doi":"https://doi.org/10.1109/tpds.2017.2762310","title":"A Job Sizing Strategy for High-Throughput Scientific Workflows","display_name":"A Job Sizing Strategy for High-Throughput Scientific Workflows","publication_year":2017,"publication_date":"2017-10-12","ids":{"openalex":"https://openalex.org/W2763493608","doi":"https://doi.org/10.1109/tpds.2017.2762310","mag":"2763493608"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2017.2762310","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2017.2762310","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051396274","display_name":"Benjam\u00edn Tovar","orcid":"https://orcid.org/0000-0002-5294-2281"},"institutions":[{"id":"https://openalex.org/I107639228","display_name":"University of Notre Dame","ror":"https://ror.org/00mkhxb43","country_code":"US","type":"education","lineage":["https://openalex.org/I107639228"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Benjamin Tovar","raw_affiliation_strings":["University of Notre Dame, Notre Dame, IN"],"affiliations":[{"raw_affiliation_string":"University of Notre Dame, Notre Dame, IN","institution_ids":["https://openalex.org/I107639228"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072339196","display_name":"Rafael Ferreira da Silva","orcid":"https://orcid.org/0000-0002-1720-0928"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rafael Ferreira da Silva","raw_affiliation_strings":["Information Sciences Institute, University of Southern California, Marina Del Rey, CA"],"affiliations":[{"raw_affiliation_string":"Information Sciences Institute, University of Southern California, Marina Del Rey, CA","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005056823","display_name":"Gideon Juve","orcid":null},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gideon Juve","raw_affiliation_strings":["Information Sciences Institute, University of Southern California, Marina Del Rey, CA"],"affiliations":[{"raw_affiliation_string":"Information Sciences Institute, University of Southern California, Marina Del Rey, CA","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031941569","display_name":"Ewa Deelman","orcid":"https://orcid.org/0000-0001-5106-503X"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ewa Deelman","raw_affiliation_strings":["Information Sciences Institute, University of Southern California, Marina Del Rey, CA"],"affiliations":[{"raw_affiliation_string":"Information Sciences Institute, University of Southern California, Marina Del Rey, CA","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027512179","display_name":"William Allcock","orcid":"https://orcid.org/0000-0002-7984-6847"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"William Allcock","raw_affiliation_strings":["Argonne National Laboratory, Lemont, IL"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, Lemont, IL","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007301255","display_name":"Douglas Thain","orcid":"https://orcid.org/0000-0001-5218-1956"},"institutions":[{"id":"https://openalex.org/I107639228","display_name":"University of Notre Dame","ror":"https://ror.org/00mkhxb43","country_code":"US","type":"education","lineage":["https://openalex.org/I107639228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Douglas Thain","raw_affiliation_strings":["University of Notre Dame, Notre Dame, IN"],"affiliations":[{"raw_affiliation_string":"University of Notre Dame, Notre Dame, IN","institution_ids":["https://openalex.org/I107639228"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042010270","display_name":"Miron Livny","orcid":"https://orcid.org/0000-0001-5444-7439"},"institutions":[{"id":"https://openalex.org/I135310074","display_name":"University of Wisconsin\u2013Madison","ror":"https://ror.org/01y2jtd41","country_code":"US","type":"education","lineage":["https://openalex.org/I135310074"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Miron Livny","raw_affiliation_strings":["University of Wisconsin, Madison, WI"],"affiliations":[{"raw_affiliation_string":"University of Wisconsin, Madison, WI","institution_ids":["https://openalex.org/I135310074"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5051396274"],"corresponding_institution_ids":["https://openalex.org/I107639228"],"apc_list":null,"apc_paid":null,"fwci":1.8648,"has_fulltext":false,"cited_by_count":22,"citation_normalized_percentile":{"value":0.87877889,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"29","issue":"2","first_page":"240","last_page":"253"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.8492370843887329},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8290138244628906},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.8119732737541199},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.5851532220840454},{"id":"https://openalex.org/keywords/sizing","display_name":"Sizing","score":0.5705788135528564},{"id":"https://openalex.org/keywords/resource-allocation","display_name":"Resource allocation","score":0.4820767045021057},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.42081135511398315},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.3271113634109497},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.19605693221092224},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.14495736360549927}],"concepts":[{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.8492370843887329},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8290138244628906},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.8119732737541199},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.5851532220840454},{"id":"https://openalex.org/C2777767291","wikidata":"https://www.wikidata.org/wiki/Q1080291","display_name":"Sizing","level":2,"score":0.5705788135528564},{"id":"https://openalex.org/C29202148","wikidata":"https://www.wikidata.org/wiki/Q287260","display_name":"Resource allocation","level":2,"score":0.4820767045021057},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.42081135511398315},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.3271113634109497},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.19605693221092224},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.14495736360549927},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2017.2762310","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2017.2762310","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Decent work and economic growth","score":0.6800000071525574,"id":"https://metadata.un.org/sdg/8"}],"awards":[{"id":"https://openalex.org/G5520337016","display_name":null,"funder_award_id":"ER26110","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"}],"funders":[{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320309636","display_name":"University of Minnesota","ror":"https://ror.org/03grvy078"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W180765255","https://openalex.org/W928347285","https://openalex.org/W1480875294","https://openalex.org/W1736267949","https://openalex.org/W1925464213","https://openalex.org/W1941096926","https://openalex.org/W1965168630","https://openalex.org/W1978879585","https://openalex.org/W1983046182","https://openalex.org/W2016395505","https://openalex.org/W2022642059","https://openalex.org/W2025397485","https://openalex.org/W2028141695","https://openalex.org/W2030742422","https://openalex.org/W2053341340","https://openalex.org/W2054818428","https://openalex.org/W2064959504","https://openalex.org/W2084078215","https://openalex.org/W2086126933","https://openalex.org/W2088351838","https://openalex.org/W2090388856","https://openalex.org/W2094806030","https://openalex.org/W2104998023","https://openalex.org/W2113209795","https://openalex.org/W2119352128","https://openalex.org/W2120422789","https://openalex.org/W2129542763","https://openalex.org/W2146438496","https://openalex.org/W2148317584","https://openalex.org/W2150074609","https://openalex.org/W2154983209","https://openalex.org/W2157282184","https://openalex.org/W2202483651","https://openalex.org/W2223186009","https://openalex.org/W2258432161","https://openalex.org/W2297835331","https://openalex.org/W3162118826","https://openalex.org/W4362678814","https://openalex.org/W6607303267","https://openalex.org/W6677954900","https://openalex.org/W6692071552","https://openalex.org/W6697360534"],"related_works":["https://openalex.org/W2375311683","https://openalex.org/W2366062860","https://openalex.org/W2373777250","https://openalex.org/W2353956655","https://openalex.org/W2020653254","https://openalex.org/W2010454064","https://openalex.org/W2352072014","https://openalex.org/W217279133","https://openalex.org/W2393487946","https://openalex.org/W2373310108"],"abstract_inverted_index":{"The":[0],"user":[1],"of":[2,68,70,84,148,160,162,164,171],"a":[3,8,73,92],"computing":[4],"facility":[5],"must":[6],"make":[7],"critical":[9],"decision":[10,61],"when":[11,65],"submitting":[12],"jobs":[13,71,123],"for":[14,28,94],"execution:":[15],"how":[16],"many":[17],"resources":[18,56],"(such":[19],"as":[20,108],"cores,":[21],"memory,":[22],"and":[23,104,121,144,156],"disk)":[24],"should":[25],"be":[26,58],"requested":[27],"each":[29],"job?":[30],"If":[31],"the":[32,37,46,51,96,112,141,150],"request":[33,47],"is":[34,48,62,115],"too":[35,49],"small,":[36],"job":[38,52,97],"may":[39,53,78],"fail":[40],"due":[41],"to":[42,128,133,152,175],"resource":[43,85,113],"exhaustion;":[44],"if":[45],"large,":[50],"succeed,":[54],"but":[55],"will":[57],"wasted.":[59],"This":[60],"especially":[63],"important":[64],"running":[66],"hundreds":[67,161],"thousands":[69,163],"in":[72,106,131,169],"high":[74,153],"throughput":[75,135,154,170],"workflow,":[76],"which":[77],"exhibit":[79],"complex,":[80],"long":[81],"tailed":[82],"distributions":[83],"consumption.":[86],"In":[87],"this":[88],"paper,":[89],"we":[90],"present":[91,145],"strategy":[93],"solving":[95],"sizing":[98],"problem:":[99],"(1)":[100],"applications":[101],"are":[102,124],"monitored":[103],"measured":[105],"user-space":[107],"they":[109],"run;":[110],"(2)":[111],"usage":[114],"collected":[116],"into":[117],"an":[118,167],"online":[119],"archive;":[120],"(3)":[122],"automatically":[125],"sized":[126],"according":[127],"historical":[129],"data":[130],"order":[132],"maximize":[134],"or":[136],"minimize":[137],"waste.":[138],"We":[139],"evaluate":[140],"solution":[142],"analytically,":[143],"case":[146],"studies":[147],"applying":[149],"technique":[151],"physics":[155],"bioinformatics":[157],"workflows":[158],"consisting":[159],"jobs,":[165],"demonstrating":[166],"increase":[168],"10-400":[172],"percent":[173],"compared":[174],"naive":[176],"approaches.":[177]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
