{"id":"https://openalex.org/W2511318867","doi":"https://doi.org/10.1145/2967938.2967947","title":"OAWS","display_name":"OAWS","publication_year":2016,"publication_date":"2016-08-31","ids":{"openalex":"https://openalex.org/W2511318867","doi":"https://doi.org/10.1145/2967938.2967947","mag":"2511318867"},"language":"en","primary_location":{"id":"doi:10.1145/2967938.2967947","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2967938.2967947","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2016 International Conference on Parallel Architectures and Compilation","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5115602018","display_name":"Bin Wang","orcid":"https://orcid.org/0000-0001-7665-6290"},"institutions":[{"id":"https://openalex.org/I82497590","display_name":"Auburn University","ror":"https://ror.org/02v80fc35","country_code":"US","type":"education","lineage":["https://openalex.org/I82497590"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Bin Wang","raw_affiliation_strings":["Auburn University, Auburn, AL, USA"],"affiliations":[{"raw_affiliation_string":"Auburn University, Auburn, AL, USA","institution_ids":["https://openalex.org/I82497590"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100513379","display_name":"Yue Zhu","orcid":"https://orcid.org/0009-0009-2273-5618"},"institutions":[{"id":"https://openalex.org/I103163165","display_name":"Florida State University","ror":"https://ror.org/05g3dte14","country_code":"US","type":"education","lineage":["https://openalex.org/I103163165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yue Zhu","raw_affiliation_strings":["Florida State University, Tallahassee, FL, USA"],"affiliations":[{"raw_affiliation_string":"Florida State University, Tallahassee, FL, USA","institution_ids":["https://openalex.org/I103163165"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070216261","display_name":"Weikuan Yu","orcid":"https://orcid.org/0000-0002-8754-0311"},"institutions":[{"id":"https://openalex.org/I103163165","display_name":"Florida State University","ror":"https://ror.org/05g3dte14","country_code":"US","type":"education","lineage":["https://openalex.org/I103163165"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Weikuan Yu","raw_affiliation_strings":["Florida State University, Tallahassee, FL, USA"],"affiliations":[{"raw_affiliation_string":"Florida State University, Tallahassee, FL, USA","institution_ids":["https://openalex.org/I103163165"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5115602018"],"corresponding_institution_ids":["https://openalex.org/I82497590"],"apc_list":null,"apc_paid":null,"fwci":4.0994,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.94132029,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"45","last_page":"55"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8552024960517883},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.675636887550354},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6030459403991699},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.5748957395553589},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.5306940078735352},{"id":"https://openalex.org/keywords/performance-improvement","display_name":"Performance improvement","score":0.4112946689128876},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.33469223976135254},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.33085644245147705}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8552024960517883},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.675636887550354},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6030459403991699},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.5748957395553589},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.5306940078735352},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.4112946689128876},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.33469223976135254},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.33085644245147705},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2967938.2967947","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2967938.2967947","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2016 International Conference on Parallel Architectures and Compilation","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2987797212","display_name":null,"funder_award_id":"1340947","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G3248119133","display_name":null,"funder_award_id":"1059376","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G3393734607","display_name":null,"funder_award_id":"1564647","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G339692774","display_name":null,"funder_award_id":"1561041","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320313710","display_name":"Menzies School of Health Research","ror":"https://ror.org/006mbby82"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W1971421905","https://openalex.org/W1979527452","https://openalex.org/W2008115889","https://openalex.org/W2012303498","https://openalex.org/W2020572638","https://openalex.org/W2027806965","https://openalex.org/W2033486618","https://openalex.org/W2047060659","https://openalex.org/W2048441570","https://openalex.org/W2050710108","https://openalex.org/W2051688423","https://openalex.org/W2053744175","https://openalex.org/W2060087084","https://openalex.org/W2062527253","https://openalex.org/W2067441262","https://openalex.org/W2079038734","https://openalex.org/W2080592089","https://openalex.org/W2084309410","https://openalex.org/W2090584832","https://openalex.org/W2096661534","https://openalex.org/W2098505406","https://openalex.org/W2109432325","https://openalex.org/W2128120785","https://openalex.org/W2129817042","https://openalex.org/W2142444503","https://openalex.org/W2149234156","https://openalex.org/W2155503253","https://openalex.org/W2155568054","https://openalex.org/W2163820265","https://openalex.org/W2168921806","https://openalex.org/W2169880332","https://openalex.org/W2252393321","https://openalex.org/W2254138160","https://openalex.org/W2273440736","https://openalex.org/W2327201404","https://openalex.org/W3148394109","https://openalex.org/W4237024478","https://openalex.org/W4240221132"],"related_works":["https://openalex.org/W2152099439","https://openalex.org/W1984163603","https://openalex.org/W3130422087","https://openalex.org/W2787993192","https://openalex.org/W3004195166","https://openalex.org/W1563139915","https://openalex.org/W2885669284","https://openalex.org/W4301184821","https://openalex.org/W2126310295","https://openalex.org/W2004686618"],"abstract_inverted_index":{"We":[0,60],"have":[1,61],"closely":[2],"examined":[3],"GPU":[4,15],"resource":[5],"utilization":[6],"when":[7],"executing":[8],"memory-intensive":[9],"benchmarks.":[10],"Our":[11,100],"detailed":[12],"analysis":[13],"of":[14,28,35,75,78,86,129],"global":[16],"memory":[17,39,44,63,80,106],"accesses":[18],"reveals":[19],"that":[20,69,90,123],"divergent":[21,79],"loads":[22],"can":[23,70,104],"lead":[24],"to":[25,138],"the":[26,57,73,84,97,124,139],"occlusion":[27,40],"Load-Store":[29],"units,":[30],"resulting":[31],"in":[32],"quick":[33],"consumption":[34],"MSHR":[36,76,93,98,112],"entries.":[37],"Such":[38],"prevents":[41],"other":[42],"ready":[43],"instructions":[45],"from":[46],"accessing":[47],"L1":[48],"data":[49],"cache,":[50],"eventually":[51],"stalling":[52],"warp":[53],"schedulers":[54],"and":[55,82,108,126,133,149,154],"degrading":[56],"overall":[58],"performance.":[59],"designed":[62],"Occlusion":[64],"Aware":[65],"Warp":[66],"Scheduling":[67],"(OAWS)":[68],"dynamically":[71],"predict":[72],"demand":[74],"entries":[77,113],"instructions,":[81],"maximize":[83],"number":[85],"concurrent":[87],"warps":[88],"such":[89],"their":[91],"aggregate":[92],"consumptions":[94],"are":[95],"within":[96],"capacity.":[99],"dynamic":[101,127,144],"OAWS":[102,130,145],"policy":[103],"prevent":[105],"occlusions":[107],"effectively":[109],"leverage":[110],"more":[111],"for":[114,118],"better":[115],"IPC":[116],"performance":[117,135],"GPU.":[119],"Experimental":[120],"results":[121],"show":[122],"static":[125],"versions":[128],"achieve":[131],"36.7%":[132],"73.1%":[134],"improvement,":[136],"compared":[137],"baseline":[140],"GTO":[141],"scheduling.":[142],"Particularly,":[143],"outperforms":[146],"MASCAR,":[147],"CCWS,":[148],"SWL-Best":[150],"by":[151],"70.1%,":[152],"57.8%,":[153],"11.4%,":[155],"respectively.":[156]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":10},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2016-09-16T00:00:00"}
