{"id":"https://openalex.org/W4409248436","doi":"https://doi.org/10.1109/hpca61900.2025.00123","title":"Marching Page Walks: Batching and Concurrent Page Table Walks for Enhancing GPU Throughput","display_name":"Marching Page Walks: Batching and Concurrent Page Table Walks for Enhancing GPU Throughput","publication_year":2025,"publication_date":"2025-03-01","ids":{"openalex":"https://openalex.org/W4409248436","doi":"https://doi.org/10.1109/hpca61900.2025.00123"},"language":"en","primary_location":{"id":"doi:10.1109/hpca61900.2025.00123","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca61900.2025.00123","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100444749","display_name":"Jiwon Lee","orcid":"https://orcid.org/0009-0009-6529-5333"},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Jiwon Lee","raw_affiliation_strings":["Yonsei University,Department of Electrical and Electronic Engineering,Seoul,Korea"],"affiliations":[{"raw_affiliation_string":"Yonsei University,Department of Electrical and Electronic Engineering,Seoul,Korea","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018121479","display_name":"Gun Ko","orcid":null},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Gun Ko","raw_affiliation_strings":["Yonsei University,Department of Electrical and Electronic Engineering,Seoul,Korea"],"affiliations":[{"raw_affiliation_string":"Yonsei University,Department of Electrical and Electronic Engineering,Seoul,Korea","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040253395","display_name":"Myung Kuk Yoon","orcid":"https://orcid.org/0000-0002-9332-0251"},"institutions":[{"id":"https://openalex.org/I138925566","display_name":"Ewha Womans University","ror":"https://ror.org/053fp5c05","country_code":"KR","type":"education","lineage":["https://openalex.org/I138925566"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Myung Kuk Yoon","raw_affiliation_strings":["Ewha Womans University,Department of Computer Science and Engineering,Seoul,Korea"],"affiliations":[{"raw_affiliation_string":"Ewha Womans University,Department of Computer Science and Engineering,Seoul,Korea","institution_ids":["https://openalex.org/I138925566"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012141172","display_name":"Ipoom Jeong","orcid":"https://orcid.org/0000-0001-7513-2858"},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Ipoom Jeong","raw_affiliation_strings":["Yonsei University,Department of System Semiconductor Engineering,Seoul,Korea"],"affiliations":[{"raw_affiliation_string":"Yonsei University,Department of System Semiconductor Engineering,Seoul,Korea","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015526090","display_name":"Yunho Oh","orcid":"https://orcid.org/0000-0001-6442-3705"},"institutions":[{"id":"https://openalex.org/I197347611","display_name":"Korea University","ror":"https://ror.org/047dqcg40","country_code":"KR","type":"education","lineage":["https://openalex.org/I197347611"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yunho Oh","raw_affiliation_strings":["Korea University,School of Electrical Engineering,Seoul,Korea"],"affiliations":[{"raw_affiliation_string":"Korea University,School of Electrical Engineering,Seoul,Korea","institution_ids":["https://openalex.org/I197347611"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017913155","display_name":"Won Woo Ro","orcid":"https://orcid.org/0000-0001-5390-6445"},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Won Woo Ro","raw_affiliation_strings":["Yonsei University,Department of Electrical and Electronic Engineering,Seoul,Korea"],"affiliations":[{"raw_affiliation_string":"Yonsei University,Department of Electrical and Electronic Engineering,Seoul,Korea","institution_ids":["https://openalex.org/I193775966"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100444749"],"corresponding_institution_ids":["https://openalex.org/I193775966"],"apc_list":null,"apc_paid":null,"fwci":4.699,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.94430447,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1662","last_page":"1677"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9905999898910522,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7462903261184692},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.6506799459457397},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6309887170791626},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.5595638751983643},{"id":"https://openalex.org/keywords/random-walk","display_name":"Random walk","score":0.5140074491500854},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.48509514331817627},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.48247984051704407},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.3429810404777527},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.170372873544693},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.14443182945251465},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12416359782218933},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.06534671783447266}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7462903261184692},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.6506799459457397},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6309887170791626},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.5595638751983643},{"id":"https://openalex.org/C121194460","wikidata":"https://www.wikidata.org/wiki/Q856741","display_name":"Random walk","level":2,"score":0.5140074491500854},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.48509514331817627},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.48247984051704407},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.3429810404777527},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.170372873544693},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.14443182945251465},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12416359782218933},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.06534671783447266},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca61900.2025.00123","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca61900.2025.00123","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":76,"referenced_works":["https://openalex.org/W1978301594","https://openalex.org/W1997162567","https://openalex.org/W2004807638","https://openalex.org/W2020733012","https://openalex.org/W2047390994","https://openalex.org/W2054095206","https://openalex.org/W2061812855","https://openalex.org/W2062430565","https://openalex.org/W2080592089","https://openalex.org/W2093828978","https://openalex.org/W2099911225","https://openalex.org/W2100926301","https://openalex.org/W2120000030","https://openalex.org/W2120715680","https://openalex.org/W2126540423","https://openalex.org/W2128120785","https://openalex.org/W2146241244","https://openalex.org/W2238595726","https://openalex.org/W2315868086","https://openalex.org/W2416722775","https://openalex.org/W2470920449","https://openalex.org/W2625932461","https://openalex.org/W2626757163","https://openalex.org/W2725159389","https://openalex.org/W2774409802","https://openalex.org/W2793599434","https://openalex.org/W2794228535","https://openalex.org/W2885000039","https://openalex.org/W2904412652","https://openalex.org/W2920870926","https://openalex.org/W2928181291","https://openalex.org/W2931925202","https://openalex.org/W2933788198","https://openalex.org/W2934021599","https://openalex.org/W2962821792","https://openalex.org/W2980066681","https://openalex.org/W3010795619","https://openalex.org/W3011261380","https://openalex.org/W3014112970","https://openalex.org/W3017225859","https://openalex.org/W3017302221","https://openalex.org/W3042526471","https://openalex.org/W3042851732","https://openalex.org/W3043023532","https://openalex.org/W3043804473","https://openalex.org/W3089681336","https://openalex.org/W3090784541","https://openalex.org/W3091730480","https://openalex.org/W3102510044","https://openalex.org/W3153491892","https://openalex.org/W3159322435","https://openalex.org/W3159945917","https://openalex.org/W3166541059","https://openalex.org/W3177916483","https://openalex.org/W3205144645","https://openalex.org/W3205535571","https://openalex.org/W3207422314","https://openalex.org/W4213250435","https://openalex.org/W4214655995","https://openalex.org/W4250481301","https://openalex.org/W4281689389","https://openalex.org/W4308083524","https://openalex.org/W4308084044","https://openalex.org/W4327930453","https://openalex.org/W4360831812","https://openalex.org/W4360831817","https://openalex.org/W4360831987","https://openalex.org/W4386763881","https://openalex.org/W4388858680","https://openalex.org/W4401211780","https://openalex.org/W4404954833","https://openalex.org/W6690740084","https://openalex.org/W6694513646","https://openalex.org/W6731837222","https://openalex.org/W6763585923","https://openalex.org/W6859297029"],"related_works":["https://openalex.org/W4399354997","https://openalex.org/W2005148983","https://openalex.org/W2012954338","https://openalex.org/W2096672917","https://openalex.org/W2392023973","https://openalex.org/W3189307731","https://openalex.org/W1428699136","https://openalex.org/W2949962288","https://openalex.org/W2364686214","https://openalex.org/W1998560227"],"abstract_inverted_index":{"Virtual":[0],"memory,":[1],"with":[2],"the":[3,22,25,40,86,131,148,167,179,218,233],"support":[4],"of":[5,24,42,48,61,67,89,114,150,221],"address":[6,163],"translation":[7,32],"hardware,":[8,33],"is":[9],"a":[10,37,59,64,74,79,82,96,112,136,142],"key":[11],"technique":[12],"in":[13,19,39,104,126,161,181],"expanding":[14],"programmability":[15],"and":[16,46,152,204,226],"memory":[17,144,211],"management":[18],"GPUs.":[20,105],"However,":[21],"nature":[23],"GPU":[26,53,154,182,228],"execution":[27],"model":[28],"heavily":[29],"pressures":[30],"its":[31],"particularly":[34],"due":[35],"to":[36,122,139,157,191],"discrepancy":[38],"behavior":[41],"page":[43,101,115,137,183,222],"table":[44,102,184],"walkers":[45,116],"thousands":[47],"concurrently":[49,158,205],"running":[50],"threads.":[51],"In":[52],"workloads,":[54],"multiple":[55,119,210],"threads":[56],"simultaneously":[57],"access":[58,159],"number":[60,66],"pages":[62,160],"necessitating":[63],"substantial":[65],"translations":[68],"whereas":[69],"each":[70],"walker":[71,138],"handles":[72,206],"only":[73],"single":[75,143],"walk":[76,90,120,189],"request":[77,145],"at":[78],"time.":[80],"Such":[81],"limitation":[83],"significantly":[84,146],"increases":[85],"queueing":[87,219],"latency":[88,220],"requests,":[91],"which":[92],"we":[93,110,129,170],"observe":[94],"as":[95],"major":[97],"bottleneck":[98],"for":[99],"servicing":[100],"walks":[103,223],"To":[106],"tackle":[107],"this":[108],"challenge,":[109],"investigate":[111],"design":[113],"that":[117,176,194,215],"facilitates":[118],"requests":[121,190,203],"be":[123,196],"handled":[124],"together":[125],"batches.":[127],"Then,":[128,199],"make":[130],"following":[132],"observations:":[133],"1)":[134],"allowing":[135],"issue":[140],"beyond":[141],"improves":[147,227],"throughput":[149],"walkers,":[151],"2)":[153],"applications":[155],"tend":[156],"wide":[162],"ranges.":[164],"By":[165],"leveraging":[166],"above":[168],"implications,":[169],"propose":[171],"Marching":[172],"Page":[173],"Walks":[174],"(MPW)":[175],"effectively":[177],"mitigate":[178],"contention":[180],"walkers.":[185],"MPW":[186,200,216],"scans":[187],"pending":[188],"identify":[192],"ones":[193],"can":[195],"grouped":[197],"together.":[198],"batches":[201],"these":[202],"them":[207],"by":[208,224,230],"issuing":[209],"instructions.":[212],"Experiments":[213],"show":[214],"reduces":[217],"86.7%":[225],"performance":[229],"55.6%":[231],"over":[232],"baseline":[234],"design.":[235]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
