{"id":"https://openalex.org/W4360831966","doi":"https://doi.org/10.1109/hpca56546.2023.10070978","title":"NvWa: Enhancing Sequence Alignment Accelerator Throughput via Hardware Scheduling","display_name":"NvWa: Enhancing Sequence Alignment Accelerator Throughput via Hardware Scheduling","publication_year":2023,"publication_date":"2023-02-01","ids":{"openalex":"https://openalex.org/W4360831966","doi":"https://doi.org/10.1109/hpca56546.2023.10070978"},"language":"en","primary_location":{"id":"doi:10.1109/hpca56546.2023.10070978","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca56546.2023.10070978","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Symposium on High-Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063575625","display_name":"Yewen Li","orcid":"https://orcid.org/0000-0001-8406-0606"},"institutions":[{"id":"https://openalex.org/I4210133325","display_name":"Institute of Process Engineering","ror":"https://ror.org/03j4x9j18","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210133325"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yewen Li","raw_affiliation_strings":["ICT, CAS,State Key Lab of Processors","State Key Lab of Processors, ICT, CAS","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"ICT, CAS,State Key Lab of Processors","institution_ids":["https://openalex.org/I4210133325"]},{"raw_affiliation_string":"State Key Lab of Processors, ICT, CAS","institution_ids":[]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100453922","display_name":"Xueqi Li","orcid":"https://orcid.org/0000-0002-4825-6887"},"institutions":[{"id":"https://openalex.org/I4210133325","display_name":"Institute of Process Engineering","ror":"https://ror.org/03j4x9j18","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210133325"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xueqi Li","raw_affiliation_strings":["ICT, CAS,State Key Lab of Processors","State Key Lab of Processors, ICT, CAS"],"affiliations":[{"raw_affiliation_string":"ICT, CAS,State Key Lab of Processors","institution_ids":["https://openalex.org/I4210133325"]},{"raw_affiliation_string":"State Key Lab of Processors, ICT, CAS","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046028512","display_name":"Ruihao Gao","orcid":"https://orcid.org/0000-0002-0931-6672"},"institutions":[{"id":"https://openalex.org/I4210133325","display_name":"Institute of Process Engineering","ror":"https://ror.org/03j4x9j18","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210133325"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruihao Gao","raw_affiliation_strings":["ICT, CAS,State Key Lab of Processors","University of Chinese Academy of Sciences, Beijing, China","State Key Lab of Processors, ICT, CAS"],"affiliations":[{"raw_affiliation_string":"ICT, CAS,State Key Lab of Processors","institution_ids":["https://openalex.org/I4210133325"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"State Key Lab of Processors, ICT, CAS","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062446464","display_name":"Wanqi Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210133325","display_name":"Institute of Process Engineering","ror":"https://ror.org/03j4x9j18","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210133325"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wanqi Liu","raw_affiliation_strings":["ICT, CAS,State Key Lab of Processors","State Key Lab of Processors, ICT, CAS","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"ICT, CAS,State Key Lab of Processors","institution_ids":["https://openalex.org/I4210133325"]},{"raw_affiliation_string":"State Key Lab of Processors, ICT, CAS","institution_ids":[]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5104072170","display_name":"Guangming Tan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210133325","display_name":"Institute of Process Engineering","ror":"https://ror.org/03j4x9j18","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210133325"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guangming Tan","raw_affiliation_strings":["ICT, CAS,State Key Lab of Processors","University of Chinese Academy of Sciences, Beijing, China","State Key Lab of Processors, ICT, CAS"],"affiliations":[{"raw_affiliation_string":"ICT, CAS,State Key Lab of Processors","institution_ids":["https://openalex.org/I4210133325"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"State Key Lab of Processors, ICT, CAS","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5063575625"],"corresponding_institution_ids":["https://openalex.org/I4210133325","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.9543,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.74971865,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1236","last_page":"1248"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9555000066757202,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.783033549785614},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.6603349447250366},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6190222501754761},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.5986062288284302},{"id":"https://openalex.org/keywords/hardware-acceleration","display_name":"Hardware acceleration","score":0.4834824204444885},{"id":"https://openalex.org/keywords/seeding","display_name":"Seeding","score":0.4724469780921936},{"id":"https://openalex.org/keywords/schedule","display_name":"Schedule","score":0.4673210680484772},{"id":"https://openalex.org/keywords/critical-path-method","display_name":"Critical path method","score":0.44739922881126404},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3252228796482086},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.2801320552825928},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.26981139183044434},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.18035241961479187},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09566152095794678},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09373405575752258}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.783033549785614},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.6603349447250366},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6190222501754761},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.5986062288284302},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.4834824204444885},{"id":"https://openalex.org/C36248471","wikidata":"https://www.wikidata.org/wiki/Q7445669","display_name":"Seeding","level":2,"score":0.4724469780921936},{"id":"https://openalex.org/C68387754","wikidata":"https://www.wikidata.org/wiki/Q7271585","display_name":"Schedule","level":2,"score":0.4673210680484772},{"id":"https://openalex.org/C115874739","wikidata":"https://www.wikidata.org/wiki/Q825377","display_name":"Critical path method","level":2,"score":0.44739922881126404},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3252228796482086},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.2801320552825928},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.26981139183044434},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.18035241961479187},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09566152095794678},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09373405575752258},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca56546.2023.10070978","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca56546.2023.10070978","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Symposium on High-Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Affordable and clean energy","id":"https://metadata.un.org/sdg/7","score":0.8399999737739563}],"awards":[],"funders":[{"id":"https://openalex.org/F4320335768","display_name":"National Postdoctoral Program for Innovative Talents","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":72,"referenced_works":["https://openalex.org/W1573552135","https://openalex.org/W1606938841","https://openalex.org/W1983394510","https://openalex.org/W2001496424","https://openalex.org/W2006899413","https://openalex.org/W2014555481","https://openalex.org/W2031445984","https://openalex.org/W2034861439","https://openalex.org/W2039824819","https://openalex.org/W2055043387","https://openalex.org/W2087064593","https://openalex.org/W2093931624","https://openalex.org/W2103441770","https://openalex.org/W2115069592","https://openalex.org/W2128830021","https://openalex.org/W2144560237","https://openalex.org/W2146696273","https://openalex.org/W2154826966","https://openalex.org/W2158322625","https://openalex.org/W2194172909","https://openalex.org/W2319458729","https://openalex.org/W2330100020","https://openalex.org/W2515042543","https://openalex.org/W2515673159","https://openalex.org/W2577617591","https://openalex.org/W2725159389","https://openalex.org/W2741506553","https://openalex.org/W2754515634","https://openalex.org/W2788559611","https://openalex.org/W2789784730","https://openalex.org/W2789843538","https://openalex.org/W2790091177","https://openalex.org/W2883847355","https://openalex.org/W2887089575","https://openalex.org/W2889019034","https://openalex.org/W2904739694","https://openalex.org/W2928905502","https://openalex.org/W2935576241","https://openalex.org/W2942400511","https://openalex.org/W2950629094","https://openalex.org/W2966678303","https://openalex.org/W2971559821","https://openalex.org/W2979449748","https://openalex.org/W2979823675","https://openalex.org/W2981619930","https://openalex.org/W2986616285","https://openalex.org/W3013605959","https://openalex.org/W3015825547","https://openalex.org/W3017228913","https://openalex.org/W3035066704","https://openalex.org/W3042538963","https://openalex.org/W3046494740","https://openalex.org/W3099458570","https://openalex.org/W3101704407","https://openalex.org/W3105003914","https://openalex.org/W3130152469","https://openalex.org/W3158540161","https://openalex.org/W3189987728","https://openalex.org/W3193844559","https://openalex.org/W4226027979","https://openalex.org/W4232675554","https://openalex.org/W4236236547","https://openalex.org/W4241026011","https://openalex.org/W4247053599","https://openalex.org/W4252563462","https://openalex.org/W4254502766","https://openalex.org/W4281647104","https://openalex.org/W4394666350","https://openalex.org/W6674561012","https://openalex.org/W6741902625","https://openalex.org/W6744145316","https://openalex.org/W6803052005"],"related_works":["https://openalex.org/W2352942191","https://openalex.org/W2363460986","https://openalex.org/W609318495","https://openalex.org/W2376229137","https://openalex.org/W1501193936","https://openalex.org/W2262854793","https://openalex.org/W2379237800","https://openalex.org/W2760702716","https://openalex.org/W2386584920","https://openalex.org/W2532502681"],"abstract_inverted_index":{"Sequence":[0],"alignment":[1,14,43],"is":[2,70],"the":[3,8,17,28,32,36,42,47,60,80,94,97,101,104,109,128,131,150,173,185,189],"most":[4],"time-consuming":[5],"step":[6],"in":[7,41,55,123],"genome":[9],"analysis":[10],"pipeline.":[11],"Since":[12],"sequence":[13,40,62,76,175],"generally":[15],"follows":[16],"seed-and-extension":[18],"paradigm,":[19],"prior":[20],"proposed":[21],"hardware":[22,72],"accelerators":[23],"either":[24],"opt":[25],"to":[26,46,117,161,168],"accelerate":[27],"seeding":[29,95,110,121,159],"phase":[30],"or":[31,50],"seed-extension":[33,98,129,144,165],"phase.":[34],"However,":[35],"diversity":[37,81],"of":[38],"each":[39],"workflow":[44],"leads":[45],"pipeline":[48],"stall":[49],"bubbles,":[51],"which":[52,69,92,183],"finally":[53],"results":[54,194],"a":[56,71,114,179,215],"decreased":[57],"throughput":[58],"for":[59,75,172],"end-to-end":[61],"alignment.In":[63],"this":[64],"paper,":[65],"we":[66,83,112,177],"propose":[67,84,113,178],"NvWa,":[68],"scheduling":[73,87,191],"accelerator":[74],"alignment.":[77],"To":[78],"solve":[79],"problem,":[82],"three":[85],"novel":[86],"mechanisms":[88],"and":[89,100,139,157,163,188,205,223],"corresponding":[90],"architecture,":[91],"target":[93],"phase,":[96,99,111,130],"interaction":[102],"between":[103],"two":[105,151,224],"phases,":[106,152],"respectively.":[107,227],"For":[108,127],"Seeding":[115],"Scheduler":[116,133],"schedule":[118],"all":[119],"idle":[120],"units":[122],"only":[124],"one":[125],"cycle.":[126],"Extension":[132],"can":[134,198],"achieve":[135,199],"both":[136],"lower":[137],"latency":[138],"higher":[140],"parallelism":[141],"when":[142,212],"facing":[143],"tasks":[145],"with":[146,214],"different":[147],"scales.":[148],"Between":[149],"an":[153,219],"efficient":[154],"Coordinator":[155],"caches":[156],"dispatches":[158],"hits":[160],"optimal":[162],"sub-optimal":[164],"units.":[166],"Furthermore,":[167],"avoid":[169],"algorithmic":[170],"obsolescence":[171],"new":[174],"technologies,":[176],"loosely":[180],"coupled":[181],"design,":[182],"decouples":[184],"data":[186],"path":[187],"control":[190],"path.":[192],"Experimental":[193],"show":[195],"that":[196],"NvWa":[197],"493\u00d7,":[200],"200\u00d7,":[201],"12.11\u00d7,":[202],"2.30\u00d7":[203],"speedup":[204],"14.21\u00d7,":[206],"5.60\u00d7,":[207],"4.34\u00d7,":[208],"5.85\u00d7":[209],"energy":[210],"reduction":[211],"compared":[213],"16-thread":[216],"CPU":[217],"baseline,":[218],"NVIDIA":[220],"A100":[221],"GPU,":[222],"state-of-the-art":[225],"accelerators,":[226]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
