{"id":"https://openalex.org/W1980160788","doi":"https://doi.org/10.1109/bicta.2010.5645235","title":"The optimization of parallel Smith-Waterman sequence alignment using on-chip memory of GPGPU","display_name":"The optimization of parallel Smith-Waterman sequence alignment using on-chip memory of GPGPU","publication_year":2010,"publication_date":"2010-09-01","ids":{"openalex":"https://openalex.org/W1980160788","doi":"https://doi.org/10.1109/bicta.2010.5645235","mag":"1980160788"},"language":"en","primary_location":{"id":"doi:10.1109/bicta.2010.5645235","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bicta.2010.5645235","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE Fifth International Conference on Bio-Inspired Computing: Theories and Applications (BIC-TA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5119309918","display_name":"Qian Zhang","orcid":"https://orcid.org/0000-0001-5314-4233"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Qian Zhang","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085758579","display_name":"Hong An","orcid":"https://orcid.org/0000-0002-3900-3722"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hong An","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China","Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101511610","display_name":"Gu Liu","orcid":"https://orcid.org/0000-0002-2691-7867"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gu Liu","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108198361","display_name":"Wenting Han","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenting Han","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Laboratory of Computer System and Architecture, Chinese Academy and Sciences, Beijing, China","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100545080","display_name":"Yao Ping","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ping Yao","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5105868773","display_name":"Mu Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mu Xu","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100339637","display_name":"Xiaoqiang Li","orcid":"https://orcid.org/0000-0002-9526-4628"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoqiang Li","raw_affiliation_strings":["Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","Department of Computer Science and Technology, University of Science and Technology, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Department of Computer Science and Technology, University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5119309918"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":0.451,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.71066789,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"844","last_page":"850"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.934499979019165,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.9447432160377502},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.8881814479827881},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8230621814727783},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.751244306564331},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.599048376083374},{"id":"https://openalex.org/keywords/smith\u2013waterman-algorithm","display_name":"Smith\u2013Waterman algorithm","score":0.5399977564811707},{"id":"https://openalex.org/keywords/shared-memory","display_name":"Shared memory","score":0.48251959681510925},{"id":"https://openalex.org/keywords/memory-hierarchy","display_name":"Memory hierarchy","score":0.44385725259780884},{"id":"https://openalex.org/keywords/performance-improvement","display_name":"Performance improvement","score":0.42465710639953613},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.09266498684883118},{"id":"https://openalex.org/keywords/sequence-alignment","display_name":"Sequence alignment","score":0.08512258529663086}],"concepts":[{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.9447432160377502},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.8881814479827881},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8230621814727783},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.751244306564331},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.599048376083374},{"id":"https://openalex.org/C72802188","wikidata":"https://www.wikidata.org/wiki/Q1683352","display_name":"Smith\u2013Waterman algorithm","level":5,"score":0.5399977564811707},{"id":"https://openalex.org/C133875982","wikidata":"https://www.wikidata.org/wiki/Q764810","display_name":"Shared memory","level":2,"score":0.48251959681510925},{"id":"https://openalex.org/C2778100165","wikidata":"https://www.wikidata.org/wiki/Q1589327","display_name":"Memory hierarchy","level":3,"score":0.44385725259780884},{"id":"https://openalex.org/C2778915421","wikidata":"https://www.wikidata.org/wiki/Q3643177","display_name":"Performance improvement","level":2,"score":0.42465710639953613},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.09266498684883118},{"id":"https://openalex.org/C45484198","wikidata":"https://www.wikidata.org/wiki/Q827246","display_name":"Sequence alignment","level":4,"score":0.08512258529663086},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.0},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bicta.2010.5645235","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bicta.2010.5645235","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2010 IEEE Fifth International Conference on Bio-Inspired Computing: Theories and Applications (BIC-TA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1573897044","https://openalex.org/W1992851788","https://openalex.org/W2011652244","https://openalex.org/W2054227483","https://openalex.org/W2109393352","https://openalex.org/W2116508956","https://openalex.org/W2116715773","https://openalex.org/W2128022558","https://openalex.org/W2130561688","https://openalex.org/W2133540884","https://openalex.org/W2146379626","https://openalex.org/W2165949232","https://openalex.org/W2166621589","https://openalex.org/W6634426487"],"related_works":["https://openalex.org/W2274873983","https://openalex.org/W2128546436","https://openalex.org/W2972717823","https://openalex.org/W4254940814","https://openalex.org/W2594155508","https://openalex.org/W2545380179","https://openalex.org/W55660756","https://openalex.org/W3083624021","https://openalex.org/W2811273125","https://openalex.org/W2081131254"],"abstract_inverted_index":{"Memory":[0],"optimization":[1],"is":[2,21,95,103],"an":[3],"important":[4],"strategy":[5],"to":[6,74,97,142],"gain":[7],"high":[8],"performance":[9,165],"for":[10,28,130],"sequence":[11,30,78],"alignment":[12,31,79],"implemented":[13],"by":[14,81],"CUDA":[15],"on":[16,67,149,159,174],"GPGPU.":[17],"Smith-Waterman":[18,77,112],"(SW)":[19],"algorithm":[20,25],"the":[22,87],"most":[23],"sensitive":[24],"widely":[26],"used":[27,42,96,105],"local":[29],"but":[32],"very":[33],"time":[34,155],"consuming.":[35],"Although":[36],"several":[37],"parallel":[38,65,76,111,147],"methods":[39],"have":[40],"been":[41],"in":[43,107,151,169],"some":[44],"studies":[45],"and":[46,127,156,161],"shown":[47],"good":[48],"performances,":[49],"advantages":[50],"of":[51,89,110,118,153,171],"GPGPU":[52,68,150],"memory":[53,71,94,102,120,124,132],"hierarchy":[54],"are":[55],"still":[56],"not":[57],"fully":[58],"exploited.":[59],"This":[60],"paper":[61],"presents":[62],"a":[63],"new":[64],"method":[66],"using":[69],"on-chip":[70,92,119],"more":[72],"efficiently":[73],"optimize":[75],"presented":[80],"Gregory":[82],"M.":[83],"Striemer.":[84],"To":[85],"minimize":[86],"cost":[88],"data":[90],"transfers,":[91],"shared":[93],"store":[98],"intermediate":[99],"results.":[100],"Constant":[101],"also":[104],"effectively":[106],"our":[108,175],"implementation":[109],"algorithm.":[113],"Using":[114],"these":[115],"two":[116],"kinds":[117],"decreases":[121],"long":[122],"latency":[123],"access":[125],"operations,":[126],"reduces":[128],"demand":[129],"global":[131],"when":[133],"aligning":[134],"longer":[135],"sequences.":[136],"The":[137],"experimental":[138],"results":[139],"show":[140],"1.66x":[141],"3.16x":[143],"speedup":[144,158,163],"over":[145,166],"Gregory's":[146],"SW":[148,168],"terms":[152,170],"execution":[154],"19.70x":[157],"average":[160],"22.43x":[162],"peak":[164],"serial":[167],"clock":[172],"cycles":[173],"computer":[176],"platform.":[177]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2014,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
