{"id":"https://openalex.org/W4385585436","doi":"https://doi.org/10.1109/ipdpsw59300.2023.00037","title":"An Efficient Parallel Sketch-based Algorithm for Mapping Long Reads to Contigs","display_name":"An Efficient Parallel Sketch-based Algorithm for Mapping Long Reads to Contigs","publication_year":2023,"publication_date":"2023-05-01","ids":{"openalex":"https://openalex.org/W4385585436","doi":"https://doi.org/10.1109/ipdpsw59300.2023.00037"},"language":"en","primary_location":{"id":"doi:10.1109/ipdpsw59300.2023.00037","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdpsw59300.2023.00037","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Parallel and Distributed Processing Symposium Workshops (IPDPSW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102943780","display_name":"Tazin Rahman","orcid":"https://orcid.org/0009-0001-8469-0234"},"institutions":[{"id":"https://openalex.org/I72951846","display_name":"Washington State University","ror":"https://ror.org/05dk0ce17","country_code":"US","type":"education","lineage":["https://openalex.org/I72951846"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Tazin Rahman","raw_affiliation_strings":["Washington State University,Pullman,USA","Washington State University, Pullman, USA"],"affiliations":[{"raw_affiliation_string":"Washington State University,Pullman,USA","institution_ids":["https://openalex.org/I72951846"]},{"raw_affiliation_string":"Washington State University, Pullman, USA","institution_ids":["https://openalex.org/I72951846"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054749460","display_name":"Oieswarya Bhowmik","orcid":"https://orcid.org/0009-0005-0041-9914"},"institutions":[{"id":"https://openalex.org/I72951846","display_name":"Washington State University","ror":"https://ror.org/05dk0ce17","country_code":"US","type":"education","lineage":["https://openalex.org/I72951846"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Oieswarya Bhowmik","raw_affiliation_strings":["Washington State University,Pullman,USA","Washington State University, Pullman, USA"],"affiliations":[{"raw_affiliation_string":"Washington State University,Pullman,USA","institution_ids":["https://openalex.org/I72951846"]},{"raw_affiliation_string":"Washington State University, Pullman, USA","institution_ids":["https://openalex.org/I72951846"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048410309","display_name":"Ananth Kalyanaraman","orcid":"https://orcid.org/0000-0001-6721-233X"},"institutions":[{"id":"https://openalex.org/I72951846","display_name":"Washington State University","ror":"https://ror.org/05dk0ce17","country_code":"US","type":"education","lineage":["https://openalex.org/I72951846"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ananth Kalyanaraman","raw_affiliation_strings":["Washington State University,Pullman,USA","Washington State University, Pullman, USA"],"affiliations":[{"raw_affiliation_string":"Washington State University,Pullman,USA","institution_ids":["https://openalex.org/I72951846"]},{"raw_affiliation_string":"Washington State University, Pullman, USA","institution_ids":["https://openalex.org/I72951846"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102943780"],"corresponding_institution_ids":["https://openalex.org/I72951846"],"apc_list":null,"apc_paid":null,"fwci":0.7962,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.7337,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"157","last_page":"166"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11048","display_name":"Bacteriophages and microbial interactions","score":0.9872000217437744,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.749767005443573},{"id":"https://openalex.org/keywords/contig","display_name":"Contig","score":0.7339286804199219},{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.6340608596801758},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5073477625846863},{"id":"https://openalex.org/keywords/sequence-assembly","display_name":"Sequence assembly","score":0.5051751732826233},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.5020394325256348},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.4584069550037384},{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.2603442966938019},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.25571614503860474},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.10349833965301514}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.749767005443573},{"id":"https://openalex.org/C59582021","wikidata":"https://www.wikidata.org/wiki/Q1128751","display_name":"Contig","level":4,"score":0.7339286804199219},{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.6340608596801758},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5073477625846863},{"id":"https://openalex.org/C18949551","wikidata":"https://www.wikidata.org/wiki/Q740578","display_name":"Sequence assembly","level":5,"score":0.5051751732826233},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.5020394325256348},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.4584069550037384},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.2603442966938019},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.25571614503860474},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.10349833965301514},{"id":"https://openalex.org/C150194340","wikidata":"https://www.wikidata.org/wiki/Q26972","display_name":"Gene expression","level":3,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C162317418","wikidata":"https://www.wikidata.org/wiki/Q252857","display_name":"Transcriptome","level":4,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ipdpsw59300.2023.00037","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ipdpsw59300.2023.00037","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE International Parallel and Distributed Processing Symposium Workshops (IPDPSW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W2105656684","https://openalex.org/W2108435020","https://openalex.org/W2124985265","https://openalex.org/W2132069633","https://openalex.org/W2144560237","https://openalex.org/W2157539385","https://openalex.org/W2179507357","https://openalex.org/W2346680365","https://openalex.org/W2767590279","https://openalex.org/W2788228074","https://openalex.org/W2789843538","https://openalex.org/W2807773783","https://openalex.org/W2884798430","https://openalex.org/W2950150251","https://openalex.org/W2950354111","https://openalex.org/W2951822379","https://openalex.org/W2953147862","https://openalex.org/W2961460076","https://openalex.org/W2987650093","https://openalex.org/W3009972029","https://openalex.org/W3045408080","https://openalex.org/W3098495126","https://openalex.org/W3102863871","https://openalex.org/W3208925084","https://openalex.org/W4220982887","https://openalex.org/W4225624933","https://openalex.org/W4226289813","https://openalex.org/W4242729757","https://openalex.org/W6679663036","https://openalex.org/W6775062811"],"related_works":["https://openalex.org/W1506942559","https://openalex.org/W2051711022","https://openalex.org/W2900736737","https://openalex.org/W2952258368","https://openalex.org/W4211197914","https://openalex.org/W4320879640","https://openalex.org/W4385406776","https://openalex.org/W2068532136","https://openalex.org/W4319941024","https://openalex.org/W3155662303"],"abstract_inverted_index":{"Long":[0],"read":[1,36],"technologies":[2,18],"are":[3],"continuing":[4],"to":[5,44,75,114,158,161],"evolve":[6],"at":[7],"a":[8,42,84,104,121,127,149,168,191,204],"rapid":[9],"pace,":[10],"with":[11,23,177,193],"the":[12,15,46,69,130,156],"latest":[13],"of":[14,71,92,129],"high":[16,24,150],"fidelity":[17],"delivering":[19],"reads":[20,74,113,182],"over":[21,203],"10Kbp":[22],"accuracy":[25],"(99.9%).":[26],"However,":[27,88],"there":[28],"also":[29],"exist":[30],"partially":[31],"constructed":[32,79],"assemblies":[33,60],"using":[34],"short":[35],"data.":[37],"Hybrid":[38],"assembly":[39],"workflows":[40],"provide":[41],"way":[43],"combine":[45],"information":[47],"in":[48,99,147],"both":[49],"these":[50],"data":[51],"sources":[52],"and":[53,57,61,183,196],"generate":[54],"highly":[55,145],"improved":[56],"near":[58],"complete":[59],"genomic":[62],"scaffolds.":[63],"In":[64],"this":[65,100],"paper,":[66,101],"we":[67,102],"address":[68],"problem":[70],"mapping":[72,152,163,192],"long":[73,112,181],"contigs":[76],"(representing":[77],"prior":[78],"partial":[80],"assemblies).":[81],"This":[82],"is":[83,95,144],"many-to-many":[85],"comparison":[86],"application.":[87],"brute":[89],"force":[90],"comparisons":[91],"all":[93],"pairs":[94],"not":[96],"practical.":[97],"Therefore,":[98],"present":[103],"parallel,":[105],"alignment-free":[106],"sketching-based":[107],"algorithm":[108,143],"that":[109,140],"efficiently":[110],"maps":[111],"contigs.":[115],"More":[116],"specifically,":[117],"our":[118,141,187],"approach":[119,189],"uses":[120],"minimizer-based":[122],"Jaccard":[123],"estimator":[124],"(or":[125],"JEM),":[126],"variant":[128],"classical":[131],"MinHashing":[132],"technique,":[133],"as":[134],"its":[135],"sketch.":[136],"Experimental":[137],"evaluation":[138],"shows":[139],"parallel":[142],"effective":[146],"producing":[148],"quality":[151],"while":[153,199],"improving":[154],"significantly":[155],"time":[157],"solution":[159],"compared":[160],"state-of-the-art":[162,205],"tools.":[164],"For":[165],"instance,":[166],"for":[167],"large":[169],"genome":[170],"Betta":[171],"splendens":[172],"($\\approx$":[173],"350":[174],"Mbp":[175],"genome)":[176],"429":[178],"K":[179,185],"HiFi":[180],"98":[184],"contigs,":[186],"JEM":[188],"produces":[190],"99.31%":[194],"precision":[195],"96.18%":[197],"recall,":[198],"yielding":[200],"7.13$\\times$":[201],"speedup":[202],"mapper":[206],"(Mashmap).":[207]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1}],"updated_date":"2025-12-11T23:09:37.256380","created_date":"2025-10-10T00:00:00"}
