{"id":"https://openalex.org/W4313452862","doi":"https://doi.org/10.1109/bibm55620.2022.9995126","title":"An interleaved hardware-accelerated k-mer parser","display_name":"An interleaved hardware-accelerated k-mer parser","publication_year":2022,"publication_date":"2022-12-06","ids":{"openalex":"https://openalex.org/W4313452862","doi":"https://doi.org/10.1109/bibm55620.2022.9995126"},"language":"en","primary_location":{"id":"doi:10.1109/bibm55620.2022.9995126","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/bibm55620.2022.9995126","pdf_url":null,"source":{"id":"https://openalex.org/S4363607730","display_name":"2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017152835","display_name":"Franco Milicchio","orcid":"https://orcid.org/0000-0002-4875-4894"},"institutions":[{"id":"https://openalex.org/I119003972","display_name":"Roma Tre University","ror":"https://ror.org/05vf0dg29","country_code":"IT","type":"education","lineage":["https://openalex.org/I119003972"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Franco Milicchio","raw_affiliation_strings":["Roma Tre University,Department of Engineering,Rome,Italy","Department of Engineering, Roma Tre University, Rome, Italy"],"affiliations":[{"raw_affiliation_string":"Roma Tre University,Department of Engineering,Rome,Italy","institution_ids":["https://openalex.org/I119003972"]},{"raw_affiliation_string":"Department of Engineering, Roma Tre University, Rome, Italy","institution_ids":["https://openalex.org/I119003972"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020831803","display_name":"Marco Ant\u00f4nio Oliva","orcid":"https://orcid.org/0000-0003-0525-3114"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Marco Oliva","raw_affiliation_strings":["University of Florida,Department of Computer and Information Science and Engineering,Gainesville,FL,USA","Department of Computer and Information Science and Engineering, University of Florida, Gainesville, FL, USA"],"affiliations":[{"raw_affiliation_string":"University of Florida,Department of Computer and Information Science and Engineering,Gainesville,FL,USA","institution_ids":["https://openalex.org/I33213144"]},{"raw_affiliation_string":"Department of Computer and Information Science and Engineering, University of Florida, Gainesville, FL, USA","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039419132","display_name":"Mattia Prosperi","orcid":"https://orcid.org/0000-0002-9021-5595"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mattia Prosperi","raw_affiliation_strings":["University of Florida,Department of Epidemiology,Gainesville,FL,USA","Department of Epidemiology, University of Florida, Gainesville, FL, USA"],"affiliations":[{"raw_affiliation_string":"University of Florida,Department of Epidemiology,Gainesville,FL,USA","institution_ids":["https://openalex.org/I33213144"]},{"raw_affiliation_string":"Department of Epidemiology, University of Florida, Gainesville, FL, USA","institution_ids":["https://openalex.org/I33213144"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5017152835"],"corresponding_institution_ids":["https://openalex.org/I119003972"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.42167722,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2929","last_page":"2933"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11970","display_name":"Molecular Biology Techniques and Applications","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8507565855979919},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.6667566299438477},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6227524280548096},{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.6025123000144958},{"id":"https://openalex.org/keywords/hardware-acceleration","display_name":"Hardware acceleration","score":0.462202787399292},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.41507595777511597},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.35628634691238403},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.30507588386535645},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.29915279150009155},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.1395370364189148}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8507565855979919},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.6667566299438477},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6227524280548096},{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.6025123000144958},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.462202787399292},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.41507595777511597},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.35628634691238403},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.30507588386535645},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.29915279150009155},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.1395370364189148}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bibm55620.2022.9995126","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/bibm55620.2022.9995126","pdf_url":null,"source":{"id":"https://openalex.org/S4363607730","display_name":"2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2037748100","https://openalex.org/W2057253402","https://openalex.org/W2070102345","https://openalex.org/W2121716038","https://openalex.org/W2260037449","https://openalex.org/W2330100020","https://openalex.org/W2575250966","https://openalex.org/W2583363792","https://openalex.org/W2753396470","https://openalex.org/W2799394118","https://openalex.org/W2805016149","https://openalex.org/W2897927784","https://openalex.org/W2902483623","https://openalex.org/W2952597168","https://openalex.org/W2981619930","https://openalex.org/W3015565387","https://openalex.org/W4205838375","https://openalex.org/W6756628031"],"related_works":["https://openalex.org/W2534771569","https://openalex.org/W2037547261","https://openalex.org/W4311812695","https://openalex.org/W2117788426","https://openalex.org/W4242015792","https://openalex.org/W3011583392","https://openalex.org/W2291920536","https://openalex.org/W4379115909","https://openalex.org/W3152699334","https://openalex.org/W2785001802"],"abstract_inverted_index":{"Advances":[0],"in":[1,65,78,175],"next-generation":[2],"sequencing":[3,66,160],"(NGS)":[4],"have":[5],"not":[6],"only":[7],"increased":[8],"the":[9,62,215],"overall":[10],"throughput":[11],"of":[12,47,156],"genomic":[13],"content":[14],"(e.g.":[15,27,195],"Illumina":[16],"NovaSeq":[17],"up":[18],"to":[19,44,59,61],"6,":[20],"000GB),":[21],"but":[22],"also":[23],"provided":[24],"technology":[25],"miniaturization":[26],"Oxford":[28],"Nanopore":[29],"MinION)":[30],"enabling":[31],"real-time,":[32],"mobile":[33],"experiments.":[34],"Single":[35],"Instruction/Multiple":[36],"Data":[37],"(SIMD)":[38],"hardware":[39,86],"acceleration":[40],"is":[41],"increasingly":[42],"used":[43],"improve":[45],"performance":[46],"NGS":[48,104],"data":[49],"processing":[50],"tools,":[51],"while":[52],"generic":[53,92,187],"template":[54],"programming":[55,93],"libraries":[56],"are":[57,212],"advantageous":[58],"adapt":[60],"fast":[63],"changes":[64],"and":[67,116,137,144,163,170,178,209,218],"computing":[68],"platforms.":[69],"We":[70,97],"here":[71],"present":[72],"a":[73,91],"novel":[74],"k-mer":[75,100,112,179,207],"parser":[76,101,151,208],"written":[77],"ISO":[79],"C++":[80],"that":[81,191],"exploits":[82],"an":[83,119],"interleaved,":[84],"non-sequential,":[85],"accelerated":[87],"SIMD":[88,204],"implementation":[89],"within":[90],"framework":[94],"called":[95],"libseq.":[96],"benchmarked":[98],"our":[99,150,184],"using":[102,132],"different":[103],"experimental":[105],"datasets":[106],"comparing":[107],"with":[108,122],"other":[109,189],"two":[110],"popular":[111],"counting":[113],"tools":[114],"(DSK":[115],"KMC3).":[117],"On":[118,158],"Intel":[120,125],"machine":[121],"AVX2":[123],"(Quad-Core":[124],"Core":[126],"i5":[127],"CPU,":[128],"32":[129],"GB":[130],"RAM),":[131],"simulated":[133],"in-memory":[134],"reads,":[135],"DSK":[136,162],"KMC3":[138,164],"were":[139,165],"on":[140,166,193],"average":[141,167],"3.":[142],"6x":[143],"1.":[145],"03x":[146],"times":[147,173],"slower":[148,174],"than":[149,181],"across":[152],"k":[153],"value":[154],"ranges":[155],"35-63.":[157],"real":[159],"experiments,":[161],"8.":[168],"3x":[169],"28.":[171],"8x":[172],"file/read":[176],"parsing":[177],"building":[180],"ours.":[182],"Since":[183],"tool":[185],"uses":[186],"programming,":[188],"methods":[190],"rely":[192],"k-mers":[194],"de":[196],"Bruijn":[197],"graphs)":[198],"can":[199],"directly":[200],"benefit":[201],"from":[202],"its":[203],"acceleration.":[205],"Our":[206],"libseq":[210],"2.0":[211],"released":[213],"under":[214],"BSD":[216],"license":[217],"available":[219],"at":[220],"https://zenodo.org/record/7015294.":[221]},"counts_by_year":[],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-10-10T00:00:00"}
