{"id":"https://openalex.org/W4205472782","doi":"https://doi.org/10.1109/access.2021.3121749","title":"Fast Hybrid Data Structure for a Large Alphabet K-Mers Indexing for Whole Genome Alignment","display_name":"Fast Hybrid Data Structure for a Large Alphabet K-Mers Indexing for Whole Genome Alignment","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W4205472782","doi":"https://doi.org/10.1109/access.2021.3121749"},"language":"en","primary_location":{"id":"doi:10.1109/access.2021.3121749","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3121749","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/9312710/09583298.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/9312710/09583298.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068155919","display_name":"Rostislav H\u0159iv\u0148\u00e1k","orcid":"https://orcid.org/0000-0002-5229-3891"},"institutions":[{"id":"https://openalex.org/I142208455","display_name":"VSB - Technical University of Ostrava","ror":"https://ror.org/05x8mcb75","country_code":"CZ","type":"education","lineage":["https://openalex.org/I142208455"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Rostislav Hrivnak","raw_affiliation_strings":["V\u0160B\u2014Technical University of Ostrava, Ostrava, Czech Republic"],"raw_orcid":"https://orcid.org/0000-0002-5229-3891","affiliations":[{"raw_affiliation_string":"V\u0160B\u2014Technical University of Ostrava, Ostrava, Czech Republic","institution_ids":["https://openalex.org/I142208455"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056523918","display_name":"Petr Gajdo\u0161","orcid":"https://orcid.org/0000-0003-1831-3489"},"institutions":[{"id":"https://openalex.org/I142208455","display_name":"VSB - Technical University of Ostrava","ror":"https://ror.org/05x8mcb75","country_code":"CZ","type":"education","lineage":["https://openalex.org/I142208455"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Petr Gajdos","raw_affiliation_strings":["V\u0160B\u2014Technical University of Ostrava, Ostrava, Czech Republic"],"raw_orcid":"https://orcid.org/0000-0003-1831-3489","affiliations":[{"raw_affiliation_string":"V\u0160B\u2014Technical University of Ostrava, Ostrava, Czech Republic","institution_ids":["https://openalex.org/I142208455"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5011543714","display_name":"V\u00e1clav Sn\u00e5\u0161el","orcid":"https://orcid.org/0000-0002-9600-8319"},"institutions":[{"id":"https://openalex.org/I142208455","display_name":"VSB - Technical University of Ostrava","ror":"https://ror.org/05x8mcb75","country_code":"CZ","type":"education","lineage":["https://openalex.org/I142208455"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Vaclav Snasel","raw_affiliation_strings":["V\u0160B\u2014Technical University of Ostrava, Ostrava, Czech Republic"],"raw_orcid":"https://orcid.org/0000-0002-9600-8319","affiliations":[{"raw_affiliation_string":"V\u0160B\u2014Technical University of Ostrava, Ostrava, Czech Republic","institution_ids":["https://openalex.org/I142208455"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.20153539,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"9","issue":null,"first_page":"161890","last_page":"161897"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12029","display_name":"DNA and Biological Computing","score":0.9671000242233276,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/notation","display_name":"Notation","score":0.7575554847717285},{"id":"https://openalex.org/keywords/suffix","display_name":"Suffix","score":0.7119580507278442},{"id":"https://openalex.org/keywords/compressed-suffix-array","display_name":"Compressed suffix array","score":0.5057518482208252},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.4940777122974396},{"id":"https://openalex.org/keywords/alphabet","display_name":"Alphabet","score":0.48566973209381104},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.45563358068466187},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3888428509235382},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3719345033168793},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.3558374345302582},{"id":"https://openalex.org/keywords/discrete-mathematics","display_name":"Discrete mathematics","score":0.3238510489463806},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.30475592613220215},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.29448240995407104},{"id":"https://openalex.org/keywords/suffix-tree","display_name":"Suffix tree","score":0.28634053468704224},{"id":"https://openalex.org/keywords/arithmetic","display_name":"Arithmetic","score":0.1451338231563568},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.12361767888069153}],"concepts":[{"id":"https://openalex.org/C45357846","wikidata":"https://www.wikidata.org/wiki/Q2001982","display_name":"Notation","level":2,"score":0.7575554847717285},{"id":"https://openalex.org/C2779804580","wikidata":"https://www.wikidata.org/wiki/Q102047","display_name":"Suffix","level":2,"score":0.7119580507278442},{"id":"https://openalex.org/C100903775","wikidata":"https://www.wikidata.org/wiki/Q5157028","display_name":"Compressed suffix array","level":4,"score":0.5057518482208252},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.4940777122974396},{"id":"https://openalex.org/C112876837","wikidata":"https://www.wikidata.org/wiki/Q837518","display_name":"Alphabet","level":2,"score":0.48566973209381104},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.45563358068466187},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3888428509235382},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3719345033168793},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.3558374345302582},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.3238510489463806},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.30475592613220215},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.29448240995407104},{"id":"https://openalex.org/C2781166958","wikidata":"https://www.wikidata.org/wiki/Q1426863","display_name":"Suffix tree","level":3,"score":0.28634053468704224},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.1451338231563568},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.12361767888069153},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/access.2021.3121749","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3121749","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/9312710/09583298.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:f609ac6e77f14e19beb8d21553e23efb","is_oa":true,"landing_page_url":"https://doaj.org/article/f609ac6e77f14e19beb8d21553e23efb","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 9, Pp 161890-161897 (2021)","raw_type":"article"},{"id":"pmh:oai:dspace.vsb.cz:10084/146001","is_oa":true,"landing_page_url":"http://hdl.handle.net/10084/146001","pdf_url":null,"source":{"id":"https://openalex.org/S4306401668","display_name":"DSpace V\u0160B-TUO (V\u0160B-TUO)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I142208455","host_organization_name":"VSB - Technical University of Ostrava","host_organization_lineage":["https://openalex.org/I142208455"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2021.3121749","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3121749","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/9312710/09583298.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4125322560","display_name":null,"funder_award_id":"NU20-06-00269","funder_id":"https://openalex.org/F4320321798","funder_display_name":"Ministerstvo Zdravotnictv\u00ed Cesk\u00e9 Republiky"},{"id":"https://openalex.org/G4533279616","display_name":null,"funder_award_id":"CZ-102","funder_id":"https://openalex.org/F4320309086","funder_display_name":"Celgene"},{"id":"https://openalex.org/G851577961","display_name":null,"funder_award_id":"SP2021/94","funder_id":"https://openalex.org/F4320323872","funder_display_name":"Vysok\u00e1 \u0160kola B\u00e1nsk\u00e1 - Technick\u00e1 Univerzita Ostrava"}],"funders":[{"id":"https://openalex.org/F4320309086","display_name":"Celgene","ror":"https://ror.org/0527yg379"},{"id":"https://openalex.org/F4320321798","display_name":"Ministerstvo Zdravotnictv\u00ed Cesk\u00e9 Republiky","ror":"https://ror.org/00y6khe77"},{"id":"https://openalex.org/F4320323872","display_name":"Vysok\u00e1 \u0160kola B\u00e1nsk\u00e1 - Technick\u00e1 Univerzita Ostrava","ror":"https://ror.org/05x8mcb75"},{"id":"https://openalex.org/F4320324050","display_name":"Ostravsk\u00e1 Univerzita v Ostrav\u011b","ror":"https://ror.org/00pyqav47"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4205472782.pdf","grobid_xml":"https://content.openalex.org/works/W4205472782.grobid-xml"},"referenced_works_count":34,"referenced_works":["https://openalex.org/W1517052908","https://openalex.org/W1909344111","https://openalex.org/W2000484009","https://openalex.org/W2059513841","https://openalex.org/W2102278945","https://openalex.org/W2103441770","https://openalex.org/W2104677379","https://openalex.org/W2141262285","https://openalex.org/W2142619120","https://openalex.org/W2142678478","https://openalex.org/W2152331922","https://openalex.org/W2158714788","https://openalex.org/W2158874082","https://openalex.org/W2161488606","https://openalex.org/W2169456326","https://openalex.org/W2170551349","https://openalex.org/W2344026279","https://openalex.org/W2418511861","https://openalex.org/W2533248932","https://openalex.org/W2592783371","https://openalex.org/W2784788330","https://openalex.org/W2794300029","https://openalex.org/W2899025479","https://openalex.org/W2963963068","https://openalex.org/W2964849163","https://openalex.org/W3017152484","https://openalex.org/W3037350306","https://openalex.org/W3037460463","https://openalex.org/W3214513246","https://openalex.org/W6639872743","https://openalex.org/W6650339521","https://openalex.org/W6683504902","https://openalex.org/W6780102401","https://openalex.org/W7008732128"],"related_works":["https://openalex.org/W2359436045","https://openalex.org/W1596809600","https://openalex.org/W2576782855","https://openalex.org/W96331545","https://openalex.org/W2073921136","https://openalex.org/W203848531","https://openalex.org/W2405892617","https://openalex.org/W4293529780","https://openalex.org/W363060408","https://openalex.org/W2143531254"],"abstract_inverted_index":{"The":[0,102,252],"most":[1],"common":[2],"index":[3,153,211,239],"data":[4,23,154,194],"structures":[5,24],"used":[6,140],"by":[7],"whole":[8,75],"genome":[9,76],"aligners":[10],"(WGA)":[11],"are":[12,80,94],"based":[13,156],"on":[14,90,133,157,174,258],"suffix":[15,18],"trees":[16],"(ST),":[17],"arrays,":[19],"and":[20,163],"FM-indexes.":[21],"These":[22],"show":[25],"good":[26],"performance":[27,132,213,223,241],"results":[28],"as":[29,96],"WGA":[30],"works":[31],"with":[32,84,172],"sequences":[33],"of":[34,99,104,148,206,224],"letters":[35,42],"over":[36,203],"small":[37],"alphabets;":[38],"for":[39,70,200],"example,":[40],"four":[41],"<inline-formula":[43,50,57,64,106],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[44,51,58,65,107,260],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">":[45,52,59,66,108],"<tex-math":[46,53,60,67,109],"notation=\"LaTeX\">$a$":[47],"</tex-math></inline-formula>":[48,55,62,69,112],",":[49,56,63],"notation=\"LaTeX\">$c$":[54],"notation=\"LaTeX\">$t$":[61],"notation=\"LaTeX\">$g$":[68],"DNA":[71,91],"alignment.":[72],"A":[73],"novel":[74],"aligner,":[77],"which":[78,93,166],"we":[79],"developing,":[81],"will":[82],"work":[83],"distances":[85],"between":[86],"the":[87,138,146,179,221,225,229,250,263],"label":[88],"sites":[89],"samples,":[92],"represented":[95],"a":[97,125,149,158],"sequence":[98],"positive":[100],"integers.":[101],"size":[103],"alphabet":[105,205,230],"notation=\"LaTeX\">$\\sigma":[110],"$":[111],"is":[113,124,255],"theoretically":[114],"unlimited.":[115],"This":[116,143],"has":[117],"prompted":[118],"us":[119],"to":[120,137,178,216,233,245],"investigate":[121],"if":[122],"there":[123],"better":[126,169,219,248],"structure":[127,155],"that":[128],"would":[129],"improve":[130],"search":[131,160,212,222,240],"large":[134,175],"alphabets":[135,176],"compared":[136,177],"commonly":[139],"suffix-based":[141],"structures.":[142],"paper":[144],"presents":[145],"implementation":[147],"highly":[150],"optimized":[151],"hybrid":[152],"ternary":[159],"tree":[161],"(TST)":[162],"hash":[164],"tables,":[165],"perform":[167],"much":[168],"when":[170],"working":[171],"strings":[173],"ST.":[180,227,251],"Single":[181],"core":[182],"parallelism":[183],"was":[184,214,231,242],"achieved":[185],"using":[186],"advanced":[187],"vector":[188],"extensions":[189],"(AVX)":[190],"single":[191],"instruction":[192,196],"multiple":[193],"(SIMD)":[195],"set.":[197],"When":[198,228],"searching":[199],"short":[201],"k-mers":[202],"an":[204],"25,":[207],"695":[208],"letters,":[209,237],"our":[210,238],"up":[215,244],"29":[217],"times":[218,247],"than":[220,249],"reference":[226],"compressed":[232],"approximately":[234],"1,":[235],"300":[236],"still":[243],"2.6":[246],"source":[253],"code":[254],"available":[256],"free":[257],"<uri":[259],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">http://olgen.cz/Resources/Upload/Home/public/software/hds.zip</uri>":[261],"under":[262],"MIT":[264],"license.":[265]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
