{"id":"https://openalex.org/W2005533448","doi":"https://doi.org/10.1145/2808719.2811429","title":"A new method for DNA sequencing error verification and correction via an on-disk index tree","display_name":"A new method for DNA sequencing error verification and correction via an on-disk index tree","publication_year":2015,"publication_date":"2015-09-09","ids":{"openalex":"https://openalex.org/W2005533448","doi":"https://doi.org/10.1145/2808719.2811429","mag":"2005533448"},"language":"en","primary_location":{"id":"doi:10.1145/2808719.2811429","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2808719.2811429","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 6th ACM Conference on Bioinformatics, Computational Biology and Health Informatics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034117321","display_name":"Yarong Gu","orcid":"https://orcid.org/0009-0002-8628-304X"},"institutions":[{"id":"https://openalex.org/I4210130704","display_name":"University of Michigan\u2013Dearborn","ror":"https://ror.org/035wtm547","country_code":"US","type":"education","lineage":["https://openalex.org/I4210130704"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yarong Gu","raw_affiliation_strings":["The University of Michigan, Dearborn"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The University of Michigan, Dearborn","institution_ids":["https://openalex.org/I4210130704"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101804184","display_name":"Xianying Liu","orcid":"https://orcid.org/0000-0002-5658-5875"},"institutions":[{"id":"https://openalex.org/I4210130704","display_name":"University of Michigan\u2013Dearborn","ror":"https://ror.org/035wtm547","country_code":"US","type":"education","lineage":["https://openalex.org/I4210130704"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xianying Liu","raw_affiliation_strings":["The University of Michigan, Dearborn"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The University of Michigan, Dearborn","institution_ids":["https://openalex.org/I4210130704"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103136845","display_name":"Qiang Zhu","orcid":"https://orcid.org/0000-0001-7094-9236"},"institutions":[{"id":"https://openalex.org/I4210130704","display_name":"University of Michigan\u2013Dearborn","ror":"https://ror.org/035wtm547","country_code":"US","type":"education","lineage":["https://openalex.org/I4210130704"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Qiang Zhu","raw_affiliation_strings":["The University of Michigan, Dearborn"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The University of Michigan, Dearborn","institution_ids":["https://openalex.org/I4210130704"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087648465","display_name":"Youchao Dong","orcid":null},"institutions":[{"id":"https://openalex.org/I4210130704","display_name":"University of Michigan\u2013Dearborn","ror":"https://ror.org/035wtm547","country_code":"US","type":"education","lineage":["https://openalex.org/I4210130704"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Youchao Dong","raw_affiliation_strings":["The University of Michigan, Dearborn"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The University of Michigan, Dearborn","institution_ids":["https://openalex.org/I4210130704"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036229691","display_name":"C. Titus Brown","orcid":"https://orcid.org/0000-0001-6001-2677"},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"C. Titus Brown","raw_affiliation_strings":["Michigan State University, East Lansing","Michigan State Univ., East Lansing#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Michigan State University, East Lansing","institution_ids":["https://openalex.org/I87216513"]},{"raw_affiliation_string":"Michigan State Univ., East Lansing#TAB#","institution_ids":["https://openalex.org/I87216513"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059755229","display_name":"Sakti Pramanik","orcid":null},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sakti Pramanik","raw_affiliation_strings":["Michigan State University, East Lansing","Michigan State Univ., East Lansing#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Michigan State University, East Lansing","institution_ids":["https://openalex.org/I87216513"]},{"raw_affiliation_string":"Michigan State Univ., East Lansing#TAB#","institution_ids":["https://openalex.org/I87216513"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5034117321"],"corresponding_institution_ids":["https://openalex.org/I4210130704"],"apc_list":null,"apc_paid":null,"fwci":1.3355,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.86024638,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"503","last_page":"504"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8109323382377625},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6454010605812073},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.5999356508255005},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5667918920516968},{"id":"https://openalex.org/keywords/bloom-filter","display_name":"Bloom filter","score":0.5580983757972717},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.4763912558555603},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.47425806522369385},{"id":"https://openalex.org/keywords/error-detection-and-correction","display_name":"Error detection and correction","score":0.4736917018890381},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.472817063331604},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.44137176871299744},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.42559170722961426},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.4192917048931122},{"id":"https://openalex.org/keywords/k-mer","display_name":"k-mer","score":0.41103214025497437},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3834259808063507},{"id":"https://openalex.org/keywords/dna-sequencing","display_name":"DNA sequencing","score":0.34008312225341797},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.12470629811286926},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10750672221183777},{"id":"https://openalex.org/keywords/dna","display_name":"DNA","score":0.083285391330719}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8109323382377625},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6454010605812073},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.5999356508255005},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5667918920516968},{"id":"https://openalex.org/C147224247","wikidata":"https://www.wikidata.org/wiki/Q885373","display_name":"Bloom filter","level":2,"score":0.5580983757972717},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.4763912558555603},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.47425806522369385},{"id":"https://openalex.org/C103088060","wikidata":"https://www.wikidata.org/wiki/Q1062839","display_name":"Error detection and correction","level":2,"score":0.4736917018890381},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.472817063331604},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.44137176871299744},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.42559170722961426},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4192917048931122},{"id":"https://openalex.org/C2279292","wikidata":"https://www.wikidata.org/wiki/Q6322851","display_name":"k-mer","level":4,"score":0.41103214025497437},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3834259808063507},{"id":"https://openalex.org/C51679486","wikidata":"https://www.wikidata.org/wiki/Q380546","display_name":"DNA sequencing","level":3,"score":0.34008312225341797},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.12470629811286926},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10750672221183777},{"id":"https://openalex.org/C552990157","wikidata":"https://www.wikidata.org/wiki/Q7430","display_name":"DNA","level":2,"score":0.083285391330719},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2808719.2811429","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2808719.2811429","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 6th ACM Conference on Bioinformatics, Computational Biology and Health Informatics","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":5,"referenced_works":["https://openalex.org/W2052039291","https://openalex.org/W2096128575","https://openalex.org/W2123837096","https://openalex.org/W2133956160","https://openalex.org/W2135631159"],"related_works":["https://openalex.org/W2086572746","https://openalex.org/W2604468458","https://openalex.org/W2563930566","https://openalex.org/W4226101760","https://openalex.org/W2417068752","https://openalex.org/W3132474731","https://openalex.org/W2097066660","https://openalex.org/W4297832806","https://openalex.org/W2092772380","https://openalex.org/W1989871058"],"abstract_inverted_index":{"Existing":[0],"sequencing":[1,18,105],"error":[2,19],"correction":[3,20],"techniques":[4],"demand":[5],"large":[6,45],"expensive":[7],"memory":[8],"space.":[9],"In":[10],"this":[11],"work,":[12],"we":[13],"introduce":[14],"a":[15,32,44,58,89],"new":[16],"disk-based":[17],"method":[21,97],"to":[22,30,40,64,81],"solve":[23],"the":[24,38,56,66,95],"problem.":[25],"The":[26],"key":[27],"idea":[28],"is":[29,79,98],"utilize":[31],"special":[33,61],"on-disk":[34],"index":[35],"structure,":[36],"called":[37],"BoND-tree,":[39,57],"store":[41],"and":[42,49,69,83,103,111],"access":[43],"set":[46,59],"of":[47,60,109],"k-mers":[48,68],"their":[50,70],"associated":[51],"metadata":[52],"on":[53],"disk.":[54],"With":[55],"box":[62],"queries":[63],"retrieve":[65],"relevant":[67],"counts":[71],"are":[72],"efficiently":[73],"processed.":[74],"A":[75],"comprehensive":[76],"voting":[77],"mechanism":[78],"adopted":[80],"determine":[82],"correct":[84],"an":[85],"erroneous":[86],"base":[87],"in":[88,101,107],"genome":[90],"sequence.":[91],"Experiments":[92],"demonstrate":[93],"that":[94],"proposed":[96],"quite":[99],"promising":[100],"verifying":[102],"correcting":[104],"errors":[106],"terms":[108],"accuracy":[110],"scalability.":[112]},"counts_by_year":[{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2016,"cited_by_count":2}],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-10T00:00:00"}
