{"id":"https://openalex.org/W2135434593","doi":"https://doi.org/10.1109/cit.2008.4594729","title":"A compressing method for genome sequence cluster using sequence alignment","display_name":"A compressing method for genome sequence cluster using sequence alignment","publication_year":2008,"publication_date":"2008-07-01","ids":{"openalex":"https://openalex.org/W2135434593","doi":"https://doi.org/10.1109/cit.2008.4594729","mag":"2135434593"},"language":"en","primary_location":{"id":"doi:10.1109/cit.2008.4594729","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cit.2008.4594729","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 8th IEEE International Conference on Computer and Information Technology","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111626464","display_name":"Kwang Su Jung","orcid":null},"institutions":[{"id":"https://openalex.org/I163753206","display_name":"Chungbuk National University","ror":"https://ror.org/02wnxgj78","country_code":"KR","type":"education","lineage":["https://openalex.org/I163753206"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Kwang Su Jung","raw_affiliation_strings":["Database Bioinformatics Laboratory, Chungbuk National University, South Korea","Database/Bioinf. Lab., Chungbuk Nat. Univ., Cheongju"],"affiliations":[{"raw_affiliation_string":"Database Bioinformatics Laboratory, Chungbuk National University, South Korea","institution_ids":["https://openalex.org/I163753206"]},{"raw_affiliation_string":"Database/Bioinf. Lab., Chungbuk Nat. Univ., Cheongju","institution_ids":["https://openalex.org/I163753206"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008124846","display_name":"Nam Hee Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I163753206","display_name":"Chungbuk National University","ror":"https://ror.org/02wnxgj78","country_code":"KR","type":"education","lineage":["https://openalex.org/I163753206"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Nam Hee Yu","raw_affiliation_strings":["Database Bioinformatics Laboratory, Chungbuk National University, South Korea","Database/Bioinf. Lab., Chungbuk Nat. Univ., Cheongju"],"affiliations":[{"raw_affiliation_string":"Database Bioinformatics Laboratory, Chungbuk National University, South Korea","institution_ids":["https://openalex.org/I163753206"]},{"raw_affiliation_string":"Database/Bioinf. Lab., Chungbuk Nat. Univ., Cheongju","institution_ids":["https://openalex.org/I163753206"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113804807","display_name":"Seung Jung Shin","orcid":null},"institutions":[{"id":"https://openalex.org/I177023625","display_name":"Hansei University","ror":"https://ror.org/01bxsr356","country_code":"KR","type":"education","lineage":["https://openalex.org/I177023625"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seung Jung Shin","raw_affiliation_strings":["Divison of IT, Hansei Univiersity, South Korea","Divison of IT, Hansei Univiersity, Korea"],"affiliations":[{"raw_affiliation_string":"Divison of IT, Hansei Univiersity, South Korea","institution_ids":["https://openalex.org/I177023625"]},{"raw_affiliation_string":"Divison of IT, Hansei Univiersity, Korea","institution_ids":["https://openalex.org/I177023625"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5043932631","display_name":"Keun Ho Ryu","orcid":"https://orcid.org/0000-0003-0394-9054"},"institutions":[{"id":"https://openalex.org/I163753206","display_name":"Chungbuk National University","ror":"https://ror.org/02wnxgj78","country_code":"KR","type":"education","lineage":["https://openalex.org/I163753206"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Keun Ho Ryu","raw_affiliation_strings":["Database Bioinformatics Laboratory, Chungbuk National University, South Korea","Database/BioInformatics Laboratory, Chungbuk National University, Korea"],"affiliations":[{"raw_affiliation_string":"Database Bioinformatics Laboratory, Chungbuk National University, South Korea","institution_ids":["https://openalex.org/I163753206"]},{"raw_affiliation_string":"Database/BioInformatics Laboratory, Chungbuk National University, Korea","institution_ids":["https://openalex.org/I163753206"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5111626464"],"corresponding_institution_ids":["https://openalex.org/I163753206"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.13115892,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"5","issue":null,"first_page":"520","last_page":"525"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/alignment-free-sequence-analysis","display_name":"Alignment-free sequence analysis","score":0.798147439956665},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.7265586256980896},{"id":"https://openalex.org/keywords/sequence-logo","display_name":"Sequence logo","score":0.7254245281219482},{"id":"https://openalex.org/keywords/sequence-alignment","display_name":"Sequence alignment","score":0.5969495177268982},{"id":"https://openalex.org/keywords/scripting-language","display_name":"Scripting language","score":0.5610079169273376},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.5098533034324646},{"id":"https://openalex.org/keywords/multiple-sequence-alignment","display_name":"Multiple sequence alignment","score":0.5089731216430664},{"id":"https://openalex.org/keywords/cluster","display_name":"Cluster (spacecraft)","score":0.5045541524887085},{"id":"https://openalex.org/keywords/nucleic-acid-sequence","display_name":"Nucleic acid sequence","score":0.4687146246433258},{"id":"https://openalex.org/keywords/structural-alignment","display_name":"Structural alignment","score":0.4586787819862366},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.45319047570228577},{"id":"https://openalex.org/keywords/sequence-analysis","display_name":"Sequence analysis","score":0.44606393575668335},{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.4450395703315735},{"id":"https://openalex.org/keywords/edit-distance","display_name":"Edit distance","score":0.44497784972190857},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.4196586608886719},{"id":"https://openalex.org/keywords/homology","display_name":"Homology (biology)","score":0.4167305827140808},{"id":"https://openalex.org/keywords/dna-sequencing","display_name":"DNA sequencing","score":0.4164399206638336},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.41413113474845886},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.32604026794433594},{"id":"https://openalex.org/keywords/dna","display_name":"DNA","score":0.31591856479644775},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2071102261543274},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.11199095845222473}],"concepts":[{"id":"https://openalex.org/C180384323","wikidata":"https://www.wikidata.org/wiki/Q16335137","display_name":"Alignment-free sequence analysis","level":5,"score":0.798147439956665},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.7265586256980896},{"id":"https://openalex.org/C105082737","wikidata":"https://www.wikidata.org/wiki/Q7452470","display_name":"Sequence logo","level":5,"score":0.7254245281219482},{"id":"https://openalex.org/C45484198","wikidata":"https://www.wikidata.org/wiki/Q827246","display_name":"Sequence alignment","level":4,"score":0.5969495177268982},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.5610079169273376},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5098533034324646},{"id":"https://openalex.org/C88031987","wikidata":"https://www.wikidata.org/wiki/Q1377767","display_name":"Multiple sequence alignment","level":5,"score":0.5089731216430664},{"id":"https://openalex.org/C164866538","wikidata":"https://www.wikidata.org/wiki/Q367351","display_name":"Cluster (spacecraft)","level":2,"score":0.5045541524887085},{"id":"https://openalex.org/C84148353","wikidata":"https://www.wikidata.org/wiki/Q863908","display_name":"Nucleic acid sequence","level":3,"score":0.4687146246433258},{"id":"https://openalex.org/C4668613","wikidata":"https://www.wikidata.org/wiki/Q4116110","display_name":"Structural alignment","level":5,"score":0.4586787819862366},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.45319047570228577},{"id":"https://openalex.org/C61053724","wikidata":"https://www.wikidata.org/wiki/Q1154615","display_name":"Sequence analysis","level":3,"score":0.44606393575668335},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.4450395703315735},{"id":"https://openalex.org/C44359876","wikidata":"https://www.wikidata.org/wiki/Q5338467","display_name":"Edit distance","level":2,"score":0.44497784972190857},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.4196586608886719},{"id":"https://openalex.org/C165525559","wikidata":"https://www.wikidata.org/wiki/Q224180","display_name":"Homology (biology)","level":3,"score":0.4167305827140808},{"id":"https://openalex.org/C51679486","wikidata":"https://www.wikidata.org/wiki/Q380546","display_name":"DNA sequencing","level":3,"score":0.4164399206638336},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.41413113474845886},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.32604026794433594},{"id":"https://openalex.org/C552990157","wikidata":"https://www.wikidata.org/wiki/Q7430","display_name":"DNA","level":2,"score":0.31591856479644775},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2071102261543274},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.11199095845222473},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/cit.2008.4594729","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cit.2008.4594729","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2008 8th IEEE International Conference on Computer and Information Technology","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.665.935","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.665.935","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://cial.csie.ncku.edu.tw/presentation/group_pdf/A+Compressing+Method+for+Genome+Sequence+Cluster+using+Sequence.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W21816278","https://openalex.org/W1527979595","https://openalex.org/W1534606537","https://openalex.org/W1975001431","https://openalex.org/W1981014117","https://openalex.org/W1994414218","https://openalex.org/W2015292449","https://openalex.org/W2029195137","https://openalex.org/W2031716828","https://openalex.org/W2033339460","https://openalex.org/W2045954434","https://openalex.org/W2054600139","https://openalex.org/W2055043387","https://openalex.org/W2056619794","https://openalex.org/W2062112417","https://openalex.org/W2074231493","https://openalex.org/W2087064593","https://openalex.org/W2143210482","https://openalex.org/W2149208773","https://openalex.org/W2158714788","https://openalex.org/W4236236547"],"related_works":["https://openalex.org/W2051969447","https://openalex.org/W2029514038","https://openalex.org/W997010268","https://openalex.org/W2141862901","https://openalex.org/W2088487249","https://openalex.org/W566472934","https://openalex.org/W1998139877","https://openalex.org/W3201601936","https://openalex.org/W1484713061","https://openalex.org/W3128610423"],"abstract_inverted_index":{"After":[0],"identifying":[1],"the":[2,17,70,116,150],"function":[3],"of":[4,16,39,45,79,121,136,160,168],"a":[5,30,34,46,51,60,66,80,91,100,106,111,130,164],"protein,":[6],"biologists":[7],"produce":[8],"new":[9,21,92],"useful":[10],"proteins":[11,22],"by":[12,118,128],"substituting":[13],"some":[14],"residues":[15],"identified":[18],"protein.":[19],"These":[20],"have":[23],"high":[24],"sequence":[25,31,62,97,101,108,113,131,138],"homology":[26],"(similarity).":[27],"We":[28,89,104,153],"define":[29],"cluster":[32,35,117,162,170],"as":[33],"that":[36],"is":[37,59,140],"constituted":[38],"similar":[40],"sequences.":[41,123,152],"As":[42],"another":[43],"example":[44],"Sequence":[47],"Cluster,":[48],"we":[49],"consider":[50],"SNP":[52,58],"(Single":[53],"Nucleotide":[54],"Polymorphism)":[55],"Cluster.":[56],"A":[57],"DNA":[61],"variation":[63],"occurring":[64],"when":[65],"single":[67],"nucleotide":[68],"in":[69,86,115],"genome":[71],"(or":[72,82],"other":[73],"shared":[74],"sequence)":[75],"differs":[76],"between":[77,83,149],"members":[78],"species":[81],"paired":[84],"chromosomes":[85],"an":[87,147],"individual).":[88],"suggest":[90],"compressing":[93],"technique":[94],"for":[95],"these":[96],"clusters":[98],"using":[99,176],"alignment":[102,132,139],"method.":[103],"select":[105],"representative":[107,156,177],"which":[109],"has":[110],"minimum":[112],"distance":[114],"scanning":[119],"distances":[120,125],"all":[122],"The":[124,134],"are":[126],"obtained":[127],"calculating":[129],"score.":[133],"result":[135],"this":[137],"utilized":[141],"to":[142],"author":[143],"conversion":[144],"information":[145],"called":[146],"Edit-Script":[148],"two":[151],"only":[154],"stored":[155],"sequences":[157,167,178],"and":[158,179],"Edit-Scripts":[159],"each":[161,169],"into":[163],"database.":[165],"Member":[166],"can":[171],"then":[172],"be":[173],"easily":[174],"created":[175],"Edit-Scripts.":[180]},"counts_by_year":[],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
