{"id":"https://openalex.org/W2098188217","doi":"https://doi.org/10.1186/1748-7188-6-2","title":"WordCluster: detecting clusters of DNA words and genomic elements","display_name":"WordCluster: detecting clusters of DNA words and genomic elements","publication_year":2011,"publication_date":"2011-01-24","ids":{"openalex":"https://openalex.org/W2098188217","doi":"https://doi.org/10.1186/1748-7188-6-2","mag":"2098188217","pmid":"https://pubmed.ncbi.nlm.nih.gov/21261981"},"language":"en","primary_location":{"id":"doi:10.1186/1748-7188-6-2","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1748-7188-6-2","pdf_url":"https://almob.biomedcentral.com/counter/pdf/10.1186/1748-7188-6-2","source":{"id":"https://openalex.org/S205663195","display_name":"Algorithms for Molecular Biology","issn_l":"1748-7188","issn":["1748-7188"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms for Molecular Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://almob.biomedcentral.com/counter/pdf/10.1186/1748-7188-6-2","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084745527","display_name":"Michael Hackenberg","orcid":"https://orcid.org/0000-0003-2248-3114"},"institutions":[{"id":"https://openalex.org/I173304897","display_name":"Universidad de Granada","ror":"https://ror.org/04njjy449","country_code":"ES","type":"education","lineage":["https://openalex.org/I173304897"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Michael Hackenberg","raw_affiliation_strings":["Dpto, de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Campus de Fuentenueva s/n, 18071-Granada & Lab, de Bioinform\u00e1tica, Centro de Investigaci\u00f3n Biom\u00e9dica, PTS, Avda, del Conocimiento s/n, 18100-Granada, Spain. mlhack@gmail.com","Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Granada, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dpto, de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Campus de Fuentenueva s/n, 18071-Granada & Lab, de Bioinform\u00e1tica, Centro de Investigaci\u00f3n Biom\u00e9dica, PTS, Avda, del Conocimiento s/n, 18100-Granada, Spain. mlhack@gmail.com","institution_ids":["https://openalex.org/I173304897"]},{"raw_affiliation_string":"Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Granada, Spain","institution_ids":["https://openalex.org/I173304897"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074555181","display_name":"Pedro Carpena","orcid":"https://orcid.org/0000-0001-5568-0216"},"institutions":[{"id":"https://openalex.org/I136199984","display_name":"Harvard University","ror":"https://ror.org/03vek6s52","country_code":"US","type":"education","lineage":["https://openalex.org/I136199984"]},{"id":"https://openalex.org/I4210148319","display_name":"Woman's Hospital","ror":"https://ror.org/05f9h3891","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210148319"]},{"id":"https://openalex.org/I82767444","display_name":"Universidad de M\u00e1laga","ror":"https://ror.org/036b2ww28","country_code":"ES","type":"education","lineage":["https://openalex.org/I82767444"]}],"countries":["ES","US"],"is_corresponding":false,"raw_author_name":"Pedro Carpena","raw_affiliation_strings":["Division of Sleep Medicine, Brigham and Woman's Hospital, Harvard Medical School, Boston, MA, 02115, USA","Dpto. de F\u00edsica Aplicada II, E.T.S.I. de Telecomunicaci\u00f3n, Universidad de M\u00e1laga, 29071, Malaga, Spain","Brigham and Woman's Hospital, Harvard Medical School","E.T.S.I. de Telecomunicaci\u00f3n, Universidad de M\u00e1laga"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Division of Sleep Medicine, Brigham and Woman's Hospital, Harvard Medical School, Boston, MA, 02115, USA","institution_ids":["https://openalex.org/I4210148319"]},{"raw_affiliation_string":"Dpto. de F\u00edsica Aplicada II, E.T.S.I. de Telecomunicaci\u00f3n, Universidad de M\u00e1laga, 29071, Malaga, Spain","institution_ids":["https://openalex.org/I82767444"]},{"raw_affiliation_string":"Brigham and Woman's Hospital, Harvard Medical School","institution_ids":["https://openalex.org/I136199984"]},{"raw_affiliation_string":"E.T.S.I. de Telecomunicaci\u00f3n, Universidad de M\u00e1laga","institution_ids":["https://openalex.org/I82767444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050320939","display_name":"Pedro Bernaola\u2010Galv\u00e1n","orcid":"https://orcid.org/0000-0002-2895-3116"},"institutions":[{"id":"https://openalex.org/I82767444","display_name":"Universidad de M\u00e1laga","ror":"https://ror.org/036b2ww28","country_code":"ES","type":"education","lineage":["https://openalex.org/I82767444"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Pedro Bernaola-Galv\u00e1n","raw_affiliation_strings":["Dpto. de F\u00edsica Aplicada II, E.T.S.I. de Telecomunicaci\u00f3n, Universidad de M\u00e1laga, 29071, Malaga, Spain","Dpto. de F\u00edsica Aplicada II, E.T.S.I. de Telecomunicaci\u00f3n, Universidad de M\u00e1laga, Malaga, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dpto. de F\u00edsica Aplicada II, E.T.S.I. de Telecomunicaci\u00f3n, Universidad de M\u00e1laga, 29071, Malaga, Spain","institution_ids":["https://openalex.org/I82767444"]},{"raw_affiliation_string":"Dpto. de F\u00edsica Aplicada II, E.T.S.I. de Telecomunicaci\u00f3n, Universidad de M\u00e1laga, Malaga, Spain","institution_ids":["https://openalex.org/I82767444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039320926","display_name":"Guillermo Barturen","orcid":"https://orcid.org/0000-0003-2103-1028"},"institutions":[{"id":"https://openalex.org/I173304897","display_name":"Universidad de Granada","ror":"https://ror.org/04njjy449","country_code":"ES","type":"education","lineage":["https://openalex.org/I173304897"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Guillermo Barturen","raw_affiliation_strings":["Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Campus de Fuentenueva s/n, 18071-Granada & Lab. de Bioinform\u00e1tica, Centro de Investigaci\u00f3n Biom\u00e9dica, PTS, Avda. del Conocimiento s/n, 18100, Granada, Spain","Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Granada, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Campus de Fuentenueva s/n, 18071-Granada & Lab. de Bioinform\u00e1tica, Centro de Investigaci\u00f3n Biom\u00e9dica, PTS, Avda. del Conocimiento s/n, 18100, Granada, Spain","institution_ids":["https://openalex.org/I173304897"]},{"raw_affiliation_string":"Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Granada, Spain","institution_ids":["https://openalex.org/I173304897"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022023349","display_name":"A. Marti \u0301\u2013Alganza","orcid":null},"institutions":[{"id":"https://openalex.org/I173304897","display_name":"Universidad de Granada","ror":"https://ror.org/04njjy449","country_code":"ES","type":"education","lineage":["https://openalex.org/I173304897"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"\u00c1ngel M Alganza","raw_affiliation_strings":["Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Campus de Fuentenueva s/n, 18071-Granada & Lab. de Bioinform\u00e1tica, Centro de Investigaci\u00f3n Biom\u00e9dica, PTS, Avda. del Conocimiento s/n, 18100, Granada, Spain","Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Granada, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Campus de Fuentenueva s/n, 18071-Granada & Lab. de Bioinform\u00e1tica, Centro de Investigaci\u00f3n Biom\u00e9dica, PTS, Avda. del Conocimiento s/n, 18100, Granada, Spain","institution_ids":["https://openalex.org/I173304897"]},{"raw_affiliation_string":"Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Granada, Spain","institution_ids":["https://openalex.org/I173304897"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009966967","display_name":"Jos\u00e9 Luis Tejera Oliver","orcid":"https://orcid.org/0000-0003-0216-0393"},"institutions":[{"id":"https://openalex.org/I173304897","display_name":"Universidad de Granada","ror":"https://ror.org/04njjy449","country_code":"ES","type":"education","lineage":["https://openalex.org/I173304897"]}],"countries":["ES"],"is_corresponding":true,"raw_author_name":"Jos\u00e9 L Oliver","raw_affiliation_strings":["Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Campus de Fuentenueva s/n, 18071-Granada & Lab. de Bioinform\u00e1tica, Centro de Investigaci\u00f3n Biom\u00e9dica, PTS, Avda. del Conocimiento s/n, 18100, Granada, Spain","Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Granada, Spain"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Campus de Fuentenueva s/n, 18071-Granada & Lab. de Bioinform\u00e1tica, Centro de Investigaci\u00f3n Biom\u00e9dica, PTS, Avda. del Conocimiento s/n, 18100, Granada, Spain","institution_ids":["https://openalex.org/I173304897"]},{"raw_affiliation_string":"Dpto. de Gen\u00e9tica, Facultad de Ciencias, Universidad de Granada, Granada, Spain","institution_ids":["https://openalex.org/I173304897"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5009966967","https://openalex.org/A5084745527"],"corresponding_institution_ids":["https://openalex.org/I173304897"],"apc_list":{"value":1490,"currency":"GBP","value_usd":1827},"apc_paid":{"value":1490,"currency":"GBP","value_usd":1827},"fwci":1.3307,"has_fulltext":true,"cited_by_count":20,"citation_normalized_percentile":{"value":0.79877876,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"6","issue":"1","first_page":"2","last_page":"2"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.15850000083446503,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.15850000083446503,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10222","display_name":"Genomics and Chromatin Dynamics","score":0.11869999766349792,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12946","display_name":"Fractal and DNA sequence analysis","score":0.11079999804496765,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.6267122030258179},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.5892515778541565},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.5606842041015625},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5322888493537903},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.5256304144859314},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.521081805229187},{"id":"https://openalex.org/keywords/cpg-site","display_name":"CpG site","score":0.49499934911727905},{"id":"https://openalex.org/keywords/human-genome","display_name":"Human genome","score":0.4544054865837097},{"id":"https://openalex.org/keywords/genomics","display_name":"Genomics","score":0.43727195262908936},{"id":"https://openalex.org/keywords/gene-annotation","display_name":"Gene Annotation","score":0.43468955159187317},{"id":"https://openalex.org/keywords/dna-methylation","display_name":"DNA methylation","score":0.42055660486221313},{"id":"https://openalex.org/keywords/web-server","display_name":"Web server","score":0.41482478380203247},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.4005231261253357},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.36117684841156006},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.3609282374382019},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.14825758337974548},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.14769405126571655}],"concepts":[{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.6267122030258179},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.5892515778541565},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.5606842041015625},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5322888493537903},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.5256304144859314},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.521081805229187},{"id":"https://openalex.org/C140173407","wikidata":"https://www.wikidata.org/wiki/Q1138358","display_name":"CpG site","level":5,"score":0.49499934911727905},{"id":"https://openalex.org/C197077220","wikidata":"https://www.wikidata.org/wiki/Q720988","display_name":"Human genome","level":4,"score":0.4544054865837097},{"id":"https://openalex.org/C189206191","wikidata":"https://www.wikidata.org/wiki/Q222046","display_name":"Genomics","level":4,"score":0.43727195262908936},{"id":"https://openalex.org/C2908923196","wikidata":"https://www.wikidata.org/wiki/Q5205742","display_name":"Gene Annotation","level":4,"score":0.43468955159187317},{"id":"https://openalex.org/C190727270","wikidata":"https://www.wikidata.org/wiki/Q874745","display_name":"DNA methylation","level":4,"score":0.42055660486221313},{"id":"https://openalex.org/C11392498","wikidata":"https://www.wikidata.org/wiki/Q11288","display_name":"Web server","level":3,"score":0.41482478380203247},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.4005231261253357},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.36117684841156006},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.3609282374382019},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.14825758337974548},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.14769405126571655},{"id":"https://openalex.org/C150194340","wikidata":"https://www.wikidata.org/wiki/Q26972","display_name":"Gene expression","level":3,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1186/1748-7188-6-2","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1748-7188-6-2","pdf_url":"https://almob.biomedcentral.com/counter/pdf/10.1186/1748-7188-6-2","source":{"id":"https://openalex.org/S205663195","display_name":"Algorithms for Molecular Biology","issn_l":"1748-7188","issn":["1748-7188"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms for Molecular Biology","raw_type":"journal-article"},{"id":"pmid:21261981","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/21261981","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms for molecular biology : AMB","raw_type":null},{"id":"pmh:oai:digibug.ugr.es:10481/33377","is_oa":false,"landing_page_url":"http://hdl.handle.net/10481/33377","pdf_url":null,"source":{"id":"https://openalex.org/S4306400567","display_name":"Institutional Repository of the University of Granada (University of Granada)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I173304897","host_organization_name":"Universidad de Granada","host_organization_lineage":["https://openalex.org/I173304897"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:doaj.org/article:f60c5491426c4bf2b5d70fedadae2138","is_oa":false,"landing_page_url":"https://doaj.org/article/f60c5491426c4bf2b5d70fedadae2138","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Algorithms for Molecular Biology, Vol 6, Iss 1, p 2 (2011)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:3037320","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/3037320","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Algorithms Mol Biol","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/1748-7188-6-2","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1748-7188-6-2","pdf_url":"https://almob.biomedcentral.com/counter/pdf/10.1186/1748-7188-6-2","source":{"id":"https://openalex.org/S205663195","display_name":"Algorithms for Molecular Biology","issn_l":"1748-7188","issn":["1748-7188"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Algorithms for Molecular Biology","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320326754","display_name":"Junta de Andaluc\u00eda","ror":"https://ror.org/01jem9c82"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2098188217.pdf","grobid_xml":"https://content.openalex.org/works/W2098188217.grobid-xml"},"referenced_works_count":18,"referenced_works":["https://openalex.org/W1531954825","https://openalex.org/W2011399892","https://openalex.org/W2022846158","https://openalex.org/W2054883945","https://openalex.org/W2059099579","https://openalex.org/W2084748297","https://openalex.org/W2102619694","https://openalex.org/W2103017472","https://openalex.org/W2107903949","https://openalex.org/W2119022656","https://openalex.org/W2123047097","https://openalex.org/W2126804125","https://openalex.org/W2145191876","https://openalex.org/W2161399316","https://openalex.org/W2161645441","https://openalex.org/W2414817931","https://openalex.org/W2740984310","https://openalex.org/W4210430020"],"related_works":["https://openalex.org/W3012096999","https://openalex.org/W2009940763","https://openalex.org/W1976142521","https://openalex.org/W4383032973","https://openalex.org/W4200520333","https://openalex.org/W2981857975","https://openalex.org/W2884291362","https://openalex.org/W2343917130","https://openalex.org/W2130867076","https://openalex.org/W2129156298"],"abstract_inverted_index":{"BACKGROUND:":[0],"Many":[1],"k-mers":[2],"(or":[3],"DNA":[4,72,180],"words)":[5],"and":[6,29,54,87,145,183],"genomic":[7,78,184],"elements":[8],"are":[9,21],"known":[10],"to":[11,37,68,101,156,174],"be":[12,130],"spatially":[13],"clustered":[14],"in":[15,41,132,167],"the":[16,22,82,94,108,115,122,137,148,168,189,203,211],"genome.":[17,170],"Well":[18],"established":[19],"examples":[20],"genes,":[23],"TFBSs,":[24],"CpG":[25],"dinucleotides,":[26],"microRNA":[27],"genes":[28,166],"ultra-conserved":[30],"non-coding":[31],"regions.":[32],"Currently,":[33],"no":[34],"algorithm":[35,67],"exists":[36],"find":[38],"these":[39],"clusters":[40,70,123,161,178],"a":[42,97,102,192],"statistically":[43,159],"comprehensible":[44],"way.":[45],"The":[46,186],"detection":[47,204],"of":[48,71,117,124,139,147,162,179,188,205,218],"clustering":[49],"often":[50],"relies":[51],"on":[52,81],"densities":[53],"sliding-window":[55],"approaches":[56],"or":[57,75,210],"arbitrarily":[58],"chosen":[59],"distance":[60,83],"thresholds.":[61],"RESULTS:":[62],"We":[63,92,113],"introduce":[64],"here":[65],"an":[66,88],"detect":[69],"words":[73,181],"(k-mers),":[74],"any":[76],"other":[77],"element,":[79],"based":[80],"between":[84,143],"consecutive":[85],"copies":[86],"assigned":[89],"statistical":[90],"significance.":[91],"implemented":[93],"method":[95,190],"into":[96,191],"web":[98,193],"server":[99,194],"connected":[100],"MySQL":[103],"backend,":[104],"which":[105],"also":[106],"determines":[107],"co-localization":[109,206],"with":[110,207],"gene":[111,208],"annotations.":[112],"demonstrate":[114],"usefulness":[116],"this":[118],"approach":[119],"by":[120],"detecting":[121],"CAG/CTG":[125],"(cytosine":[126],"contexts":[127],"that":[128,136],"can":[129],"methylated":[131],"undifferentiated":[133],"cells),":[134],"showing":[135],"degree":[138],"methylation":[140],"vary":[141],"drastically":[142],"inside":[144],"outside":[146],"clusters.":[149],"As":[150],"another":[151],"example,":[152],"we":[153],"used":[154],"WordCluster":[155,172],"search":[157],"for":[158,215],"significant":[160],"olfactory":[163],"receptor":[164],"(OR)":[165],"human":[169],"CONCLUSIONS:":[171],"seems":[173],"predict":[175],"biological":[176],"meaningful":[177],"(k-mers)":[182],"entities.":[185],"implementation":[187],"is":[195],"available":[196],"at":[197],"http://bioinfo2.ugr.es/wordCluster/wordCluster.php":[198],"including":[199],"additional":[200],"features":[201],"like":[202],"regions":[209],"annotation":[212],"enrichment":[213],"tool":[214],"functional":[216],"analysis":[217],"overlapped":[219],"genes.":[220]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":3}],"updated_date":"2026-06-19T15:47:20.252518","created_date":"2025-10-10T00:00:00"}
