{"id":"https://openalex.org/W2800198679","doi":"https://doi.org/10.1371/journal.pcbi.1006097","title":"A machine learning based framework to identify and classify long terminal repeat retrotransposons","display_name":"A machine learning based framework to identify and classify long terminal repeat retrotransposons","publication_year":2018,"publication_date":"2018-04-23","ids":{"openalex":"https://openalex.org/W2800198679","doi":"https://doi.org/10.1371/journal.pcbi.1006097","mag":"2800198679","pmid":"https://pubmed.ncbi.nlm.nih.gov/29684010"},"language":"en","primary_location":{"id":"doi:10.1371/journal.pcbi.1006097","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1006097","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1006097&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1006097&type=printable","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056559240","display_name":"Leander Schietgat","orcid":"https://orcid.org/0000-0002-2097-0974"},"institutions":[{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Leander Schietgat","raw_affiliation_strings":["Department of Computer Science, KU Leuven, Leuven, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, KU Leuven, Leuven, Belgium","institution_ids":["https://openalex.org/I99464096"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044903173","display_name":"Celine Vens","orcid":"https://orcid.org/0000-0003-0983-256X"},"institutions":[{"id":"https://openalex.org/I32597200","display_name":"Ghent University","ror":"https://ror.org/00cv9y106","country_code":"BE","type":"education","lineage":["https://openalex.org/I32597200"]},{"id":"https://openalex.org/I4210139803","display_name":"VIB-UGent Center for Inflammation Research","ror":"https://ror.org/04q4ydz28","country_code":"BE","type":"facility","lineage":["https://openalex.org/I2802017950","https://openalex.org/I32597200","https://openalex.org/I4210139803"]},{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Celine Vens","raw_affiliation_strings":["Department of Computer Science, KU Leuven, Leuven, Belgium","Department of Public Health and Primary Care, KU Leuven Kulak, Kortrijk, Belgium","Department of Respiratory Medicine, Ghent University, and VIB Inflammation Research Center, Ghent, Belgium"],"raw_orcid":"https://orcid.org/0000-0003-0983-256X","affiliations":[{"raw_affiliation_string":"Department of Computer Science, KU Leuven, Leuven, Belgium","institution_ids":["https://openalex.org/I99464096"]},{"raw_affiliation_string":"Department of Public Health and Primary Care, KU Leuven Kulak, Kortrijk, Belgium","institution_ids":["https://openalex.org/I99464096"]},{"raw_affiliation_string":"Department of Respiratory Medicine, Ghent University, and VIB Inflammation Research Center, Ghent, Belgium","institution_ids":["https://openalex.org/I4210139803","https://openalex.org/I32597200"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066866262","display_name":"Ricardo Cerri","orcid":"https://orcid.org/0000-0002-2582-1695"},"institutions":[{"id":"https://openalex.org/I177909021","display_name":"Universidade Federal de S\u00e3o Carlos","ror":"https://ror.org/00qdc6m37","country_code":"BR","type":"education","lineage":["https://openalex.org/I177909021"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Ricardo Cerri","raw_affiliation_strings":["Department of Computer Science, UFSCar Federal University of S\u00e3o Carlos, S\u00e3o Carlos, S\u00e3o Paulo, Brazil"],"raw_orcid":"https://orcid.org/0000-0002-2582-1695","affiliations":[{"raw_affiliation_string":"Department of Computer Science, UFSCar Federal University of S\u00e3o Carlos, S\u00e3o Carlos, S\u00e3o Paulo, Brazil","institution_ids":["https://openalex.org/I177909021"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045524441","display_name":"Carlos Norberto Fischer","orcid":"https://orcid.org/0000-0002-5598-6263"},"institutions":[{"id":"https://openalex.org/I879563668","display_name":"Universidade Estadual Paulista (Unesp)","ror":"https://ror.org/00987cb86","country_code":"BR","type":"education","lineage":["https://openalex.org/I879563668"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Carlos N. Fischer","raw_affiliation_strings":["Department of Statistics, Applied Mathematics, and Computer Science, UNESP S\u00e3o Paulo State University, Rio Claro, S\u00e3o Paulo, Brazil"],"raw_orcid":"https://orcid.org/0000-0002-5598-6263","affiliations":[{"raw_affiliation_string":"Department of Statistics, Applied Mathematics, and Computer Science, UNESP S\u00e3o Paulo State University, Rio Claro, S\u00e3o Paulo, Brazil","institution_ids":["https://openalex.org/I879563668"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080804854","display_name":"Eduardo Paulino da Costa","orcid":"https://orcid.org/0000-0001-7210-8190"},"institutions":[{"id":"https://openalex.org/I17974374","display_name":"Universidade de S\u00e3o Paulo","ror":"https://ror.org/036rp1748","country_code":"BR","type":"education","lineage":["https://openalex.org/I17974374"]},{"id":"https://openalex.org/I4210131883","display_name":"Brazilian Society of Computational and Applied Mathematics","ror":"https://ror.org/03kcw4w74","country_code":"BR","type":"other","lineage":["https://openalex.org/I4210131883"]},{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE","BR"],"is_corresponding":false,"raw_author_name":"Eduardo Costa","raw_affiliation_strings":["Department of Computer Science, KU Leuven, Leuven, Belgium","Instituto de Ci\u00eancias Matem\u00e1ticas e de Computa\u00e7\u00e3o, Universidade de S\u00e3o Paulo, S\u00e3o Carlos, S\u00e3o Paulo, Brazil"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, KU Leuven, Leuven, Belgium","institution_ids":["https://openalex.org/I99464096"]},{"raw_affiliation_string":"Instituto de Ci\u00eancias Matem\u00e1ticas e de Computa\u00e7\u00e3o, Universidade de S\u00e3o Paulo, S\u00e3o Carlos, S\u00e3o Paulo, Brazil","institution_ids":["https://openalex.org/I4210131883","https://openalex.org/I17974374"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077665746","display_name":"Jan Ramon","orcid":"https://orcid.org/0000-0002-0558-7176"},"institutions":[{"id":"https://openalex.org/I1326498283","display_name":"Institut national de recherche en sciences et technologies du num\u00e9rique","ror":"https://ror.org/02kvxyf05","country_code":"FR","type":"government","lineage":["https://openalex.org/I1326498283"]},{"id":"https://openalex.org/I4210138412","display_name":"Centre Inria de l'Universit\u00e9 de Lille","ror":"https://ror.org/04eej9726","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1326498283","https://openalex.org/I4210138412"]},{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE","FR"],"is_corresponding":false,"raw_author_name":"Jan Ramon","raw_affiliation_strings":["Department of Computer Science, KU Leuven, Leuven, Belgium","INRIA Lille Nord Europe, 40 avenue Halley, 59650 Villeneuve d'Ascq, France","INRIA Lille Nord Europe, 40 avenue Halley, 59650 Villeneuve d\u2019Ascq, France"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Computer Science, KU Leuven, Leuven, Belgium","institution_ids":["https://openalex.org/I99464096"]},{"raw_affiliation_string":"INRIA Lille Nord Europe, 40 avenue Halley, 59650 Villeneuve d'Ascq, France","institution_ids":["https://openalex.org/I4210138412"]},{"raw_affiliation_string":"INRIA Lille Nord Europe, 40 avenue Halley, 59650 Villeneuve d\u2019Ascq, France","institution_ids":["https://openalex.org/I4210138412","https://openalex.org/I1326498283"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037469330","display_name":"Cl\u00e1udia M. A. Carareto","orcid":"https://orcid.org/0000-0002-0298-1354"},"institutions":[{"id":"https://openalex.org/I879563668","display_name":"Universidade Estadual Paulista (Unesp)","ror":"https://ror.org/00987cb86","country_code":"BR","type":"education","lineage":["https://openalex.org/I879563668"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Claudia M. A. Carareto","raw_affiliation_strings":["Department of Biology, UNESP S\u00e3o Paulo State University, S\u00e3o Jos\u00e9 do Rio Preto, S\u00e3o Paulo, Brazil"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Biology, UNESP S\u00e3o Paulo State University, S\u00e3o Jos\u00e9 do Rio Preto, S\u00e3o Paulo, Brazil","institution_ids":["https://openalex.org/I879563668"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086906175","display_name":"Hendrik Blockeel","orcid":"https://orcid.org/0000-0003-0378-3699"},"institutions":[{"id":"https://openalex.org/I99464096","display_name":"KU Leuven","ror":"https://ror.org/05f950310","country_code":"BE","type":"education","lineage":["https://openalex.org/I99464096"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Hendrik Blockeel","raw_affiliation_strings":["Department of Computer Science, KU Leuven, Leuven, Belgium"],"raw_orcid":"https://orcid.org/0000-0003-0378-3699","affiliations":[{"raw_affiliation_string":"Department of Computer Science, KU Leuven, Leuven, Belgium","institution_ids":["https://openalex.org/I99464096"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5044903173"],"corresponding_institution_ids":["https://openalex.org/I32597200","https://openalex.org/I4210139803","https://openalex.org/I99464096"],"apc_list":{"value":2655,"currency":"USD","value_usd":2655},"apc_paid":{"value":2655,"currency":"USD","value_usd":2655},"fwci":8.0932,"has_fulltext":true,"cited_by_count":43,"citation_normalized_percentile":{"value":0.96883977,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"14","issue":"4","first_page":"e1006097","last_page":"e1006097"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10434","display_name":"Chromosomal and Genetic Variations","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10434","display_name":"Chromosomal and Genetic Variations","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1110","display_name":"Plant Science"},"field":{"id":"https://openalex.org/fields/11","display_name":"Agricultural and Biological Sciences"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9735999703407288,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/retrotransposon","display_name":"Retrotransposon","score":0.8894602656364441},{"id":"https://openalex.org/keywords/genome","display_name":"Genome","score":0.8240660429000854},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.665435791015625},{"id":"https://openalex.org/keywords/transposable-element","display_name":"Transposable element","score":0.6319805383682251},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.6318310499191284},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.6200897693634033},{"id":"https://openalex.org/keywords/long-terminal-repeat","display_name":"Long terminal repeat","score":0.5915048122406006},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.514607310295105},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.48896896839141846},{"id":"https://openalex.org/keywords/drosophila-melanogaster","display_name":"Drosophila melanogaster","score":0.4874551296234131},{"id":"https://openalex.org/keywords/genome-evolution","display_name":"Genome evolution","score":0.45483797788619995},{"id":"https://openalex.org/keywords/genomics","display_name":"Genomics","score":0.42506372928619385},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3882675766944885},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.3743289113044739},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.2902296781539917}],"concepts":[{"id":"https://openalex.org/C7029365","wikidata":"https://www.wikidata.org/wiki/Q413988","display_name":"Retrotransposon","level":5,"score":0.8894602656364441},{"id":"https://openalex.org/C141231307","wikidata":"https://www.wikidata.org/wiki/Q7020","display_name":"Genome","level":3,"score":0.8240660429000854},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.665435791015625},{"id":"https://openalex.org/C4918238","wikidata":"https://www.wikidata.org/wiki/Q121438","display_name":"Transposable element","level":4,"score":0.6319805383682251},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.6318310499191284},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.6200897693634033},{"id":"https://openalex.org/C199491388","wikidata":"https://www.wikidata.org/wiki/Q1869477","display_name":"Long terminal repeat","level":4,"score":0.5915048122406006},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.514607310295105},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.48896896839141846},{"id":"https://openalex.org/C2780104201","wikidata":"https://www.wikidata.org/wiki/Q130888","display_name":"Drosophila melanogaster","level":3,"score":0.4874551296234131},{"id":"https://openalex.org/C174600577","wikidata":"https://www.wikidata.org/wiki/Q5533491","display_name":"Genome evolution","level":4,"score":0.45483797788619995},{"id":"https://openalex.org/C189206191","wikidata":"https://www.wikidata.org/wiki/Q222046","display_name":"Genomics","level":4,"score":0.42506372928619385},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3882675766944885},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.3743289113044739},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.2902296781539917},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000069550","descriptor_name":"Machine Learning","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000818","descriptor_name":"Animals","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000818","descriptor_name":"Animals","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000818","descriptor_name":"Animals","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003663","descriptor_name":"Decision Trees","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003663","descriptor_name":"Decision Trees","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003663","descriptor_name":"Decision Trees","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D004331","descriptor_name":"Drosophila melanogaster","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D004331","descriptor_name":"Drosophila melanogaster","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D004331","descriptor_name":"Drosophila melanogaster","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017124","descriptor_name":"Conserved Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017124","descriptor_name":"Conserved Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017124","descriptor_name":"Conserved Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017360","descriptor_name":"Arabidopsis","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D017360","descriptor_name":"Arabidopsis","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D017360","descriptor_name":"Arabidopsis","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D018626","descriptor_name":"Retroelements","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D018626","descriptor_name":"Retroelements","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D018626","descriptor_name":"Retroelements","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D018744","descriptor_name":"DNA, Plant","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D018744","descriptor_name":"DNA, Plant","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D018744","descriptor_name":"DNA, Plant","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D018745","descriptor_name":"Genome, Plant","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D018745","descriptor_name":"Genome, Plant","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D018745","descriptor_name":"Genome, Plant","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019143","descriptor_name":"Evolution, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019143","descriptor_name":"Evolution, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019143","descriptor_name":"Evolution, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020079","descriptor_name":"Terminal Repeat Sequences","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D020079","descriptor_name":"Terminal Repeat Sequences","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D020079","descriptor_name":"Terminal Repeat Sequences","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D029681","descriptor_name":"Arabidopsis Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D029681","descriptor_name":"Arabidopsis Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D029681","descriptor_name":"Arabidopsis Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D029721","descriptor_name":"Drosophila Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D029721","descriptor_name":"Drosophila Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D029721","descriptor_name":"Drosophila Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D049750","descriptor_name":"Genome, Insect","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D049750","descriptor_name":"Genome, Insect","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D049750","descriptor_name":"Genome, Insect","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":9,"locations":[{"id":"doi:10.1371/journal.pcbi.1006097","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1006097","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1006097&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},{"id":"pmid:29684010","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/29684010","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLoS computational biology","raw_type":null},{"id":"pmh:oai:americanae.aecid.es:1809767","is_oa":true,"landing_page_url":"http://doi.org/10.1371/journal.pcbi.1006097","pdf_url":null,"source":{"id":"https://openalex.org/S4306400786","display_name":"Americanae (AECID Library)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"reponame:Reposit\u00f3rio Institucional da UNESP","raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:HAL:hal-01814669v1","is_oa":false,"landing_page_url":"https://inria.hal.science/hal-01814669","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Computational Biology, 2018, 14 (4), pp.1-21. &#x27E8;10.1371/journal.pcbi.1006097&#x27E9;","raw_type":"Journal articles"},{"id":"pmh:oai:archive.ugent.be:8564421","is_oa":true,"landing_page_url":"http://hdl.handle.net/1854/LU-8564421","pdf_url":null,"source":{"id":"https://openalex.org/S4306400478","display_name":"Ghent University Academic Bibliography (Ghent University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I32597200","host_organization_name":"Ghent University","host_organization_lineage":["https://openalex.org/I32597200"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"ISSN: 1553-7358","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:doaj.org/article:cf658bdc5f624a4aa584c028da619c4a","is_oa":false,"landing_page_url":"https://doaj.org/article/cf658bdc5f624a4aa584c028da619c4a","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Computational Biology, Vol 14, Iss 4, p e1006097 (2018)","raw_type":"article"},{"id":"pmh:oai:europepmc.org:4875219","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/5933816","pdf_url":null,"source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Text"},{"id":"pmh:oai:lilloa.univ-lille.fr:20.500.12210/23248","is_oa":true,"landing_page_url":"http://hdl.handle.net/20.500.12210/23248","pdf_url":null,"source":{"id":"https://openalex.org/S4306402203","display_name":"LillOA (Universit\u00e9 de Lille (University Of Lille))","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210123514","host_organization_name":"Centre d'Etudes en Civilisations, Langues et Litt\u00e9ratures Etrang\u00e8res","host_organization_lineage":["https://openalex.org/I4210123514"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:repositorio.unesp.br:11449/176256","is_oa":true,"landing_page_url":"http://hdl.handle.net/11449/176256","pdf_url":null,"source":{"id":"https://openalex.org/S4377196277","display_name":"UNESP Institutional Repository (S\u00e3o Paulo State University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I879563668","host_organization_name":"Universidade Estadual Paulista (Unesp)","host_organization_lineage":["https://openalex.org/I879563668"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"instacron:UNESP","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"doi:10.1371/journal.pcbi.1006097","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1006097","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1006097&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2920387762","display_name":null,"funder_award_id":"2013/15070-4","funder_id":"https://openalex.org/F4320320997","funder_display_name":"Funda\u00e7\u00e3o de Amparo \u00e0 Pesquisa do Estado de S\u00e3o Paulo"},{"id":"https://openalex.org/G4402799499","display_name":null,"funder_award_id":"2015/","funder_id":"https://openalex.org/F4320320997","funder_display_name":"Funda\u00e7\u00e3o de Amparo \u00e0 Pesquisa do Estado de S\u00e3o Paulo"},{"id":"https://openalex.org/G6489909288","display_name":null,"funder_award_id":"2015/14300-1","funder_id":"https://openalex.org/F4320320997","funder_display_name":"Funda\u00e7\u00e3o de Amparo \u00e0 Pesquisa do Estado de S\u00e3o Paulo"},{"id":"https://openalex.org/G998091443","display_name":null,"funder_award_id":"306493/2013-6","funder_id":"https://openalex.org/F4320322025","funder_display_name":"Conselho Nacional de Desenvolvimento Cient\u00edfico e Tecnol\u00f3gico"}],"funders":[{"id":"https://openalex.org/F4320320997","display_name":"Funda\u00e7\u00e3o de Amparo \u00e0 Pesquisa do Estado de S\u00e3o Paulo","ror":"https://ror.org/02ddkpn78"},{"id":"https://openalex.org/F4320321091","display_name":"Coordena\u00e7\u00e3o de Aperfei\u00e7oamento de Pessoal de N\u00edvel Superior","ror":"https://ror.org/00x0ma614"},{"id":"https://openalex.org/F4320321730","display_name":"Fonds Wetenschappelijk Onderzoek","ror":"https://ror.org/03qtxy027"},{"id":"https://openalex.org/F4320322025","display_name":"Conselho Nacional de Desenvolvimento Cient\u00edfico e Tecnol\u00f3gico","ror":"https://ror.org/03swz6y49"},{"id":"https://openalex.org/F4320322308","display_name":"KU Leuven","ror":"https://ror.org/05f950310"},{"id":"https://openalex.org/F4320325879","display_name":"Universidade Estadual Paulista","ror":"https://ror.org/00987cb86"},{"id":"https://openalex.org/F4320327336","display_name":"Vlaamse regering","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2800198679.pdf","grobid_xml":"https://content.openalex.org/works/W2800198679.grobid-xml"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W59589783","https://openalex.org/W1594031697","https://openalex.org/W1700914952","https://openalex.org/W1746365244","https://openalex.org/W1964386992","https://openalex.org/W1969465720","https://openalex.org/W1976526581","https://openalex.org/W1980369994","https://openalex.org/W2011519640","https://openalex.org/W2013475097","https://openalex.org/W2018789136","https://openalex.org/W2021344630","https://openalex.org/W2033049603","https://openalex.org/W2033072307","https://openalex.org/W2036666081","https://openalex.org/W2054254276","https://openalex.org/W2059864757","https://openalex.org/W2060866626","https://openalex.org/W2082330286","https://openalex.org/W2125055259","https://openalex.org/W2129581281","https://openalex.org/W2130212962","https://openalex.org/W2132141594","https://openalex.org/W2133666768","https://openalex.org/W2140141795","https://openalex.org/W2146373732","https://openalex.org/W2150781353","https://openalex.org/W2169859562","https://openalex.org/W2416263659","https://openalex.org/W2524126439","https://openalex.org/W2911964244","https://openalex.org/W2915880292","https://openalex.org/W3085162807","https://openalex.org/W6678449394","https://openalex.org/W6843735874"],"related_works":["https://openalex.org/W2089350008","https://openalex.org/W2990154534","https://openalex.org/W113856995","https://openalex.org/W3145616024","https://openalex.org/W2054036000","https://openalex.org/W2004644512","https://openalex.org/W2402665505","https://openalex.org/W2064967612","https://openalex.org/W2094923272","https://openalex.org/W2131802411"],"abstract_inverted_index":{"Transposable":[0],"elements":[1],"(TEs)":[2],"are":[3,226],"repetitive":[4],"nucleotide":[5],"sequences":[6],"that":[7,71,189,197,221],"make":[8,183],"up":[9],"a":[10,22,44,65,76,81,95,232],"large":[11],"portion":[12],"of":[13,40,89,98,115,122,141,174,199,223],"eukaryotic":[14],"genomes.":[15],"They":[16],"can":[17],"move":[18],"and":[19,27,33,38,56,79,125,128,153,182,205],"duplicate":[20],"within":[21,32],"genome,":[23],"increasing":[24],"genome":[25,45,60,78],"size":[26],"contributing":[28],"to":[29,83,157,164,179,194,214,231],"genetic":[30],"diversity":[31],"across":[34],"species.":[35],"Accurate":[36],"identification":[37,148],"classification":[39,82],"TEs":[41,74,99,196],"present":[42,86],"in":[43,59,75,172,227],"is":[46,161],"an":[47,87,215],"important":[48],"step":[49],"towards":[50,92],"understanding":[51],"their":[52,57,108],"effects":[53],"on":[54,68,118],"genes":[55],"role":[58],"evolution.":[61],"We":[62,85,110],"introduce":[63],"TE-Learner,":[64],"framework":[66,91,117],"based":[67],"machine":[69,166],"learning":[70,167],"automatically":[72],"identifies":[73],"given":[77],"assigns":[80],"them.":[84],"implementation":[88],"our":[90,116,131,190],"LTR":[93,135],"retrotransposons,":[94],"particular":[96],"type":[97],"characterized":[100],"by":[101],"having":[102],"long":[103],"terminal":[104],"repeats":[105],"(LTRs)":[106],"at":[107],"boundaries.":[109],"evaluate":[111],"the":[112,119,139,162,200],"predictive":[113,175],"performance":[114],"well-annotated":[120],"genomes":[121],"Drosophila":[123],"melanogaster":[124],"Arabidopsis":[126],"thaliana":[127],"we":[129,187,206],"compare":[130],"results":[132,140],"for":[133,146],"three":[134,142],"retrotransposon":[136],"superfamilies":[137],"with":[138],"widely":[143],"used":[144],"methods":[145,171],"TE":[147],"or":[149],"classification:":[150],"RepeatMasker,":[151],"Censor":[152],"LtrDigest.":[154],"In":[155],"contrast":[156],"these":[158,170,224],"methods,":[159],"TE-Learner":[160],"first":[163],"incorporate":[165],"techniques,":[168],"outperforming":[169],"terms":[173],"performance,":[176],"while":[177],"able":[178,193],"learn":[180],"models":[181],"predictions":[184,209,225],"efficiently.":[185],"Moreover,":[186],"show":[188],"method":[191,202],"was":[192],"identify":[195],"none":[198],"above":[201],"could":[203],"find,":[204],"investigated":[207],"TE-Learner's":[208],"which":[210],"did":[211],"not":[212],"correspond":[213],"official":[216],"annotation.":[217],"It":[218],"turns":[219],"out":[220],"many":[222],"fact":[228],"strongly":[229],"homologous":[230],"known":[233],"TE.":[234]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":8},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":10},{"year":2018,"cited_by_count":1}],"updated_date":"2026-05-07T13:39:58.223016","created_date":"2025-10-10T00:00:00"}
