{"id":"https://openalex.org/W2490955734","doi":"https://doi.org/10.1371/journal.pcbi.1005038","title":"Improvement in Protein Domain Identification Is Reached by Breaking Consensus, with the Agreement of Many Profiles and Domain Co-occurrence","display_name":"Improvement in Protein Domain Identification Is Reached by Breaking Consensus, with the Agreement of Many Profiles and Domain Co-occurrence","publication_year":2016,"publication_date":"2016-07-29","ids":{"openalex":"https://openalex.org/W2490955734","doi":"https://doi.org/10.1371/journal.pcbi.1005038","mag":"2490955734","pmid":"https://pubmed.ncbi.nlm.nih.gov/27472895"},"language":"en","primary_location":{"id":"doi:10.1371/journal.pcbi.1005038","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1005038","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1005038&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1005038&type=printable","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089115213","display_name":"Juliana Bernardes","orcid":"https://orcid.org/0000-0003-1341-4256"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I39804081","display_name":"Sorbonne Universit\u00e9","ror":"https://ror.org/02en5vm52","country_code":"FR","type":"education","lineage":["https://openalex.org/I39804081"]},{"id":"https://openalex.org/I4210097156","display_name":"Biologie Computationnelle, Quantitative et Synth\u00e9tique","ror":"https://ror.org/00pcqj134","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I39804081","https://openalex.org/I4210096427","https://openalex.org/I4210097156"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Juliana Bernardes","raw_affiliation_strings":["Sorbonne Universit\u00e9s, UPMC Univ-Paris 6, CNRS, UMR 7238, Laboratoire de Biologie Computationnelle et Quantitative, Paris, France","LCQB - Biologie Computationnelle et Quantitative = Laboratory of Computational and Quantitative Biology (Biologie Computationnelle et Quantitative UMR 7238 CNRS-Universit\u00e9 Pierre et Marie Curie Site des Cordeliers B\u00e2t. A - 4\u00e8me \u00e9tage, 15, Rue de l'Ecole de M\u00e9decine 75006 Paris, France - France)"],"affiliations":[{"raw_affiliation_string":"Sorbonne Universit\u00e9s, UPMC Univ-Paris 6, CNRS, UMR 7238, Laboratoire de Biologie Computationnelle et Quantitative, Paris, France","institution_ids":["https://openalex.org/I39804081","https://openalex.org/I4210097156","https://openalex.org/I1294671590"]},{"raw_affiliation_string":"LCQB - Biologie Computationnelle et Quantitative = Laboratory of Computational and Quantitative Biology (Biologie Computationnelle et Quantitative UMR 7238 CNRS-Universit\u00e9 Pierre et Marie Curie Site des Cordeliers B\u00e2t. A - 4\u00e8me \u00e9tage, 15, Rue de l'Ecole de M\u00e9decine 75006 Paris, France - France)","institution_ids":["https://openalex.org/I4210097156","https://openalex.org/I1294671590"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012291023","display_name":"Gerson Zaverucha","orcid":"https://orcid.org/0000-0002-3641-6839"},"institutions":[{"id":"https://openalex.org/I122140584","display_name":"Universidade Federal do Rio de Janeiro","ror":"https://ror.org/03490as77","country_code":"BR","type":"education","lineage":["https://openalex.org/I122140584"]}],"countries":["BR"],"is_corresponding":false,"raw_author_name":"Gerson Zaverucha","raw_affiliation_strings":["COPPE, Programa de Engenharia de Sistemas e Computa\u00e7\u00e3o, Universidade Federal do Rio de Janeiro, Rio de Janeiro, Brazil","COPPE-UFRJ - Instituto Alberto Luiz Coimbra de P\u00f3s-Gradua\u00e7\u00e3o e Pesquisa de Engenharia (Cidade Universit\u00e1ria Centro de Tecnologia, Bloco G, sala 101 Ilha do Fund\u00e3o CEP: 21945-970 Caixa Postal: 68501 Rio de Janeiro - RJ - Brasil - Brazil)"],"affiliations":[{"raw_affiliation_string":"COPPE, Programa de Engenharia de Sistemas e Computa\u00e7\u00e3o, Universidade Federal do Rio de Janeiro, Rio de Janeiro, Brazil","institution_ids":["https://openalex.org/I122140584"]},{"raw_affiliation_string":"COPPE-UFRJ - Instituto Alberto Luiz Coimbra de P\u00f3s-Gradua\u00e7\u00e3o e Pesquisa de Engenharia (Cidade Universit\u00e1ria Centro de Tecnologia, Bloco G, sala 101 Ilha do Fund\u00e3o CEP: 21945-970 Caixa Postal: 68501 Rio de Janeiro - RJ - Brasil - Brazil)","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024201288","display_name":"Catherine Vaquero","orcid":"https://orcid.org/0000-0001-9224-822X"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I154526488","display_name":"Inserm","ror":"https://ror.org/02vjkv261","country_code":"FR","type":"government","lineage":["https://openalex.org/I154526488"]},{"id":"https://openalex.org/I39804081","display_name":"Sorbonne Universit\u00e9","ror":"https://ror.org/02en5vm52","country_code":"FR","type":"education","lineage":["https://openalex.org/I39804081"]},{"id":"https://openalex.org/I4210128915","display_name":"Centre d'Immunologie et des Maladies Infectieuses","ror":"https://ror.org/0375b8f90","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I154526488","https://openalex.org/I39804081","https://openalex.org/I4210096427","https://openalex.org/I4210128915"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Catherine Vaquero","raw_affiliation_strings":["Sorbonne Universit\u00e9s, UPMC Univ-Paris 6, INSERM U1135, CNRS ERL 8255, Centre d'Immunologie et des Maladies Infectieuses (CIMI-Paris), Paris, France","CIMI - Centre d'Immunologie et de Maladies Infectieuses (91 Boulevard de l'h\u00f4pital 75013 Paris - France)"],"affiliations":[{"raw_affiliation_string":"Sorbonne Universit\u00e9s, UPMC Univ-Paris 6, INSERM U1135, CNRS ERL 8255, Centre d'Immunologie et des Maladies Infectieuses (CIMI-Paris), Paris, France","institution_ids":["https://openalex.org/I154526488","https://openalex.org/I39804081","https://openalex.org/I4210128915","https://openalex.org/I1294671590"]},{"raw_affiliation_string":"CIMI - Centre d'Immunologie et de Maladies Infectieuses (91 Boulevard de l'h\u00f4pital 75013 Paris - France)","institution_ids":["https://openalex.org/I4210128915"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038174177","display_name":"Alessandra Carbone","orcid":"https://orcid.org/0000-0003-2098-5743"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I185839726","display_name":"Institut Universitaire de France","ror":"https://ror.org/055khg266","country_code":"FR","type":"education","lineage":["https://openalex.org/I185839726"]},{"id":"https://openalex.org/I39804081","display_name":"Sorbonne Universit\u00e9","ror":"https://ror.org/02en5vm52","country_code":"FR","type":"education","lineage":["https://openalex.org/I39804081"]},{"id":"https://openalex.org/I4210097156","display_name":"Biologie Computationnelle, Quantitative et Synth\u00e9tique","ror":"https://ror.org/00pcqj134","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I39804081","https://openalex.org/I4210096427","https://openalex.org/I4210097156"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Alessandra Carbone","raw_affiliation_strings":["Institut Universitaire de France, Paris, France","Sorbonne Universit\u00e9s, UPMC Univ-Paris 6, CNRS, UMR 7238, Laboratoire de Biologie Computationnelle et Quantitative, Paris, France","LCQB - Biologie Computationnelle et Quantitative = Laboratory of Computational and Quantitative Biology (Biologie Computationnelle et Quantitative UMR 7238 CNRS-Universit\u00e9 Pierre et Marie Curie Site des Cordeliers B\u00e2t. A - 4\u00e8me \u00e9tage, 15, Rue de l'Ecole de M\u00e9decine 75006 Paris, France - France)","IUF - Institut universitaire de France (Maison des Universit\u00e9s 103 Boulevard Saint-Michel 75005 Paris - France)"],"affiliations":[{"raw_affiliation_string":"Institut Universitaire de France, Paris, France","institution_ids":["https://openalex.org/I185839726"]},{"raw_affiliation_string":"Sorbonne Universit\u00e9s, UPMC Univ-Paris 6, CNRS, UMR 7238, Laboratoire de Biologie Computationnelle et Quantitative, Paris, France","institution_ids":["https://openalex.org/I39804081","https://openalex.org/I4210097156","https://openalex.org/I1294671590"]},{"raw_affiliation_string":"LCQB - Biologie Computationnelle et Quantitative = Laboratory of Computational and Quantitative Biology (Biologie Computationnelle et Quantitative UMR 7238 CNRS-Universit\u00e9 Pierre et Marie Curie Site des Cordeliers B\u00e2t. A - 4\u00e8me \u00e9tage, 15, Rue de l'Ecole de M\u00e9decine 75006 Paris, France - France)","institution_ids":["https://openalex.org/I4210097156","https://openalex.org/I1294671590"]},{"raw_affiliation_string":"IUF - Institut universitaire de France (Maison des Universit\u00e9s 103 Boulevard Saint-Michel 75005 Paris - France)","institution_ids":["https://openalex.org/I185839726"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5038174177","https://openalex.org/A5089115213"],"corresponding_institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I185839726","https://openalex.org/I39804081","https://openalex.org/I4210097156"],"apc_list":{"value":2655,"currency":"USD","value_usd":2655},"apc_paid":{"value":2655,"currency":"USD","value_usd":2655},"fwci":2.6147,"has_fulltext":true,"cited_by_count":31,"citation_normalized_percentile":{"value":0.89868637,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"12","issue":"7","first_page":"e1005038","last_page":"e1005038"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.6554979681968689},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.6380982398986816},{"id":"https://openalex.org/keywords/architecture-domain","display_name":"Architecture domain","score":0.6224857568740845},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5649642944335938},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.5593739748001099},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5317206382751465},{"id":"https://openalex.org/keywords/protein-domain","display_name":"Protein domain","score":0.5242986083030701},{"id":"https://openalex.org/keywords/closeness","display_name":"Closeness","score":0.4944901466369629},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.4912044405937195},{"id":"https://openalex.org/keywords/clade","display_name":"Clade","score":0.44642069935798645},{"id":"https://openalex.org/keywords/protein-superfamily","display_name":"Protein superfamily","score":0.4312557578086853},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.42660456895828247},{"id":"https://openalex.org/keywords/statistical-model","display_name":"Statistical model","score":0.4152846038341522},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4030979871749878},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3460598587989807},{"id":"https://openalex.org/keywords/phylogenetic-tree","display_name":"Phylogenetic tree","score":0.3074635863304138},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3052295446395874},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.2331797182559967},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15576598048210144},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.14215511083602905}],"concepts":[{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.6554979681968689},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.6380982398986816},{"id":"https://openalex.org/C194167682","wikidata":"https://www.wikidata.org/wiki/Q4787088","display_name":"Architecture domain","level":5,"score":0.6224857568740845},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5649642944335938},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.5593739748001099},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5317206382751465},{"id":"https://openalex.org/C144292202","wikidata":"https://www.wikidata.org/wiki/Q898273","display_name":"Protein domain","level":3,"score":0.5242986083030701},{"id":"https://openalex.org/C2779545769","wikidata":"https://www.wikidata.org/wiki/Q5135364","display_name":"Closeness","level":2,"score":0.4944901466369629},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.4912044405937195},{"id":"https://openalex.org/C44465124","wikidata":"https://www.wikidata.org/wiki/Q713623","display_name":"Clade","level":4,"score":0.44642069935798645},{"id":"https://openalex.org/C178180057","wikidata":"https://www.wikidata.org/wiki/Q7251477","display_name":"Protein superfamily","level":3,"score":0.4312557578086853},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.42660456895828247},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.4152846038341522},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4030979871749878},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3460598587989807},{"id":"https://openalex.org/C193252679","wikidata":"https://www.wikidata.org/wiki/Q242125","display_name":"Phylogenetic tree","level":3,"score":0.3074635863304138},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3052295446395874},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.2331797182559967},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15576598048210144},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.14215511083602905},{"id":"https://openalex.org/C27591593","wikidata":"https://www.wikidata.org/wiki/Q4380897","display_name":"Enterprise architecture framework","level":4,"score":0.0},{"id":"https://openalex.org/C35869016","wikidata":"https://www.wikidata.org/wiki/Q846636","display_name":"Software architecture","level":3,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000072417","descriptor_name":"Protein Domains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000072417","descriptor_name":"Protein Domains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000072417","descriptor_name":"Protein Domains","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010963","descriptor_name":"Plasmodium falciparum","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D010963","descriptor_name":"Plasmodium falciparum","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D010963","descriptor_name":"Plasmodium falciparum","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D010963","descriptor_name":"Plasmodium falciparum","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D010963","descriptor_name":"Plasmodium falciparum","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D010963","descriptor_name":"Plasmodium falciparum","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D015800","descriptor_name":"Protozoan Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D015800","descriptor_name":"Protozoan Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D015800","descriptor_name":"Protozoan Proteins","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D015800","descriptor_name":"Protozoan Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D015800","descriptor_name":"Protozoan Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D015800","descriptor_name":"Protozoan Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D016384","descriptor_name":"Consensus Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016384","descriptor_name":"Consensus Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016384","descriptor_name":"Consensus Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":6,"locations":[{"id":"doi:10.1371/journal.pcbi.1005038","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1005038","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1005038&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},{"id":"pmid:27472895","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/27472895","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLoS computational biology","raw_type":null},{"id":"pmh:oai:HAL:hal-01390566v1","is_oa":true,"landing_page_url":"https://hal.sorbonne-universite.fr/hal-01390566","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Computational Biology, 2016, 12 (7), pp.e1005038. &#x27E8;10.1371/journal.pcbi.1005038&#x27E9;","raw_type":"Journal articles"},{"id":"pmh:oai:doaj.org/article:28e22b31588e4da29f8803d65c7a5886","is_oa":true,"landing_page_url":"https://doaj.org/article/28e22b31588e4da29f8803d65c7a5886","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"PLoS Computational Biology, Vol 12, Iss 7, p e1005038 (2016)","raw_type":"article"},{"id":"pmh:oai:europepmc.org:3948289","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/4966962","pdf_url":null,"source":{"id":"https://openalex.org/S4306400806","display_name":"Europe PMC (PubMed Central)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1303153112","host_organization_name":"European Bioinformatics Institute","host_organization_lineage":["https://openalex.org/I1303153112"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Text"},{"id":"pmh:oai:figshare.com:article/3876084","is_oa":true,"landing_page_url":"https://figshare.com/articles/dataset/Improvement_in_Protein_Domain_Identification_Is_Reached_by_Breaking_Consensus_with_the_Agreement_of_Many_Profiles_and_Domain_Co-occurrence/3876084","pdf_url":null,"source":{"id":"https://openalex.org/S4377196282","display_name":"Figshare","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210132348","host_organization_name":"Figshare (United Kingdom)","host_organization_lineage":["https://openalex.org/I4210132348"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Dataset"}],"best_oa_location":{"id":"doi:10.1371/journal.pcbi.1005038","is_oa":true,"landing_page_url":"https://doi.org/10.1371/journal.pcbi.1005038","pdf_url":"https://journals.plos.org/ploscompbiol/article/file?id=10.1371/journal.pcbi.1005038&type=printable","source":{"id":"https://openalex.org/S86033158","display_name":"PLoS Computational Biology","issn_l":"1553-734X","issn":["1553-734X","1553-7358"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310315706","host_organization_name":"Public Library of Science","host_organization_lineage":["https://openalex.org/P4310315706"],"host_organization_lineage_names":["Public Library of Science"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"PLOS Computational Biology","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7099999785423279,"id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G1404270698","display_name":null,"funder_award_id":"NR-11-IDEX-0004-02","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G1789083493","display_name":"LABEX pour la mod\u00e9lisation et la simulation scientifiques en recherche","funder_award_id":"ANR-11-LABX-0037","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G1817966306","display_name":null,"funder_award_id":"ANR-11-LABX-003","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G3335229504","display_name":null,"funder_award_id":"Avenir","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G3807293409","display_name":null,"funder_award_id":"ANR-11-LABX-00","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G4009746975","display_name":null,"funder_award_id":"ANR-11-IDEX-0004-02","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G4423138545","display_name":null,"funder_award_id":"ANR-10-EQPX-29-0","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G4866930200","display_name":null,"funder_award_id":"ANR-11-IDEX","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G5003875507","display_name":null,"funder_award_id":"-11-IDEX-0004-02","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G5043543010","display_name":null,"funder_award_id":"10-EQPX-29-01","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G5615659713","display_name":null,"funder_award_id":"IDEX-0004-02","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G6182026652","display_name":null,"funder_award_id":"11-IDEX-0004","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G6246589203","display_name":null,"funder_award_id":"11-IDEX-0004-02","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G6654833908","display_name":null,"funder_award_id":"ANR-11-IDEX-0004","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G676769616","display_name":null,"funder_award_id":"ANR-10-EQPX-29-01","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G7240651115","display_name":null,"funder_award_id":"ANR-10","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G7371164504","display_name":null,"funder_award_id":"(ANR-10-EQPX-29-01)","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G7823808512","display_name":null,"funder_award_id":"ANR-11-IDEX-000","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G846706564","display_name":null,"funder_award_id":"ANR-11-IDEX-0004-0","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G8510727784","display_name":null,"funder_award_id":"ANR-10-EQPX","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G8668274974","display_name":null,"funder_award_id":"11-LABX-003","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"}],"funders":[{"id":"https://openalex.org/F4320320883","display_name":"Agence Nationale de la Recherche","ror":"https://ror.org/00rbzpz17"},{"id":"https://openalex.org/F4320324615","display_name":"Ministry of Education and Science of Ukraine","ror":"https://ror.org/03bra4w96"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2490955734.pdf","grobid_xml":"https://content.openalex.org/works/W2490955734.grobid-xml"},"referenced_works_count":70,"referenced_works":["https://openalex.org/W28412257","https://openalex.org/W102715436","https://openalex.org/W116375701","https://openalex.org/W1483942228","https://openalex.org/W1549656520","https://openalex.org/W1565582771","https://openalex.org/W1598333443","https://openalex.org/W1618905105","https://openalex.org/W1656674553","https://openalex.org/W1827912384","https://openalex.org/W1971913854","https://openalex.org/W1990056477","https://openalex.org/W2002468235","https://openalex.org/W2011983053","https://openalex.org/W2012352014","https://openalex.org/W2021064499","https://openalex.org/W2021973151","https://openalex.org/W2022472106","https://openalex.org/W2035202199","https://openalex.org/W2040184829","https://openalex.org/W2042124637","https://openalex.org/W2045564656","https://openalex.org/W2045839655","https://openalex.org/W2046577575","https://openalex.org/W2051210555","https://openalex.org/W2057071212","https://openalex.org/W2057885377","https://openalex.org/W2083280521","https://openalex.org/W2085277871","https://openalex.org/W2087347434","https://openalex.org/W2087903152","https://openalex.org/W2097555181","https://openalex.org/W2099075703","https://openalex.org/W2099254366","https://openalex.org/W2099946731","https://openalex.org/W2101220662","https://openalex.org/W2106882534","https://openalex.org/W2109715166","https://openalex.org/W2110115297","https://openalex.org/W2110949039","https://openalex.org/W2112792893","https://openalex.org/W2121085676","https://openalex.org/W2121938981","https://openalex.org/W2122879306","https://openalex.org/W2127338593","https://openalex.org/W2136280642","https://openalex.org/W2137015675","https://openalex.org/W2138122982","https://openalex.org/W2140785063","https://openalex.org/W2141885858","https://openalex.org/W2141984528","https://openalex.org/W2142444565","https://openalex.org/W2145268834","https://openalex.org/W2148950394","https://openalex.org/W2149026536","https://openalex.org/W2149531726","https://openalex.org/W2152007783","https://openalex.org/W2153635508","https://openalex.org/W2154139219","https://openalex.org/W2155870664","https://openalex.org/W2157239837","https://openalex.org/W2158714788","https://openalex.org/W2160865839","https://openalex.org/W2161033884","https://openalex.org/W2161072217","https://openalex.org/W2179402585","https://openalex.org/W4210623056","https://openalex.org/W4235914791","https://openalex.org/W4252706339","https://openalex.org/W6683380652"],"related_works":["https://openalex.org/W2050194408","https://openalex.org/W2045839655","https://openalex.org/W2096676112","https://openalex.org/W2161033884","https://openalex.org/W4386158261","https://openalex.org/W2102882929","https://openalex.org/W4226056761","https://openalex.org/W2908283214","https://openalex.org/W2489342160","https://openalex.org/W2786092929"],"abstract_inverted_index":{"Traditional":[0],"protein":[1,78,111,147,190,218,289,295],"annotation":[2,32,59,214],"methods":[3,60,177],"describe":[4],"known":[5,110],"domains":[6],"with":[7],"probabilistic":[8,114],"models":[9,116,193],"representing":[10],"consensus":[11,207],"among":[12],"homologous":[13,126],"domain":[14,41,154,232,254,281,296],"sequences.":[15],"However,":[16],"when":[17],"relevant":[18],"signals":[19],"become":[20],"too":[21],"weak":[22],"to":[23,185,188,196,244,264,271],"be":[24,62,89,197],"identified":[25],"by":[26],"a":[27,66,97,120,129,139,221],"global":[28],"consensus,":[29],"attempts":[30],"for":[31,43,108,153,233],"fail.":[33],"Here":[34],"we":[35,52,212],"address":[36],"the":[37,55,71,101,144,204,249,257,277,283,286,292],"fundamental":[38],"question":[39],"of":[40,57,100,104,125,215,235,246,252,279,285,288,294],"identification":[42],"highly":[44],"divergent":[45],"proteins.":[46],"By":[47],"using":[48],"high":[49],"performance":[50,166],"computing,":[51],"demonstrate":[53],"that":[54,73],"limits":[56],"state-of-the-art":[58],"can":[61],"bypassed.":[63],"We":[64,95,226],"design":[65],"new":[67,269],"strategy":[68],"based":[69,178],"on":[70,179,210,220,256],"observation":[72],"many":[74],"structural":[75],"and":[76,122,155,161,171,181,200,267,291,299],"functional":[77],"constraints":[79],"are":[80,117,194],"not":[81,223],"globally":[82],"conserved":[83,91],"through":[84],"all":[85],"species":[86],"but":[87],"might":[88],"locally":[90],"in":[92],"separate":[93],"clades.":[94],"propose":[96],"novel":[98],"exploitation":[99],"large":[102,121],"amount":[103],"data":[105],"available:":[106],"1.":[107],"each":[109],"domain,":[112],"several":[113,159],"clade-centered":[115,192],"constructed":[118],"from":[119,135],"differentiated":[123],"panel":[124],"sequences,":[127,191],"2.":[128],"decision-making":[130],"protocol":[131],"combines":[132],"outcomes":[133],"obtained":[134],"multiple":[136],"models,":[137],"3.":[138],"multi-criteria":[140],"optimization":[141],"algorithm":[142],"finds":[143],"most":[145],"likely":[146],"architecture.":[148],"The":[149,260],"method":[150,261],"is":[151,167,262],"evaluated":[152],"architecture":[156],"prediction":[157],"over":[158,248],"datasets":[160],"statistical":[162],"testing":[163],"hypotheses.":[164],"Its":[165],"compared":[168],"against":[169,239],"HMMScan":[170],"HHblits,":[172],"two":[173],"widely":[174],"used":[175,206],"search":[176],"sequence-profile":[180],"profile-profile":[182],"comparison.":[183],"Due":[184],"their":[186],"closeness":[187],"actual":[189],"shown":[195],"more":[198],"specific":[199],"functionally":[201],"predictive":[202],"than":[203],"broadly":[205],"models.":[208],"Based":[209],"them,":[211],"improved":[213],"Plasmodium":[216],"falciparum":[217,237],"sequences":[219],"scale":[222],"previously":[224],"possible.":[225],"successfully":[227],"predict":[228],"at":[229],"least":[230],"one":[231],"72%":[234],"P.":[236],"proteins":[238],"63%":[240],"achieved":[241],"previously,":[242],"corresponding":[243],"30%":[245],"improvement":[247],"total":[250],"number":[251],"Pfam":[253],"predictions":[255],"whole":[258],"genome.":[259],"applicable":[263],"any":[265],"genome":[266],"opens":[268],"avenues":[270],"tackle":[272],"evolutionary":[273],"questions":[274],"such":[275],"as":[276],"reconstruction":[278,284],"ancient":[280],"duplications,":[282],"history":[287],"architectures,":[290],"estimation":[293],"age.":[297],"Website":[298],"software:":[300],"http://www.lcqb.upmc.fr/CLADE.":[301]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":4},{"year":2019,"cited_by_count":5},{"year":2018,"cited_by_count":6},{"year":2017,"cited_by_count":4}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
