{"id":"https://openalex.org/W2108428298","doi":"https://doi.org/10.1093/bioinformatics/btg212","title":"Comparison of sequence masking algorithms and the detection of biased protein sequence regions","display_name":"Comparison of sequence masking algorithms and the detection of biased protein sequence regions","publication_year":2003,"publication_date":"2003-09-01","ids":{"openalex":"https://openalex.org/W2108428298","doi":"https://doi.org/10.1093/bioinformatics/btg212","mag":"2108428298","pmid":"https://pubmed.ncbi.nlm.nih.gov/12967964"},"language":"en","primary_location":{"id":"doi:10.1093/bioinformatics/btg212","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btg212","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/19/13/1672/602934/btg212.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://academic.oup.com/bioinformatics/article-pdf/19/13/1672/602934/btg212.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076046328","display_name":"David P. Kreil","orcid":"https://orcid.org/0000-0001-7538-2056"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"David P. Kreil","raw_affiliation_strings":["Department of Genetics/Inference Group (Cavendish Laboratory), University of Cambridge, Cambridge, UK. kreil@ebi.ac.uk"],"affiliations":[{"raw_affiliation_string":"Department of Genetics/Inference Group (Cavendish Laboratory), University of Cambridge, Cambridge, UK. kreil@ebi.ac.uk","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022717154","display_name":"Christos Ouzounis","orcid":"https://orcid.org/0000-0002-0086-8657"},"institutions":[{"id":"https://openalex.org/I1303153112","display_name":"European Bioinformatics Institute","ror":"https://ror.org/02catss52","country_code":"GB","type":"facility","lineage":["https://openalex.org/I1303153112","https://openalex.org/I4210138560"]},{"id":"https://openalex.org/I4210148697","display_name":"Institute of Bioinformatics","ror":"https://ror.org/04hqfvm50","country_code":"IN","type":"nonprofit","lineage":["https://openalex.org/I4210148697"]},{"id":"https://openalex.org/I4210151791","display_name":"Genomics (United Kingdom)","ror":"https://ror.org/053a6xa29","country_code":"GB","type":"company","lineage":["https://openalex.org/I4210151791"]}],"countries":["GB","IN"],"is_corresponding":false,"raw_author_name":"Christos A. Ouzounis","raw_affiliation_strings":["Computational Genomics Group, The European Bioinformatics Institute, EMBL Outstation Cambridge CB10 1SD, UK","Bioinformatics"],"affiliations":[{"raw_affiliation_string":"Computational Genomics Group, The European Bioinformatics Institute, EMBL Outstation Cambridge CB10 1SD, UK","institution_ids":["https://openalex.org/I1303153112","https://openalex.org/I4210151791"]},{"raw_affiliation_string":"Bioinformatics","institution_ids":["https://openalex.org/I4210148697"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5076046328"],"corresponding_institution_ids":["https://openalex.org/I241749"],"apc_list":{"value":3618,"currency":"USD","value_usd":3618},"apc_paid":null,"fwci":0.4575,"has_fulltext":true,"cited_by_count":23,"citation_normalized_percentile":{"value":0.61830622,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"19","issue":"13","first_page":"1672","last_page":"1681"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12946","display_name":"Fractal and DNA sequence analysis","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.728446364402771},{"id":"https://openalex.org/keywords/masking","display_name":"Masking (illustration)","score":0.684933066368103},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5602827072143555},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5430864691734314},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5006260871887207},{"id":"https://openalex.org/keywords/protein-sequencing","display_name":"Protein sequencing","score":0.47969767451286316},{"id":"https://openalex.org/keywords/contrast","display_name":"Contrast (vision)","score":0.4619342088699341},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4511812925338745},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3563482165336609},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.3558382987976074},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.348383367061615},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.27047985792160034},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.2314337193965912},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.22322538495063782},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.07331785559654236}],"concepts":[{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.728446364402771},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.684933066368103},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5602827072143555},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5430864691734314},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5006260871887207},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.47969767451286316},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.4619342088699341},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4511812925338745},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3563482165336609},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.3558382987976074},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.348383367061615},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27047985792160034},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.2314337193965912},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.22322538495063782},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.07331785559654236},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001426","descriptor_name":"Bacterial Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D001426","descriptor_name":"Bacterial Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D001426","descriptor_name":"Bacterial Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D001426","descriptor_name":"Bacterial Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D001426","descriptor_name":"Bacterial Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D001426","descriptor_name":"Bacterial Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D008957","descriptor_name":"Models, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008957","descriptor_name":"Models, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008957","descriptor_name":"Models, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D008969","descriptor_name":"Molecular Sequence Data","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008969","descriptor_name":"Molecular Sequence Data","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008969","descriptor_name":"Molecular Sequence Data","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000145","qualifier_name":"classification","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D012680","descriptor_name":"Sensitivity and Specificity","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012680","descriptor_name":"Sensitivity and Specificity","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012680","descriptor_name":"Sensitivity and Specificity","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015203","descriptor_name":"Reproducibility of Results","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015203","descriptor_name":"Reproducibility of Results","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015203","descriptor_name":"Reproducibility of Results","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015233","descriptor_name":"Models, Statistical","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D015982","descriptor_name":"Bias","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015982","descriptor_name":"Bias","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D015982","descriptor_name":"Bias","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D017386","descriptor_name":"Sequence Homology, Amino Acid","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017386","descriptor_name":"Sequence Homology, Amino Acid","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017386","descriptor_name":"Sequence Homology, Amino Acid","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020869","descriptor_name":"Gene Expression Profiling","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020869","descriptor_name":"Gene Expression Profiling","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020869","descriptor_name":"Gene Expression Profiling","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D041522","descriptor_name":"Aeropyrum","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D041522","descriptor_name":"Aeropyrum","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D041522","descriptor_name":"Aeropyrum","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D041522","descriptor_name":"Aeropyrum","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D041522","descriptor_name":"Aeropyrum","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D041522","descriptor_name":"Aeropyrum","qualifier_ui":"Q000378","qualifier_name":"metabolism","is_major_topic":false},{"descriptor_ui":"D041522","descriptor_name":"Aeropyrum","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D041522","descriptor_name":"Aeropyrum","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D041522","descriptor_name":"Aeropyrum","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false}],"locations_count":4,"locations":[{"id":"doi:10.1093/bioinformatics/btg212","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btg212","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/19/13/1672/602934/btg212.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},{"id":"pmid:12967964","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/12967964","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics (Oxford, England)","raw_type":null},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.615.4992","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.615.4992","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://bioinformatics.oxfordjournals.org/content/19/13/1672.full.pdf","raw_type":"text"},{"id":"pmh:oai:kclpure.kcl.ac.uk:publications/9aab8b71-f911-4428-839d-c23fcc8f759f","is_oa":false,"landing_page_url":"https://kclpure.kcl.ac.uk/portal/en/publications/9aab8b71-f911-4428-839d-c23fcc8f759f","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Kreil , D P &amp; Ouzounis , C A 2003 , ' Comparison of sequence masking algorithms and the detection of biased protein sequence regions ' , BIOINFORMATICS , vol. 19 , no. 13 , pp. 1672 - 1681 . https://doi.org/10.1093/bioinformatics/btg212","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1093/bioinformatics/btg212","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btg212","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/19/13/1672/602934/btg212.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7407982985","display_name":null,"funder_award_id":"Fellowship","funder_id":"https://openalex.org/F4320334626","funder_display_name":"Medical Research Council"}],"funders":[{"id":"https://openalex.org/F4320314023","display_name":"European Molecular Biology Laboratory","ror":"https://ror.org/050589e39"},{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320334626","display_name":"Medical Research Council","ror":"https://ror.org/03x94j517"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2108428298.pdf","grobid_xml":"https://content.openalex.org/works/W2108428298.grobid-xml"},"referenced_works_count":50,"referenced_works":["https://openalex.org/W164956572","https://openalex.org/W1017703714","https://openalex.org/W1491176290","https://openalex.org/W1513332069","https://openalex.org/W1558365920","https://openalex.org/W1970437513","https://openalex.org/W1971592875","https://openalex.org/W1972097354","https://openalex.org/W1986769472","https://openalex.org/W1987055177","https://openalex.org/W1987393189","https://openalex.org/W1990453950","https://openalex.org/W1994481056","https://openalex.org/W2002056148","https://openalex.org/W2002180966","https://openalex.org/W2003144438","https://openalex.org/W2003647795","https://openalex.org/W2008399824","https://openalex.org/W2010961953","https://openalex.org/W2015292449","https://openalex.org/W2025584660","https://openalex.org/W2045274476","https://openalex.org/W2051119339","https://openalex.org/W2051916497","https://openalex.org/W2055043387","https://openalex.org/W2060367243","https://openalex.org/W2064470502","https://openalex.org/W2066688961","https://openalex.org/W2069003894","https://openalex.org/W2084073683","https://openalex.org/W2087344748","https://openalex.org/W2089431713","https://openalex.org/W2092670169","https://openalex.org/W2094519647","https://openalex.org/W2104412724","https://openalex.org/W2105798249","https://openalex.org/W2113333419","https://openalex.org/W2114352708","https://openalex.org/W2142409171","https://openalex.org/W2143210482","https://openalex.org/W2154478075","https://openalex.org/W2169929748","https://openalex.org/W2328496340","https://openalex.org/W2496863210","https://openalex.org/W4213149192","https://openalex.org/W4236236547","https://openalex.org/W4244779656","https://openalex.org/W4246833219","https://openalex.org/W4285719527","https://openalex.org/W4383673615"],"related_works":["https://openalex.org/W3081694532","https://openalex.org/W2069592018","https://openalex.org/W2075740387","https://openalex.org/W2358990940","https://openalex.org/W2004323682","https://openalex.org/W1969211203","https://openalex.org/W2093931120","https://openalex.org/W2349116365","https://openalex.org/W3021708704","https://openalex.org/W1517958729"],"abstract_inverted_index":{"Here":[0],"we":[1],"demonstrate":[2],"that":[3,30,52,68],"compositional":[4],"bias":[5],"seems":[6,98],"to":[7,26,99,107],"be":[8,100],"a":[9,101],"more":[10],"effective":[11],"measure":[12],"for":[13,28,42,93],"the":[14,46,56,69,84,91],"detection":[15],"of":[16,59,109],"biologically":[17],"meaningful":[18],"signals.":[19],"Typical":[20],"results":[21,27],"on":[22],"proteins":[23,44,62],"are":[24],"compared":[25],"sequences":[29,73],"have":[31,55],"been":[32],"randomized":[33,65,72],"in":[34,61,64,105],"various":[35],"ways,":[36],"conserving":[37],"composition":[38,81],"and":[39,67,78],"local":[40,76],"correlations":[41,77],"individual":[43],"or":[45],"entire":[47],"set.":[48],"It":[49],"is":[50,89],"remarkable":[51],"low-complexity":[53],"regions":[54],"same":[57],"form":[58],"distribution":[60],"as":[63],"sequences,":[66],"signal":[70,85],"from":[71,86],"with":[74],"conserved":[75],"amino":[79],"acid":[80],"almost":[82],"matches":[83],"proteins.":[87],"This":[88],"not":[90],"case":[92],"sequence":[94],"bias,":[95],"which":[96],"hence":[97],"genuinely":[102],"biological":[103],"phenomenon":[104],"contrast":[106],"patches":[108],"low":[110],"complexity.":[111]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":3}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
