{"id":"https://openalex.org/W2980279728","doi":"https://doi.org/10.1093/bioinformatics/btz762","title":"BCrystal: an interpretable sequence-based protein crystallization predictor","display_name":"BCrystal: an interpretable sequence-based protein crystallization predictor","publication_year":2019,"publication_date":"2019-10-08","ids":{"openalex":"https://openalex.org/W2980279728","doi":"https://doi.org/10.1093/bioinformatics/btz762","mag":"2980279728","pmid":"https://pubmed.ncbi.nlm.nih.gov/31603511"},"language":"en","primary_location":{"id":"doi:10.1093/bioinformatics/btz762","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btz762","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/36/5/1429/33745642/btz762.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://academic.oup.com/bioinformatics/article-pdf/36/5/1429/33745642/btz762.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012462452","display_name":"Abdurrahman Elbasir","orcid":"https://orcid.org/0000-0003-1677-7845"},"institutions":[{"id":"https://openalex.org/I4210144839","display_name":"Hamad bin Khalifa University","ror":"https://ror.org/03eyq4y97","country_code":"QA","type":"education","lineage":["https://openalex.org/I4210144839"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Abdurrahman Elbasir","raw_affiliation_strings":["ICT Division, College of Science and Engineering , Hamad Bin Khalifa University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"ICT Division, College of Science and Engineering , Hamad Bin Khalifa University","institution_ids":["https://openalex.org/I4210144839"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055826525","display_name":"Raghvendra Mall","orcid":"https://orcid.org/0000-0003-1779-3150"},"institutions":[{"id":"https://openalex.org/I4210144839","display_name":"Hamad bin Khalifa University","ror":"https://ror.org/03eyq4y97","country_code":"QA","type":"education","lineage":["https://openalex.org/I4210144839"]}],"countries":["QA"],"is_corresponding":true,"raw_author_name":"Raghvendra Mall","raw_affiliation_strings":["Data Analytics, Qatar Computing Research Institute , Hamad Bin Khalifa University, Doha 34110, Qatar"],"raw_orcid":"https://orcid.org/0000-0003-1779-3150","affiliations":[{"raw_affiliation_string":"Data Analytics, Qatar Computing Research Institute , Hamad Bin Khalifa University, Doha 34110, Qatar","institution_ids":["https://openalex.org/I4210144839"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067973729","display_name":"Khalid Kunji","orcid":"https://orcid.org/0000-0003-2946-512X"},"institutions":[{"id":"https://openalex.org/I4210144839","display_name":"Hamad bin Khalifa University","ror":"https://ror.org/03eyq4y97","country_code":"QA","type":"education","lineage":["https://openalex.org/I4210144839"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Khalid Kunji","raw_affiliation_strings":["Data Analytics, Qatar Computing Research Institute , Hamad Bin Khalifa University, Doha 34110, Qatar"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Data Analytics, Qatar Computing Research Institute , Hamad Bin Khalifa University, Doha 34110, Qatar","institution_ids":["https://openalex.org/I4210144839"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089740833","display_name":"Reda Rawi","orcid":"https://orcid.org/0000-0002-0445-2325"},"institutions":[{"id":"https://openalex.org/I1299303238","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238"]},{"id":"https://openalex.org/I4210134534","display_name":"National Institute of Allergy and Infectious Diseases","ror":"https://ror.org/043z4tv69","country_code":"US","type":"facility","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210134534"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Reda Rawi","raw_affiliation_strings":["Vaccine Research Center, National Institute of Allergy and Infectious Diseases, National Institutes of Health, Bethesda , MD 20892, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Vaccine Research Center, National Institute of Allergy and Infectious Diseases, National Institutes of Health, Bethesda , MD 20892, USA","institution_ids":["https://openalex.org/I4210134534","https://openalex.org/I1299303238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037906104","display_name":"Zeyaul Islam","orcid":"https://orcid.org/0000-0002-5444-3910"},"institutions":[{"id":"https://openalex.org/I4210144839","display_name":"Hamad bin Khalifa University","ror":"https://ror.org/03eyq4y97","country_code":"QA","type":"education","lineage":["https://openalex.org/I4210144839"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Zeyaul Islam","raw_affiliation_strings":["Diabetes Research Center, Qatar Biomedical Research Institute, Hamad Bin Khalifa University , Doha 34100, Qatar"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Diabetes Research Center, Qatar Biomedical Research Institute, Hamad Bin Khalifa University , Doha 34100, Qatar","institution_ids":["https://openalex.org/I4210144839"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069049986","display_name":"Gwo\u2010Yu Chuang","orcid":"https://orcid.org/0000-0003-0375-1013"},"institutions":[{"id":"https://openalex.org/I1299303238","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238"]},{"id":"https://openalex.org/I4210134534","display_name":"National Institute of Allergy and Infectious Diseases","ror":"https://ror.org/043z4tv69","country_code":"US","type":"facility","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210134534"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gwo-Yu Chuang","raw_affiliation_strings":["Vaccine Research Center, National Institute of Allergy and Infectious Diseases, National Institutes of Health, Bethesda , MD 20892, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Vaccine Research Center, National Institute of Allergy and Infectious Diseases, National Institutes of Health, Bethesda , MD 20892, USA","institution_ids":["https://openalex.org/I4210134534","https://openalex.org/I1299303238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010124716","display_name":"Prasanna R. Kolatkar","orcid":"https://orcid.org/0000-0003-4970-5944"},"institutions":[{"id":"https://openalex.org/I4210144839","display_name":"Hamad bin Khalifa University","ror":"https://ror.org/03eyq4y97","country_code":"QA","type":"education","lineage":["https://openalex.org/I4210144839"]}],"countries":["QA"],"is_corresponding":false,"raw_author_name":"Prasanna R Kolatkar","raw_affiliation_strings":["Diabetes Research Center, Qatar Biomedical Research Institute, Hamad Bin Khalifa University , Doha 34100, Qatar"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Diabetes Research Center, Qatar Biomedical Research Institute, Hamad Bin Khalifa University , Doha 34100, Qatar","institution_ids":["https://openalex.org/I4210144839"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013350725","display_name":"Halima Bensmail","orcid":"https://orcid.org/0000-0001-6700-5752"},"institutions":[{"id":"https://openalex.org/I4210144839","display_name":"Hamad bin Khalifa University","ror":"https://ror.org/03eyq4y97","country_code":"QA","type":"education","lineage":["https://openalex.org/I4210144839"]}],"countries":["QA"],"is_corresponding":true,"raw_author_name":"Halima Bensmail","raw_affiliation_strings":["Data Analytics, Qatar Computing Research Institute , Hamad Bin Khalifa University, Doha 34110, Qatar"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Data Analytics, Qatar Computing Research Institute , Hamad Bin Khalifa University, Doha 34110, Qatar","institution_ids":["https://openalex.org/I4210144839"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5013350725","https://openalex.org/A5055826525"],"corresponding_institution_ids":["https://openalex.org/I4210144839"],"apc_list":{"value":3618,"currency":"USD","value_usd":3618},"apc_paid":null,"fwci":1.927,"has_fulltext":false,"cited_by_count":37,"citation_normalized_percentile":{"value":0.8623438,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"36","issue":"5","first_page":"1429","last_page":"1438"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11162","display_name":"Enzyme Structure and Function","score":0.9602000117301941,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11162","display_name":"Enzyme Structure and Function","score":0.9602000117301941,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.030899999663233757,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.0012000000569969416,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/matthews-correlation-coefficient","display_name":"Matthews correlation coefficient","score":0.6174567341804504},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.6123107671737671},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5828993916511536},{"id":"https://openalex.org/keywords/crystallization","display_name":"Crystallization","score":0.5651963353157043},{"id":"https://openalex.org/keywords/protein-sequencing","display_name":"Protein sequencing","score":0.5088536739349365},{"id":"https://openalex.org/keywords/correlation-coefficient","display_name":"Correlation coefficient","score":0.4338315427303314},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.404933899641037},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3613553047180176},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.26942116022109985},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.266192764043808},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.18342244625091553},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.1606384515762329},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.11266690492630005},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.10526052117347717}],"concepts":[{"id":"https://openalex.org/C164085508","wikidata":"https://www.wikidata.org/wiki/Q4811327","display_name":"Matthews correlation coefficient","level":3,"score":0.6174567341804504},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.6123107671737671},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5828993916511536},{"id":"https://openalex.org/C203036418","wikidata":"https://www.wikidata.org/wiki/Q284256","display_name":"Crystallization","level":2,"score":0.5651963353157043},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.5088536739349365},{"id":"https://openalex.org/C2780092901","wikidata":"https://www.wikidata.org/wiki/Q3433612","display_name":"Correlation coefficient","level":2,"score":0.4338315427303314},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.404933899641037},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3613553047180176},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.26942116022109985},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.266192764043808},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.18342244625091553},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.1606384515762329},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.11266690492630005},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.10526052117347717},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[{"descriptor_ui":"D003460","descriptor_name":"Crystallization","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003460","descriptor_name":"Crystallization","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D003460","descriptor_name":"Crystallization","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D012984","descriptor_name":"Software","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D018360","descriptor_name":"Crystallography, X-Ray","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D018360","descriptor_name":"Crystallography, X-Ray","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D018360","descriptor_name":"Crystallography, X-Ray","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":3,"locations":[{"id":"doi:10.1093/bioinformatics/btz762","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btz762","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/36/5/1429/33745642/btz762.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},{"id":"pmid:31603511","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/31603511","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics (Oxford, England)","raw_type":null},{"id":"pmh:oai:pubmedcentral.nih.gov:7523644","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/7523644","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Bioinformatics","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1093/bioinformatics/btz762","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btz762","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/36/5/1429/33745642/btz762.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W591644047","https://openalex.org/W1525683299","https://openalex.org/W1562353621","https://openalex.org/W1608292140","https://openalex.org/W1678356000","https://openalex.org/W1971916086","https://openalex.org/W1977922844","https://openalex.org/W2019228162","https://openalex.org/W2062849515","https://openalex.org/W2073758773","https://openalex.org/W2073793320","https://openalex.org/W2096495474","https://openalex.org/W2097356092","https://openalex.org/W2098101628","https://openalex.org/W2112796928","https://openalex.org/W2126064524","https://openalex.org/W2129888542","https://openalex.org/W2136299394","https://openalex.org/W2137226992","https://openalex.org/W2142529984","https://openalex.org/W2142808579","https://openalex.org/W2145841875","https://openalex.org/W2148471287","https://openalex.org/W2153635508","https://openalex.org/W2168020168","https://openalex.org/W2169041564","https://openalex.org/W2170240176","https://openalex.org/W2170747616","https://openalex.org/W2282821441","https://openalex.org/W2295598076","https://openalex.org/W2300696561","https://openalex.org/W2413365859","https://openalex.org/W2440774392","https://openalex.org/W2510508396","https://openalex.org/W2512416592","https://openalex.org/W2623334623","https://openalex.org/W2649433081","https://openalex.org/W2766578745","https://openalex.org/W2776730476","https://openalex.org/W2792954461","https://openalex.org/W2794004073","https://openalex.org/W2799591485","https://openalex.org/W2889498145","https://openalex.org/W2900903885","https://openalex.org/W2911954305","https://openalex.org/W2911964244","https://openalex.org/W2914874661","https://openalex.org/W2949956784","https://openalex.org/W2962862931","https://openalex.org/W2963012544","https://openalex.org/W3102476541","https://openalex.org/W4256301573","https://openalex.org/W6680532697","https://openalex.org/W6685053522","https://openalex.org/W6685082496","https://openalex.org/W6722226382","https://openalex.org/W6737947904","https://openalex.org/W6749500503"],"related_works":["https://openalex.org/W2389225124","https://openalex.org/W2089418075","https://openalex.org/W2057419801","https://openalex.org/W2386767533","https://openalex.org/W2072215755","https://openalex.org/W2182882536","https://openalex.org/W2390635035","https://openalex.org/W2023663882","https://openalex.org/W2079031047","https://openalex.org/W3010364596"],"abstract_inverted_index":{"MOTIVATION:":[0],"X-ray":[1],"crystallography":[2],"has":[3],"facilitated":[4],"the":[5,28,37,69,78,83,92,153],"majority":[6],"of":[7,71,87,124,127,133,139,155,159,175],"protein":[8,19,90,150],"structures":[9],"determined":[10],"to":[11,26,35,146,179],"date.":[12],"Sequence-based":[13],"predictors":[14],"that":[15,164],"can":[16],"accurately":[17,180],"estimate":[18],"crystallization":[20,85],"propensities":[21],"would":[22],"be":[23],"highly":[24],"beneficial":[25],"overcome":[27],"high":[29],"expenditure,":[30],"large":[31],"attrition":[32],"rate,":[33],"and":[34,64,114,129,152,161,197],"reduce":[36],"trial-and-error":[38],"settings":[39],"required":[40],"for":[41,82,182],"crystallization.":[42],"RESULTS:":[43],"In":[44],"this":[45],"study,":[46],"we":[47,142],"present":[48],"a":[49],"novel":[50],"model,":[51],"BCrystal,":[52],"which":[53],"uses":[54],"an":[55,88,121],"optimized":[56],"gradient":[57],"boosting":[58],"machine":[59],"(XGBoost)":[60],"on":[61],"sequence,":[62],"structural":[63],"physio-chemical":[65],"features":[66,81],"extracted":[67],"from":[68],"proteins":[70],"interest.":[72],"BCrystal":[73,100,176,192],"also":[74],"provides":[75],"explanations,":[76],"highlighting":[77],"most":[79],"important":[80],"predicted":[84],"propensity":[86],"individual":[89],"using":[91],"SHAP":[93],"algorithm.":[94],"On":[95],"three":[96],"independent":[97],"test":[98],"sets,":[99],"outperforms":[101],"state-of-the-art":[102],"sequence-based":[103],"methods":[104],"by":[105],"more":[106],"than":[107],"12.5%":[108],"in":[109,112,116],"accuracy,":[110],"18%":[111],"recall":[113,126],"0.253":[115],"Matthew's":[117,130],"correlation":[118,131],"coefficient,":[119],"with":[120,149,170,185],"average":[122],"accuracy":[123,174],"93.7%,":[125],"96.63%":[128],"coefficient":[132],"0.868.":[134],"For":[135],"relative":[136],"solvent":[137],"accessibility":[138],"exposed":[140],"residues,":[141],"observed":[143],"higher":[144,173],"values":[145],"associate":[147,168],"positively":[148],"crystallizability":[151],"number":[154],"disordered":[156],"regions,":[157],"fraction":[158],"coils":[160],"tripeptide":[162],"stretches":[163],"contain":[165],"multiple":[166],"histidines":[167],"negatively":[169],"crystallizability.":[171,187],"The":[172],"enables":[177],"it":[178],"screen":[181],"sequence":[183],"variants":[184],"enhanced":[186],"AVAILABILITY":[188],"AND":[189],"IMPLEMENTATION:":[190],"Our":[191],"webserver":[193],"is":[194,200],"at":[195,202,210],"https://machinelearning-protein.qcri.org/":[196],"source":[198],"code":[199],"available":[201,209],"https://github.com/raghvendra5688/BCrystal.":[203],"SUPPLEMENTARY":[204],"INFORMATION:":[205],"Supplementary":[206],"data":[207],"are":[208],"Bioinformatics":[211],"online.":[212]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":5},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
