{"id":"https://openalex.org/W2117502874","doi":"https://doi.org/10.1186/1471-2105-9-510","title":"A discriminative method for protein remote homology detection and fold recognition combining Top-n-grams and latent semantic analysis","display_name":"A discriminative method for protein remote homology detection and fold recognition combining Top-n-grams and latent semantic analysis","publication_year":2008,"publication_date":"2008-12-01","ids":{"openalex":"https://openalex.org/W2117502874","doi":"https://doi.org/10.1186/1471-2105-9-510","mag":"2117502874","pmid":"https://pubmed.ncbi.nlm.nih.gov/19046430"},"language":"en","primary_location":{"id":"doi:10.1186/1471-2105-9-510","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-9-510","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-9-510","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-9-510","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100395591","display_name":"Bin Liu","orcid":"https://orcid.org/0000-0003-3685-9469"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]},{"id":"https://openalex.org/I158809036","display_name":"Shenzhen Institute of Information Technology","ror":"https://ror.org/03wrf9427","country_code":"CN","type":"education","lineage":["https://openalex.org/I158809036"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Bin Liu","raw_affiliation_strings":["Harbin Institute of Technology Shenzhen Graduate School, Shenzhen, PR China. bliu@insun.hit.edu.cn","Harbin Institute of Technology Shenzhen Graduate School, Shenzhen, PR China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology Shenzhen Graduate School, Shenzhen, PR China. bliu@insun.hit.edu.cn","institution_ids":["https://openalex.org/I158809036","https://openalex.org/I204983213"]},{"raw_affiliation_string":"Harbin Institute of Technology Shenzhen Graduate School, Shenzhen, PR China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100424254","display_name":"Xiaolong Wang","orcid":"https://orcid.org/0000-0001-9003-4252"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaolong Wang","raw_affiliation_strings":["Harbin Institute of Technology Shenzhen Graduate School, Shenzhen, PR China","School of Computer Science and Technology, Harbin Institute of Technology, Harbin, PR China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology Shenzhen Graduate School, Shenzhen, PR China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Harbin, PR China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048326379","display_name":"Lei Lin","orcid":"https://orcid.org/0000-0002-1161-8565"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Lin","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Harbin, PR China","School of Computer Science and Technology, Harbin Institute of Technology, Harbin PR China#TAB#"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Harbin, PR China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Harbin PR China#TAB#","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100608345","display_name":"Qiwen Dong","orcid":"https://orcid.org/0000-0002-3166-0541"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qiwen Dong","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Harbin, PR China","School of Computer Science and Technology, Harbin Institute of Technology, Harbin PR China#TAB#"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Harbin, PR China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Harbin PR China#TAB#","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100328995","display_name":"Xuan Wang","orcid":"https://orcid.org/0000-0002-3512-0649"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuan Wang","raw_affiliation_strings":["Harbin Institute of Technology Shenzhen Graduate School, Shenzhen, PR China","School of Computer Science and Technology, Harbin Institute of Technology, Harbin, PR China"],"affiliations":[{"raw_affiliation_string":"Harbin Institute of Technology Shenzhen Graduate School, Shenzhen, PR China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Harbin, PR China","institution_ids":["https://openalex.org/I204983213"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100395591"],"corresponding_institution_ids":["https://openalex.org/I158809036","https://openalex.org/I204983213"],"apc_list":{"value":1690,"currency":"GBP","value_usd":2072},"apc_paid":{"value":1690,"currency":"GBP","value_usd":2072},"fwci":1.798,"has_fulltext":true,"cited_by_count":137,"citation_normalized_percentile":{"value":0.84583156,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"9","issue":"1","first_page":"510","last_page":"510"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.74055016040802},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.7365262508392334},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6827941536903381},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.661433756351471},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5480591654777527},{"id":"https://openalex.org/keywords/latent-semantic-analysis","display_name":"Latent semantic analysis","score":0.48723068833351135},{"id":"https://openalex.org/keywords/protein-sequencing","display_name":"Protein sequencing","score":0.47892889380455017},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.42854517698287964},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.2201627790927887},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.19162532687187195},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.17271634936332703},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.1438678801059723},{"id":"https://openalex.org/keywords/gene","display_name":"Gene","score":0.0804433524608612}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.74055016040802},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.7365262508392334},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6827941536903381},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.661433756351471},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5480591654777527},{"id":"https://openalex.org/C170133592","wikidata":"https://www.wikidata.org/wiki/Q1806883","display_name":"Latent semantic analysis","level":2,"score":0.48723068833351135},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.47892889380455017},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.42854517698287964},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.2201627790927887},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.19162532687187195},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.17271634936332703},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.1438678801059723},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0804433524608612},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D000595","descriptor_name":"Amino Acid Sequence","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000235","qualifier_name":"genetics","is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D016415","descriptor_name":"Sequence Alignment","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017385","descriptor_name":"Sequence Homology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017385","descriptor_name":"Sequence Homology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017385","descriptor_name":"Sequence Homology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017385","descriptor_name":"Sequence Homology","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017510","descriptor_name":"Protein Folding","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017510","descriptor_name":"Protein Folding","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017510","descriptor_name":"Protein Folding","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017510","descriptor_name":"Protein Folding","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030541","descriptor_name":"Databases, Genetic","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":4,"locations":[{"id":"doi:10.1186/1471-2105-9-510","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-9-510","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-9-510","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},{"id":"pmid:19046430","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/19046430","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC bioinformatics","raw_type":null},{"id":"pmh:oai:doaj.org/article:c8ae10629f3a4ef2a0d7e5f4ed65d057","is_oa":true,"landing_page_url":"https://doaj.org/article/c8ae10629f3a4ef2a0d7e5f4ed65d057","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics, Vol 9, Iss 1, p 510 (2008)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:2613933","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/2613933","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"BMC Bioinformatics","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1186/1471-2105-9-510","is_oa":true,"landing_page_url":"https://doi.org/10.1186/1471-2105-9-510","pdf_url":"https://bmcbioinformatics.biomedcentral.com/counter/pdf/10.1186/1471-2105-9-510","source":{"id":"https://openalex.org/S19032547","display_name":"BMC Bioinformatics","issn_l":"1471-2105","issn":["1471-2105"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320256","host_organization_name":"BioMed Central","host_organization_lineage":["https://openalex.org/P4310320256","https://openalex.org/P4310319965"],"host_organization_lineage_names":["BioMed Central","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"BMC Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.75,"id":"https://metadata.un.org/sdg/10"}],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G239599399","display_name":null,"funder_award_id":"60435020","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G391238517","display_name":null,"funder_award_id":", and","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4243412236","display_name":null,"funder_award_id":"863 Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5240398506","display_name":null,"funder_award_id":"60673019","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335773","display_name":"National High-tech Research and Development Program","ror":null}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2117502874.pdf","grobid_xml":"https://content.openalex.org/works/W2117502874.grobid-xml"},"referenced_works_count":46,"referenced_works":["https://openalex.org/W1486662173","https://openalex.org/W1558365920","https://openalex.org/W1563088657","https://openalex.org/W1577473172","https://openalex.org/W1592870802","https://openalex.org/W1640943318","https://openalex.org/W1921780704","https://openalex.org/W1970999032","https://openalex.org/W1973714307","https://openalex.org/W1975394843","https://openalex.org/W1982025738","https://openalex.org/W1995918845","https://openalex.org/W2020816856","https://openalex.org/W2022247199","https://openalex.org/W2028903194","https://openalex.org/W2034256925","https://openalex.org/W2055043387","https://openalex.org/W2062296203","https://openalex.org/W2084787613","https://openalex.org/W2087064593","https://openalex.org/W2095692770","https://openalex.org/W2101220662","https://openalex.org/W2104983234","https://openalex.org/W2104997217","https://openalex.org/W2108079689","https://openalex.org/W2118714763","https://openalex.org/W2120401481","https://openalex.org/W2121950477","https://openalex.org/W2124709175","https://openalex.org/W2127464112","https://openalex.org/W2128328428","https://openalex.org/W2140244239","https://openalex.org/W2141915888","https://openalex.org/W2142013909","https://openalex.org/W2145358391","https://openalex.org/W2148279834","https://openalex.org/W2148603752","https://openalex.org/W2149298154","https://openalex.org/W2154218709","https://openalex.org/W2158714788","https://openalex.org/W2158997610","https://openalex.org/W2165979580","https://openalex.org/W2170666908","https://openalex.org/W2170960297","https://openalex.org/W2283504545","https://openalex.org/W2435251607"],"related_works":["https://openalex.org/W2965546495","https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W4205463238","https://openalex.org/W2110523656","https://openalex.org/W1482209366","https://openalex.org/W2521627374","https://openalex.org/W2981954115"],"abstract_inverted_index":{"The":[0],"method":[1],"based":[2,9],"on":[3,10],"Top-n-grams":[4],"significantly":[5],"outperforms":[6],"the":[7,30,42,47,50,55,61],"methods":[8],"many":[11,39],"other":[12],"building":[13,27],"blocks":[14],"including":[15],"N-grams,":[16],"patterns,":[17],"motifs":[18],"and":[19,33,60],"binary":[20],"profiles.":[21],"Therefore,":[22],"Top-n-gram":[23],"is":[24],"a":[25],"good":[26],"block":[28],"of":[29,41,52,57,63],"protein":[31,64],"sequences":[32],"can":[34],"be":[35],"widely":[36],"used":[37],"in":[38],"tasks":[40],"computational":[43],"biology,":[44],"such":[45],"as":[46],"sequence":[48],"alignment,":[49],"prediction":[51,62],"domain":[53],"boundary,":[54],"designation":[56],"knowledge-based":[58],"potentials":[59],"binding":[65],"sites.":[66]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":9},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":13},{"year":2018,"cited_by_count":10},{"year":2017,"cited_by_count":9},{"year":2016,"cited_by_count":11},{"year":2015,"cited_by_count":14},{"year":2014,"cited_by_count":14},{"year":2013,"cited_by_count":10},{"year":2012,"cited_by_count":4}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
