{"id":"https://openalex.org/W2145468550","doi":"https://doi.org/10.1093/bioinformatics/btp679","title":"A novel method for accurate one-dimensional protein structure prediction based on fragment matching","display_name":"A novel method for accurate one-dimensional protein structure prediction based on fragment matching","publication_year":2009,"publication_date":"2009-12-09","ids":{"openalex":"https://openalex.org/W2145468550","doi":"https://doi.org/10.1093/bioinformatics/btp679","mag":"2145468550","pmid":"https://pubmed.ncbi.nlm.nih.gov/20007252"},"language":"en","primary_location":{"id":"doi:10.1093/bioinformatics/btp679","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btp679","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/26/4/470/16896756/btp679.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://academic.oup.com/bioinformatics/article-pdf/26/4/470/16896756/btp679.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109806922","display_name":"Tuping Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I161593684","display_name":"Stockholm University","ror":"https://ror.org/05f0yaq80","country_code":"SE","type":"education","lineage":["https://openalex.org/I161593684"]}],"countries":["SE"],"is_corresponding":true,"raw_author_name":"Tuping Zhou","raw_affiliation_strings":["Division of Structural Chemistry, Stockholm University, Stockholm SE-106 91, Sweden"],"affiliations":[{"raw_affiliation_string":"Division of Structural Chemistry, Stockholm University, Stockholm SE-106 91, Sweden","institution_ids":["https://openalex.org/I161593684"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101420205","display_name":"Nanjiang Shu","orcid":"https://orcid.org/0000-0002-3537-2387"},"institutions":[{"id":"https://openalex.org/I161593684","display_name":"Stockholm University","ror":"https://ror.org/05f0yaq80","country_code":"SE","type":"education","lineage":["https://openalex.org/I161593684"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Nanjiang Shu","raw_affiliation_strings":["Division of Structural Chemistry, Stockholm University, Stockholm SE-106 91, Sweden"],"affiliations":[{"raw_affiliation_string":"Division of Structural Chemistry, Stockholm University, Stockholm SE-106 91, Sweden","institution_ids":["https://openalex.org/I161593684"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075675047","display_name":"Sven Hovm\u00f6ller","orcid":"https://orcid.org/0000-0003-1717-0455"},"institutions":[{"id":"https://openalex.org/I161593684","display_name":"Stockholm University","ror":"https://ror.org/05f0yaq80","country_code":"SE","type":"education","lineage":["https://openalex.org/I161593684"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Sven Hovm\u00f6ller","raw_affiliation_strings":["Division of Structural Chemistry, Stockholm University, Stockholm SE-106 91, Sweden"],"affiliations":[{"raw_affiliation_string":"Division of Structural Chemistry, Stockholm University, Stockholm SE-106 91, Sweden","institution_ids":["https://openalex.org/I161593684"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5109806922"],"corresponding_institution_ids":["https://openalex.org/I161593684"],"apc_list":{"value":3618,"currency":"USD","value_usd":3618},"apc_paid":null,"fwci":1.3123,"has_fulltext":false,"cited_by_count":26,"citation_normalized_percentile":{"value":0.79851405,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"26","issue":"4","first_page":"470","last_page":"477"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10044","display_name":"Protein Structure and Dynamics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11162","display_name":"Enzyme Structure and Function","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/protein-secondary-structure","display_name":"Protein secondary structure","score":0.6998986005783081},{"id":"https://openalex.org/keywords/protein-structure-prediction","display_name":"Protein structure prediction","score":0.596752405166626},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5709245800971985},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5564313530921936},{"id":"https://openalex.org/keywords/protein-structure","display_name":"Protein structure","score":0.506632387638092},{"id":"https://openalex.org/keywords/fragment","display_name":"Fragment (logic)","score":0.5035812258720398},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.49499720335006714},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.4463731050491333},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4372140169143677},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3625554144382477},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.30459389090538025},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.12210813164710999},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.11878716945648193},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.09015083312988281}],"concepts":[{"id":"https://openalex.org/C62614982","wikidata":"https://www.wikidata.org/wiki/Q904984","display_name":"Protein secondary structure","level":2,"score":0.6998986005783081},{"id":"https://openalex.org/C18051474","wikidata":"https://www.wikidata.org/wiki/Q899656","display_name":"Protein structure prediction","level":3,"score":0.596752405166626},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5709245800971985},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5564313530921936},{"id":"https://openalex.org/C47701112","wikidata":"https://www.wikidata.org/wiki/Q735188","display_name":"Protein structure","level":2,"score":0.506632387638092},{"id":"https://openalex.org/C2776235265","wikidata":"https://www.wikidata.org/wiki/Q18392052","display_name":"Fragment (logic)","level":2,"score":0.5035812258720398},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.49499720335006714},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.4463731050491333},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4372140169143677},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3625554144382477},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.30459389090538025},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.12210813164710999},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.11878716945648193},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.09015083312988281},{"id":"https://openalex.org/C46141821","wikidata":"https://www.wikidata.org/wiki/Q209402","display_name":"Nuclear magnetic resonance","level":1,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D008958","descriptor_name":"Models, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008958","descriptor_name":"Models, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008958","descriptor_name":"Models, Molecular","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D011506","descriptor_name":"Proteins","qualifier_ui":"Q000737","qualifier_name":"chemistry","is_major_topic":false},{"descriptor_ui":"D017433","descriptor_name":"Protein Structure, Secondary","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017433","descriptor_name":"Protein Structure, Secondary","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017433","descriptor_name":"Protein Structure, Secondary","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D019295","descriptor_name":"Computational Biology","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D020539","descriptor_name":"Sequence Analysis, Protein","qualifier_ui":"Q000379","qualifier_name":"methods","is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D030562","descriptor_name":"Databases, Protein","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false}],"locations_count":2,"locations":[{"id":"doi:10.1093/bioinformatics/btp679","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btp679","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/26/4/470/16896756/btp679.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},{"id":"pmid:20007252","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/20007252","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics (Oxford, England)","raw_type":null}],"best_oa_location":{"id":"doi:10.1093/bioinformatics/btp679","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btp679","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/26/4/470/16896756/btp679.pdf","source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2145468550.pdf","grobid_xml":"https://content.openalex.org/works/W2145468550.grobid-xml"},"referenced_works_count":42,"referenced_works":["https://openalex.org/W255996521","https://openalex.org/W1490138956","https://openalex.org/W1969621320","https://openalex.org/W1978520289","https://openalex.org/W1981132436","https://openalex.org/W1985818354","https://openalex.org/W2008708467","https://openalex.org/W2008807736","https://openalex.org/W2011495938","https://openalex.org/W2013136212","https://openalex.org/W2035066314","https://openalex.org/W2041369927","https://openalex.org/W2047544230","https://openalex.org/W2047962024","https://openalex.org/W2049695588","https://openalex.org/W2060178110","https://openalex.org/W2062693912","https://openalex.org/W2086403919","https://openalex.org/W2091194233","https://openalex.org/W2107538253","https://openalex.org/W2114520383","https://openalex.org/W2116268847","https://openalex.org/W2116689128","https://openalex.org/W2118836759","https://openalex.org/W2124919568","https://openalex.org/W2125725297","https://openalex.org/W2130479394","https://openalex.org/W2135079066","https://openalex.org/W2139753312","https://openalex.org/W2142013909","https://openalex.org/W2144483796","https://openalex.org/W2144727125","https://openalex.org/W2145268834","https://openalex.org/W2147905080","https://openalex.org/W2148557779","https://openalex.org/W2153026148","https://openalex.org/W2153153865","https://openalex.org/W2153187042","https://openalex.org/W2158714788","https://openalex.org/W2164886928","https://openalex.org/W3147254695","https://openalex.org/W4246356731"],"related_works":["https://openalex.org/W2928838901","https://openalex.org/W2574528486","https://openalex.org/W2494604670","https://openalex.org/W1578077690","https://openalex.org/W1998289425","https://openalex.org/W2303656598","https://openalex.org/W1510508486","https://openalex.org/W4206825711","https://openalex.org/W2114568928","https://openalex.org/W3086268169"],"abstract_inverted_index":{"By":[0,139],"exploiting":[1],"the":[2,18,44,77,100,117,142,155,165],"vast":[3],"protein":[4,7,42],"sequence":[5,38],"and":[6,61,67,86,120],"structure":[8,84,150],"data":[9,145],"available,":[10],"we":[11,107,152],"have":[12,71],"brought":[13],"secondary-structure":[14,49],"prediction":[15,85,151],"closer":[16],"to":[17],"expected":[19],"theoretical":[20],"limit.":[21],"When":[22],"tested":[23,95],"by":[24,124,158],"a":[25,30,112],"leave-one-out":[26],"cross":[27],"validation":[28],"on":[29,96,148],"non-redundant":[31],"set":[32],"of":[33,80,144,164],"PDB":[34],"cutting":[35],"at":[36,130],"30%":[37],"identity":[39],"containing":[40],"5860":[41],"chains,":[43],"overall":[45,56],"per-residue":[46,57],"accuracy":[47,58,134,156],"for":[48,59,82,135],"prediction,":[50],"i.e.":[51],"Q3":[52,93],"is":[53],"82.9%.":[54],"The":[55],"three-":[60],"eight-state":[62],"Shape":[63,105,137],"Strings":[64],"are":[65],"85.1":[66],"71.5%,":[68],"respectively.":[69],"We":[70],"also":[72],"benchmarked":[73],"our":[74,87,109],"program":[75,88,128],"with":[76,99,111,116,161],"latest":[78],"version":[79],"PSIPRED":[81],"secondary":[83],"predicted":[89,129],"0.3%":[90],"better":[91,132],"in":[92,133],"when":[94],"2241":[97],"chains":[98],"same":[101,118],"training":[102],"set.":[103],"For":[104],"Strings,":[106],"compared":[108],"method":[110,115],"recently":[113],"published":[114],"dataset":[119],"definition":[121],"as":[122],"used":[123],"that":[125,154],"method.":[126],"Our":[127],"2.2%":[131],"three-state":[136],"Strings.":[138],"quantitatively":[140],"investigating":[141],"effect":[143],"base":[146],"size":[147],"1D":[149],"show":[153],"increases":[157],"approximately":[159],"1%":[160],"every":[162],"doubling":[163],"database":[166],"size.":[167]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":2},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
