{"id":"https://openalex.org/W4247827554","doi":"https://doi.org/10.1093/bioinformatics/btq251","title":"A support vector machine model for the prediction of proteotypic peptides for accurate mass and time proteomics","display_name":"A support vector machine model for the prediction of proteotypic peptides for accurate mass and time proteomics","publication_year":2010,"publication_date":"2010-06-16","ids":{"openalex":"https://openalex.org/W4247827554","doi":"https://doi.org/10.1093/bioinformatics/btq251"},"language":"en","primary_location":{"id":"doi:10.1093/bioinformatics/btq251","is_oa":false,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btq251","pdf_url":null,"source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020443342","display_name":"Bobbie\u2010Jo Webb\u2010Robertson","orcid":"https://orcid.org/0000-0002-4744-2397"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Bobbie-Jo M. Webb-Robertson","raw_affiliation_strings":["1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory"],"affiliations":[{"raw_affiliation_string":"1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058577320","display_name":"William R. Cannon","orcid":"https://orcid.org/0000-0003-3789-7889"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"William R. Cannon","raw_affiliation_strings":["1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory"],"affiliations":[{"raw_affiliation_string":"1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013287908","display_name":"Christopher Oehmen","orcid":"https://orcid.org/0009-0004-5246-930X"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christopher S. Oehmen","raw_affiliation_strings":["1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory"],"affiliations":[{"raw_affiliation_string":"1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113935679","display_name":"Anuj Shah","orcid":null},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anuj R. Shah","raw_affiliation_strings":["1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory"],"affiliations":[{"raw_affiliation_string":"1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043714956","display_name":"Vidhya Gurumoorthi","orcid":null},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vidhya Gurumoorthi","raw_affiliation_strings":["1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory"],"affiliations":[{"raw_affiliation_string":"1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085384361","display_name":"Mary Lipton","orcid":"https://orcid.org/0000-0001-7749-0077"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mary S. Lipton","raw_affiliation_strings":["1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory"],"affiliations":[{"raw_affiliation_string":"1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5053476989","display_name":"Katrina M. Waters","orcid":"https://orcid.org/0000-0003-4696-5396"},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Katrina M. Waters","raw_affiliation_strings":["1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory"],"affiliations":[{"raw_affiliation_string":"1 Computational Biology & Bioinformatics, 2 Scientific Data Management, 3 Applied Computer Science and 4 Biological Separations and Mass Spectrometry, Pacific Northwest National Laboratory","institution_ids":["https://openalex.org/I142606810"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5020443342"],"corresponding_institution_ids":["https://openalex.org/I142606810"],"apc_list":{"value":3618,"currency":"USD","value_usd":3618},"apc_paid":null,"fwci":2.1147,"has_fulltext":false,"cited_by_count":40,"citation_normalized_percentile":{"value":0.87276534,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"26","issue":"13","first_page":"1677","last_page":"1683"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10519","display_name":"Advanced Proteomics Techniques and Applications","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.6243266463279724},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.603323757648468},{"id":"https://openalex.org/keywords/mass-spectrometry","display_name":"Mass spectrometry","score":0.4919686019420624},{"id":"https://openalex.org/keywords/tandem-mass-spectrometry","display_name":"Tandem mass spectrometry","score":0.47827088832855225},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.47278520464897156},{"id":"https://openalex.org/keywords/computational-biology","display_name":"Computational biology","score":0.4448801279067993},{"id":"https://openalex.org/keywords/shewanella-oneidensis","display_name":"Shewanella oneidensis","score":0.4312220811843872},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4277617931365967},{"id":"https://openalex.org/keywords/proteomics","display_name":"Proteomics","score":0.4166874587535858},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.328673779964447},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.3073557913303375},{"id":"https://openalex.org/keywords/chromatography","display_name":"Chromatography","score":0.26761019229888916},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.18642014265060425},{"id":"https://openalex.org/keywords/biochemistry","display_name":"Biochemistry","score":0.140498548746109},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.08883747458457947}],"concepts":[{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.6243266463279724},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.603323757648468},{"id":"https://openalex.org/C162356407","wikidata":"https://www.wikidata.org/wiki/Q180809","display_name":"Mass spectrometry","level":2,"score":0.4919686019420624},{"id":"https://openalex.org/C31827203","wikidata":"https://www.wikidata.org/wiki/Q874296","display_name":"Tandem mass spectrometry","level":3,"score":0.47827088832855225},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.47278520464897156},{"id":"https://openalex.org/C70721500","wikidata":"https://www.wikidata.org/wiki/Q177005","display_name":"Computational biology","level":1,"score":0.4448801279067993},{"id":"https://openalex.org/C2781170380","wikidata":"https://www.wikidata.org/wiki/Q4049396","display_name":"Shewanella oneidensis","level":3,"score":0.4312220811843872},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4277617931365967},{"id":"https://openalex.org/C46111723","wikidata":"https://www.wikidata.org/wiki/Q471857","display_name":"Proteomics","level":3,"score":0.4166874587535858},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.328673779964447},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.3073557913303375},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.26761019229888916},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.18642014265060425},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.140498548746109},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.08883747458457947},{"id":"https://openalex.org/C523546767","wikidata":"https://www.wikidata.org/wiki/Q10876","display_name":"Bacteria","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1093/bioinformatics/btq251","is_oa":false,"landing_page_url":"https://doi.org/10.1093/bioinformatics/btq251","pdf_url":null,"source":{"id":"https://openalex.org/S52395412","display_name":"Bioinformatics","issn_l":"1367-4803","issn":["1367-4803","1367-4811"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320338354","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W73675633","https://openalex.org/W1495935761","https://openalex.org/W1519199376","https://openalex.org/W1536270569","https://openalex.org/W1563088657","https://openalex.org/W1572033224","https://openalex.org/W1578462894","https://openalex.org/W1597678601","https://openalex.org/W1975304761","https://openalex.org/W1978576205","https://openalex.org/W1982411844","https://openalex.org/W1995062121","https://openalex.org/W2005794750","https://openalex.org/W2007683306","https://openalex.org/W2015556811","https://openalex.org/W2023919356","https://openalex.org/W2026582002","https://openalex.org/W2044573154","https://openalex.org/W2046872827","https://openalex.org/W2050783490","https://openalex.org/W2051644573","https://openalex.org/W2053418558","https://openalex.org/W2053679126","https://openalex.org/W2053827324","https://openalex.org/W2059572899","https://openalex.org/W2062649377","https://openalex.org/W2073637473","https://openalex.org/W2084151531","https://openalex.org/W2086307871","https://openalex.org/W2130447268","https://openalex.org/W2143426320","https://openalex.org/W2148342439","https://openalex.org/W2155553629","https://openalex.org/W2156909104","https://openalex.org/W2161811833","https://openalex.org/W2167367944","https://openalex.org/W4388297464","https://openalex.org/W6632155089","https://openalex.org/W6652114615"],"related_works":["https://openalex.org/W2327186020","https://openalex.org/W2280454186","https://openalex.org/W2148274908","https://openalex.org/W2245307148","https://openalex.org/W2215869640","https://openalex.org/W1916525861","https://openalex.org/W1556573660","https://openalex.org/W2738776981","https://openalex.org/W2103021125","https://openalex.org/W2051901836"],"abstract_inverted_index":{"Abstract":[0],"Motivation:":[1],"The":[2],"standard":[3],"approach":[4],"to":[5,25,44,49],"identifying":[6],"peptides":[7,29,54],"based":[8,76],"on":[9,77],"accurate":[10],"mass":[11,23,34],"and":[12,47,86,109,112,145],"elution":[13],"time":[14],"(AMT)":[15],"compares":[16],"profiles":[17],"obtained":[18],"from":[19,32],"a":[20,26,64,72,139],"high":[21,148],"resolution":[22],"spectrometer":[24],"database":[27],"of":[28,80,92,123,128,142],"previously":[30],"identified":[31],"tandem":[33],"spectrometry":[35],"(MS/MS)":[36],"studies.":[37],"It":[38],"would":[39],"be":[40],"advantageous,":[41],"with":[42,125,138],"respect":[43],"both":[45],"accuracy":[46,121],"cost,":[48],"only":[50],"search":[51],"for":[52,88,107],"those":[53],"that":[55,70,133],"are":[56,136,159],"detectable":[57],"by":[58],"MS":[59],"(proteotypic).":[60],"Results:":[61],"We":[62],"present":[63],"support":[65],"vector":[66],"machine":[67],"(SVM)":[68],"model":[69],"uses":[71],"simple":[73],"descriptor":[74],"space":[75],"35":[78],"properties":[79],"amino":[81],"acid":[82],"content,":[83],"charge,":[84],"hydrophilicity":[85],"polarity":[87],"the":[89,115],"quantitative":[90],"prediction":[91],"proteotypic":[93],"peptides.":[94],"Using":[95],"three":[96],"independently":[97],"derived":[98],"AMT":[99],"databases":[100],"(Shewanella":[101],"oneidensis,":[102],"Salmonella":[103],"typhimurium,":[104],"Yersinia":[105],"pestis)":[106],"training":[108],"validation":[110],"within":[111],"across":[113],"species,":[114],"SVM":[116],"resulted":[117],"in":[118],"an":[119,126],"average":[120],"measure":[122],"\u223c0.83":[124],"SD":[127],"&amp;lt;0.038.":[129],"Furthermore,":[130],"we":[131],"demonstrate":[132],"these":[134],"results":[135],"achievable":[137],"small":[140],"set":[141],"13":[143],"variables":[144],"can":[146],"achieve":[147],"proteome":[149],"coverage.":[150],"Availability:":[151],"http://omics.pnl.gov/software/STEPP.php":[152],"Contact:":[153],"bj@pnl.gov":[154],"Supplementary":[155,157],"information:":[156],"data":[158],"available":[160],"at":[161],"Bioinformatics":[162],"online.":[163]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":7},{"year":2013,"cited_by_count":6},{"year":2012,"cited_by_count":6}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
