{"id":"https://openalex.org/W2117942198","doi":"https://doi.org/10.1145/1458449.1458459","title":"Peptide programs","display_name":"Peptide programs","publication_year":2008,"publication_date":"2008-10-30","ids":{"openalex":"https://openalex.org/W2117942198","doi":"https://doi.org/10.1145/1458449.1458459","mag":"2117942198"},"language":"en","primary_location":{"id":"doi:10.1145/1458449.1458459","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1458449.1458459","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd international workshop on Data and text mining in bioinformatics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076982064","display_name":"Andr\u00e9 O. Falc\u00e3o","orcid":"https://orcid.org/0000-0002-3588-8746"},"institutions":[{"id":"https://openalex.org/I141596103","display_name":"University of Lisbon","ror":"https://ror.org/01c27hj86","country_code":"PT","type":"education","lineage":["https://openalex.org/I141596103"]}],"countries":["PT"],"is_corresponding":true,"raw_author_name":"Andre O. Falcao","raw_affiliation_strings":["University of Lisbon, Lisbon, Portugal"],"affiliations":[{"raw_affiliation_string":"University of Lisbon, Lisbon, Portugal","institution_ids":["https://openalex.org/I141596103"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072979086","display_name":"Daniel Faria","orcid":"https://orcid.org/0000-0003-1511-277X"},"institutions":[{"id":"https://openalex.org/I141596103","display_name":"University of Lisbon","ror":"https://ror.org/01c27hj86","country_code":"PT","type":"education","lineage":["https://openalex.org/I141596103"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Daniel Faria","raw_affiliation_strings":["University of Lisbon, Lisbon, Portugal"],"affiliations":[{"raw_affiliation_string":"University of Lisbon, Lisbon, Portugal","institution_ids":["https://openalex.org/I141596103"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047651121","display_name":"Ant\u00f3nio E. N. Ferreira","orcid":"https://orcid.org/0000-0002-9625-8115"},"institutions":[{"id":"https://openalex.org/I141596103","display_name":"University of Lisbon","ror":"https://ror.org/01c27hj86","country_code":"PT","type":"education","lineage":["https://openalex.org/I141596103"]}],"countries":["PT"],"is_corresponding":false,"raw_author_name":"Ant\u00f3nio Ferreira","raw_affiliation_strings":["University of Lisbon, Lisbon, Portugal"],"affiliations":[{"raw_affiliation_string":"University of Lisbon, Lisbon, Portugal","institution_ids":["https://openalex.org/I141596103"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5076982064"],"corresponding_institution_ids":["https://openalex.org/I141596103"],"apc_list":null,"apc_paid":null,"fwci":0.2693,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.60022031,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"37","last_page":"44"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10519","display_name":"Advanced Proteomics Techniques and Applications","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1607","display_name":"Spectroscopy"},"field":{"id":"https://openalex.org/fields/16","display_name":"Chemistry"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10521","display_name":"RNA and protein synthesis mechanisms","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7469638586044312},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5775889158248901},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.571368396282196},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5660129189491272},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.5387841463088989},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.5207028985023499},{"id":"https://openalex.org/keywords/protein-sequencing","display_name":"Protein sequencing","score":0.486227422952652},{"id":"https://openalex.org/keywords/binary-classification","display_name":"Binary classification","score":0.4853455126285553},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.44918641448020935},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.43583351373672485},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4214867353439331},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.4118429720401764},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.41184067726135254},{"id":"https://openalex.org/keywords/peptide-sequence","display_name":"Peptide sequence","score":0.30703309178352356},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12939870357513428}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7469638586044312},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5775889158248901},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.571368396282196},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5660129189491272},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.5387841463088989},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.5207028985023499},{"id":"https://openalex.org/C10010492","wikidata":"https://www.wikidata.org/wiki/Q3142557","display_name":"Protein sequencing","level":4,"score":0.486227422952652},{"id":"https://openalex.org/C66905080","wikidata":"https://www.wikidata.org/wiki/Q17005494","display_name":"Binary classification","level":3,"score":0.4853455126285553},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.44918641448020935},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.43583351373672485},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4214867353439331},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.4118429720401764},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.41184067726135254},{"id":"https://openalex.org/C167625842","wikidata":"https://www.wikidata.org/wiki/Q899763","display_name":"Peptide sequence","level":3,"score":0.30703309178352356},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12939870357513428},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1458449.1458459","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1458449.1458459","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd international workshop on Data and text mining in bioinformatics","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W141916262","https://openalex.org/W183334939","https://openalex.org/W1484341170","https://openalex.org/W1569127951","https://openalex.org/W1576818901","https://openalex.org/W1955025754","https://openalex.org/W1975394843","https://openalex.org/W1979434225","https://openalex.org/W1982597966","https://openalex.org/W1988790447","https://openalex.org/W1990215053","https://openalex.org/W1995918845","https://openalex.org/W2015809665","https://openalex.org/W2027364181","https://openalex.org/W2027716098","https://openalex.org/W2032838501","https://openalex.org/W2037104504","https://openalex.org/W2079766279","https://openalex.org/W2081998091","https://openalex.org/W2085176241","https://openalex.org/W2098223336","https://openalex.org/W2100320834","https://openalex.org/W2106207199","https://openalex.org/W2107432340","https://openalex.org/W2109553965","https://openalex.org/W2117619142","https://openalex.org/W2117806412","https://openalex.org/W2119027485","https://openalex.org/W2123858481","https://openalex.org/W2129368756","https://openalex.org/W2129922540","https://openalex.org/W2135217050","https://openalex.org/W2136769496","https://openalex.org/W2142013909","https://openalex.org/W2148279834","https://openalex.org/W2158292827","https://openalex.org/W2158714788","https://openalex.org/W3104778163"],"related_works":["https://openalex.org/W2053028024","https://openalex.org/W2011602722","https://openalex.org/W2024383575","https://openalex.org/W1965617697","https://openalex.org/W2072002764","https://openalex.org/W2012033675","https://openalex.org/W2033162017","https://openalex.org/W2073512219","https://openalex.org/W1991987880","https://openalex.org/W2061704447"],"abstract_inverted_index":{"Functional":[0],"prediction/classification":[1],"of":[2,26,96,112,131,142,176,191,210],"proteins":[3],"is":[4,68,99,153,170,195],"a":[5,13,53,63,73,106,120,151],"central":[6],"problem":[7],"in":[8,70,93,104,172,197,201],"bioinformatics.":[9],"Alignment":[10],"methods":[11],"are":[12,35,148],"useful":[14],"approach,":[15],"but":[16],"have":[17,20],"limitations,":[18],"which":[19,135],"prompted":[21],"the":[22,94,113,123,129,132,143,173,192,204,208,211],"development":[23],"and":[24,42,66,117,150,165,199,214],"use":[25,44],"machine":[27,32,86],"learning":[28,33,87],"approaches.":[29],"However,":[30],"traditional":[31],"approaches":[34],"unable":[36],"to":[37,51,61,110,217],"exploit":[38,77],"sequence":[39,46,78,221],"data":[40,79],"directly,":[41],"instead":[43],"derived":[45],"features":[47],"or":[48],"Kernel":[49],"functions":[50],"obtain":[52],"feature":[54],"space.":[55],"Because":[56],"theoretically":[57],"all":[58],"information":[59],"necessary":[60],"predict":[62],"protein's":[64],"structure":[65],"function":[67],"contained":[69],"its":[71,137,215],"sequence,":[72],"methodology":[74,88,102,144,169],"that":[75],"could":[76,81],"directly":[80],"be":[82],"advantageous.":[83],"A":[84],"novel":[85],"for":[89,155],"protein":[90,121],"classification,":[91],"inspired":[92],"concept":[95],"fragment":[97],"programs,":[98],"presented.":[100],"This":[101],"consists":[103],"assigning":[105],"minimal":[107],"computer":[108],"program":[109,124],"each":[111],"20":[114],"amino":[115,133],"acids,":[116],"then":[118],"representing":[119],"as":[122],"resulting":[125],"from":[126,220],"applying":[127],"sequentially":[128],"programs":[130],"acids":[134],"compose":[136],"sequence.":[138],"The":[139,168,186],"basic":[140],"concepts":[141],"presented":[145],"(peptide":[146],"programs)":[147],"discussed":[149],"framework":[152],"proposed":[154,212],"their":[156],"implementation,":[157],"including":[158],"instruction":[159],"set,":[160],"virtual":[161],"machine,":[162],"evaluation":[163],"procedures":[164],"convergence":[166],"methods.":[167],"tested":[171],"binary":[174,193],"classification":[175],"33,500":[177],"enzymes":[178],"into":[179],"182":[180],"distinct":[181],"Enzyme":[182],"Commission":[183],"(EC)":[184],"classes.":[185],"average":[187],"Matthews":[188],"correlation":[189],"coefficient":[190],"classifiers":[194],"0.75":[196],"training":[198],"0.68":[200],"validation.":[202],"Overall,":[203],"results":[205],"obtained":[206],"demonstrate":[207],"potential":[209],"methodology,":[213],"ability":[216],"extract":[218],"knowledge":[219],"data,":[222],"using":[223],"very":[224],"few":[225],"computational":[226],"resources":[227]},"counts_by_year":[{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2016-06-24T00:00:00"}
