{"id":"https://openalex.org/W2016202965","doi":"https://doi.org/10.1145/1102351.1102458","title":"Large scale genomic sequence SVM classifiers","display_name":"Large scale genomic sequence SVM classifiers","publication_year":2005,"publication_date":"2005-01-01","ids":{"openalex":"https://openalex.org/W2016202965","doi":"https://doi.org/10.1145/1102351.1102458","mag":"2016202965"},"language":"en","primary_location":{"id":"doi:10.1145/1102351.1102458","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1102351.1102458","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd international conference on Machine learning  - ICML '05","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110197966","display_name":"S\u00f6ren Sonnenburg","orcid":null},"institutions":[{"id":"https://openalex.org/I4923324","display_name":"Fraunhofer Society","ror":"https://ror.org/05hkkdn48","country_code":"DE","type":"funder","lineage":["https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"S\u00f6ren Sonnenburg","raw_affiliation_strings":["Fraunhofer Institute FIRST, Berlin, Germany","Fraunhofer\u2013Institute FIRST, Berlin, Germany"],"affiliations":[{"raw_affiliation_string":"Fraunhofer Institute FIRST, Berlin, Germany","institution_ids":["https://openalex.org/I4923324"]},{"raw_affiliation_string":"Fraunhofer\u2013Institute FIRST, Berlin, Germany","institution_ids":["https://openalex.org/I4923324"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035416263","display_name":"Gunnar R\u00e4tsch","orcid":"https://orcid.org/0000-0001-5486-8532"},"institutions":[{"id":"https://openalex.org/I149899117","display_name":"Max Planck Society","ror":"https://ror.org/01hhn8329","country_code":"DE","type":"funder","lineage":["https://openalex.org/I149899117"]},{"id":"https://openalex.org/I4210147862","display_name":"Friedrich Miescher Laboratory","ror":"https://ror.org/04vh1tq58","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210147862"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Gunnar R\u00e4tsch","raw_affiliation_strings":["Friedrich Miescher Laboratory of the Max Planck Society, T\u00fcbingen, Germany","Friedrich Miescher Laboratory of the Max Planck Society, T\u00fcbingen, Germany#TAB#"],"affiliations":[{"raw_affiliation_string":"Friedrich Miescher Laboratory of the Max Planck Society, T\u00fcbingen, Germany","institution_ids":["https://openalex.org/I4210147862","https://openalex.org/I149899117"]},{"raw_affiliation_string":"Friedrich Miescher Laboratory of the Max Planck Society, T\u00fcbingen, Germany#TAB#","institution_ids":["https://openalex.org/I149899117"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044005697","display_name":"Bernhard Sch\u00f6lkopf","orcid":"https://orcid.org/0000-0002-8177-0925"},"institutions":[{"id":"https://openalex.org/I149899117","display_name":"Max Planck Society","ror":"https://ror.org/01hhn8329","country_code":"DE","type":"funder","lineage":["https://openalex.org/I149899117"]},{"id":"https://openalex.org/I4210112925","display_name":"Max Planck Institute for Biological Cybernetics","ror":"https://ror.org/026nmvv73","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210112925"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Bernhard Sch\u00f6lkopf","raw_affiliation_strings":["Max Planck Institute for Biological Cybernetics, T\u00fcbingen, Germany","Max-Planck-Institute for Biological Cybernetics, T\u00fcbingen, Germany#TAB#"],"affiliations":[{"raw_affiliation_string":"Max Planck Institute for Biological Cybernetics, T\u00fcbingen, Germany","institution_ids":["https://openalex.org/I4210112925"]},{"raw_affiliation_string":"Max-Planck-Institute for Biological Cybernetics, T\u00fcbingen, Germany#TAB#","institution_ids":["https://openalex.org/I149899117"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110197966"],"corresponding_institution_ids":["https://openalex.org/I4923324"],"apc_list":null,"apc_paid":null,"fwci":7.8974,"has_fulltext":false,"cited_by_count":48,"citation_normalized_percentile":{"value":0.97274644,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"848","last_page":"855"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10015","display_name":"Genomics and Phylogenetic Studies","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.7770334482192993},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.7561633586883545},{"id":"https://openalex.org/keywords/string-kernel","display_name":"String kernel","score":0.6876431107521057},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6621381640434265},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6126686334609985},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5907819271087646},{"id":"https://openalex.org/keywords/tree-kernel","display_name":"Tree kernel","score":0.579856276512146},{"id":"https://openalex.org/keywords/kernel-method","display_name":"Kernel method","score":0.5570458173751831},{"id":"https://openalex.org/keywords/sequential-minimal-optimization","display_name":"Sequential minimal optimization","score":0.5378742218017578},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.505962073802948},{"id":"https://openalex.org/keywords/radial-basis-function-kernel","display_name":"Radial basis function kernel","score":0.46696192026138306},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.46107104420661926},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.4325609803199768},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3497313857078552},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.25622886419296265},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.10927170515060425},{"id":"https://openalex.org/keywords/genetics","display_name":"Genetics","score":0.08476406335830688}],"concepts":[{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.7770334482192993},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.7561633586883545},{"id":"https://openalex.org/C55851704","wikidata":"https://www.wikidata.org/wiki/Q7623983","display_name":"String kernel","level":5,"score":0.6876431107521057},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6621381640434265},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6126686334609985},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5907819271087646},{"id":"https://openalex.org/C140417398","wikidata":"https://www.wikidata.org/wiki/Q16933942","display_name":"Tree kernel","level":5,"score":0.579856276512146},{"id":"https://openalex.org/C122280245","wikidata":"https://www.wikidata.org/wiki/Q620622","display_name":"Kernel method","level":3,"score":0.5570458173751831},{"id":"https://openalex.org/C10719679","wikidata":"https://www.wikidata.org/wiki/Q2679145","display_name":"Sequential minimal optimization","level":3,"score":0.5378742218017578},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.505962073802948},{"id":"https://openalex.org/C75866337","wikidata":"https://www.wikidata.org/wiki/Q7280263","display_name":"Radial basis function kernel","level":4,"score":0.46696192026138306},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.46107104420661926},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4325609803199768},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3497313857078552},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.25622886419296265},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.10927170515060425},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.08476406335830688},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1102351.1102458","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1102351.1102458","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 22nd international conference on Machine learning  - ICML '05","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W854322902","https://openalex.org/W1512098439","https://openalex.org/W1542652324","https://openalex.org/W1563088657","https://openalex.org/W1576520375","https://openalex.org/W1601740268","https://openalex.org/W1602916555","https://openalex.org/W1968114652","https://openalex.org/W2020816856","https://openalex.org/W2041956242","https://openalex.org/W2099401974","https://openalex.org/W2106868411","https://openalex.org/W2107751776","https://openalex.org/W2108995755","https://openalex.org/W2111765516","https://openalex.org/W2114049512","https://openalex.org/W2114281975","https://openalex.org/W2119821739","https://openalex.org/W2124158580","https://openalex.org/W2124225821","https://openalex.org/W2127949964","https://openalex.org/W2136145671","https://openalex.org/W2149684865","https://openalex.org/W2155653793","https://openalex.org/W2156455118","https://openalex.org/W2539561358","https://openalex.org/W3023786531","https://openalex.org/W3144379435","https://openalex.org/W4239510810","https://openalex.org/W4293196852"],"related_works":["https://openalex.org/W1558903433","https://openalex.org/W2043334680","https://openalex.org/W1550105856","https://openalex.org/W2022862073","https://openalex.org/W2963372274","https://openalex.org/W2604913466","https://openalex.org/W2020816856","https://openalex.org/W2189183545","https://openalex.org/W2016202965","https://openalex.org/W2107725114"],"abstract_inverted_index":{"In":[0,28,50],"genomic":[1],"sequence":[2],"analysis":[3],"tasks":[4],"like":[5],"splice":[6],"site":[7],"recognition":[8],"or":[9],"promoter":[10],"identification,":[11],"large":[12,93,148],"amounts":[13],"of":[14,61,73,102,136],"training":[15,65,72,96],"sequences":[16,121],"are":[17],"available,":[18],"and":[19,36,44,59,76,90,104],"indeed":[20],"needed":[21],"to":[22,69,143],"achieve":[23],"sufficiently":[24],"high":[25],"classification":[26],"performances.":[27],"this":[29],"work":[30],"we":[31,52],"study":[32],"two":[33],"recently":[34],"proposed":[35],"successfully":[37],"used":[38],"kernels,":[39],"namely":[40],"the":[41,45,71,74,87,129,134],"Spectrum":[42],"kernel":[43,48,89,115],"Weighted":[46],"Degree":[47],"(WD).":[49],"particular,":[51],"suggest":[53],"several":[54,124],"extensions":[55],"using":[56,109,128],"Suffix":[57],"Trees":[58],"modifications":[60],"an":[62],"SMO-like":[63],"SVM":[64,95],"algorithm":[66],"in":[67],"order":[68],"accelerate":[70],"SVMs":[75],"their":[77],"evaluation":[78,118],"on":[79,119,133,145],"test":[80],"sequences.":[81,152],"Our":[82,139],"simulations":[83],"show":[84],"that":[85],"for":[86],"spectrum":[88],"WD":[91],"kernel,":[92],"scale":[94],"can":[97],"be":[98],"accelerated":[99],"by":[100],"factors":[101],"20":[103],"4":[105],"times,":[106],"respectively,":[107],"while":[108],"much":[110],"less":[111],"memory":[112],"(e.g.":[113],"no":[114],"caching).":[116],"The":[117],"new":[120,130],"is":[122],"often":[123],"thousand":[125],"times":[126],"faster":[127],"techniques":[131],"(depending":[132],"number":[135],"Support":[137],"Vectors).":[138],"method":[140],"allows":[141],"us":[142],"train":[144],"sets":[146],"as":[147,149],"one":[150],"million":[151]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":4},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
