{"id":"https://openalex.org/W2076898137","doi":"https://doi.org/10.1145/1031171.1031209","title":"Scalable sequential pattern mining for biological sequences","display_name":"Scalable sequential pattern mining for biological sequences","publication_year":2004,"publication_date":"2004-11-13","ids":{"openalex":"https://openalex.org/W2076898137","doi":"https://doi.org/10.1145/1031171.1031209","mag":"2076898137"},"language":"en","primary_location":{"id":"doi:10.1145/1031171.1031209","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1031171.1031209","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the thirteenth ACM international conference on Information and knowledge management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100726480","display_name":"Ke Wang","orcid":"https://orcid.org/0000-0002-8483-3047"},"institutions":[{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Ke Wang","raw_affiliation_strings":["Simon Fraser University"],"affiliations":[{"raw_affiliation_string":"Simon Fraser University","institution_ids":["https://openalex.org/I18014758"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102127734","display_name":"Yabo Xu","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]},{"id":"https://openalex.org/I18014758","display_name":"Simon Fraser University","ror":"https://ror.org/0213rcc28","country_code":"CA","type":"education","lineage":["https://openalex.org/I18014758"]}],"countries":["CA","HK"],"is_corresponding":false,"raw_author_name":"Yabo Xu","raw_affiliation_strings":["Simon Fraser University and Chinese University of Hong Kong","Simon Fraser University and Chinese University of Hong Kong#TAB#"],"affiliations":[{"raw_affiliation_string":"Simon Fraser University and Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633","https://openalex.org/I18014758"]},{"raw_affiliation_string":"Simon Fraser University and Chinese University of Hong Kong#TAB#","institution_ids":["https://openalex.org/I177725633","https://openalex.org/I18014758"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075642293","display_name":"Jeffrey Xu Yu","orcid":"https://orcid.org/0000-0002-9738-827X"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jeffrey Xu Yu","raw_affiliation_strings":["Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100726480"],"corresponding_institution_ids":["https://openalex.org/I18014758"],"apc_list":null,"apc_paid":null,"fwci":13.4141,"has_fulltext":false,"cited_by_count":102,"citation_normalized_percentile":{"value":0.98283798,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"178","last_page":"187"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9675999879837036,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7322434186935425},{"id":"https://openalex.org/keywords/pattern-search","display_name":"Pattern search","score":0.7199238538742065},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7030107378959656},{"id":"https://openalex.org/keywords/pattern-matching","display_name":"Pattern matching","score":0.6724215745925903},{"id":"https://openalex.org/keywords/alphabet","display_name":"Alphabet","score":0.5573329329490662},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5452658534049988},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5031053423881531},{"id":"https://openalex.org/keywords/phase","display_name":"Phase (matter)","score":0.49748876690864563},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4631352722644806},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4490920305252075},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.39922481775283813},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.30456581711769104},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.20992371439933777},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.07858780026435852},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.07564771175384521}],"concepts":[{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7322434186935425},{"id":"https://openalex.org/C82691427","wikidata":"https://www.wikidata.org/wiki/Q4291856","display_name":"Pattern search","level":2,"score":0.7199238538742065},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7030107378959656},{"id":"https://openalex.org/C68859911","wikidata":"https://www.wikidata.org/wiki/Q1503724","display_name":"Pattern matching","level":2,"score":0.6724215745925903},{"id":"https://openalex.org/C112876837","wikidata":"https://www.wikidata.org/wiki/Q837518","display_name":"Alphabet","level":2,"score":0.5573329329490662},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5452658534049988},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5031053423881531},{"id":"https://openalex.org/C44280652","wikidata":"https://www.wikidata.org/wiki/Q104837","display_name":"Phase (matter)","level":2,"score":0.49748876690864563},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4631352722644806},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4490920305252075},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.39922481775283813},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30456581711769104},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.20992371439933777},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.07858780026435852},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.07564771175384521},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1031171.1031209","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1031171.1031209","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the thirteenth ACM international conference on Information and knowledge management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4099999964237213,"display_name":"Responsible consumption and production","id":"https://metadata.un.org/sdg/12"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1584003909","https://openalex.org/W1585338396","https://openalex.org/W1597561788","https://openalex.org/W1608194207","https://openalex.org/W1641039719","https://openalex.org/W1956090332","https://openalex.org/W1994085050","https://openalex.org/W2009418433","https://openalex.org/W2009566340","https://openalex.org/W2032991899","https://openalex.org/W2036667662","https://openalex.org/W2068383400","https://openalex.org/W2069356553","https://openalex.org/W2108560469","https://openalex.org/W2126332379","https://openalex.org/W2141115288","https://openalex.org/W2147694185","https://openalex.org/W2154765457","https://openalex.org/W2156026066","https://openalex.org/W2158454296"],"related_works":["https://openalex.org/W4245829522","https://openalex.org/W4249081720","https://openalex.org/W2076898137","https://openalex.org/W1792581674","https://openalex.org/W2037965016","https://openalex.org/W2092552144","https://openalex.org/W2129436231","https://openalex.org/W2532549791","https://openalex.org/W2083577879","https://openalex.org/W127511151"],"abstract_inverted_index":{"Biosequences":[0],"typically":[1],"have":[2],"a":[3,6,26,56],"small":[4],"alphabet,":[5],"long":[7,88],"length,":[8],"and":[9,54,124,126,142],"patterns":[10,21,73,89],"containing":[11,74,90],"gaps":[12],"(i.e.,":[13],"\"don't":[14],"care\")":[15],"of":[16,29,105],"arbitrary":[17],"size.":[18],"Mining":[19],"frequent":[20],"in":[22,32,37,132],"such":[23],"sequences":[24,34],"faces":[25],"different":[27],"type":[28],"explosion":[30,47],"than":[31],"transaction":[33],"primarily":[35],"motivated":[36],"market-basket":[38],"analysis.":[39],"In":[40],"this":[41,46,63,138],"paper,":[42],"we":[43],"study":[44],"how":[45],"affects":[48],"the":[49,111,115,121,129,133],"classic":[50],"sequential":[51],"pattern":[52,122],"mining,":[53],"present":[55],"scalable":[57],"two-phase":[58],"algorithm":[59],"to":[60,109,118,127],"deal":[61],"with":[62],"new":[64],"explosion.":[65],"The":[66,83,103],"<i>Segment":[67],"Phase</i>":[68,85],"first":[69,116],"searches":[70,86],"for":[71,87],"short":[72],"no":[75],"gaps,":[76],"called":[77],"<i>segments</i>.":[78],"This":[79,98],"phase":[80,99,117],"is":[81,100,108],"efficient.":[82],"<i>Pattern":[84],"multiple":[91],"segments":[92],"separated":[93],"by":[94],"variable":[95],"length":[96],"gaps.":[97],"time":[101],"consuming.":[102],"purpose":[104],"two":[106],"phases":[107],"exploit":[110],"information":[112],"obtained":[113],"from":[114],"speed":[119],"up":[120],"growth":[123],"matching":[125],"prune":[128],"search":[130],"space":[131],"second":[134],"phase.":[135],"We":[136],"evaluate":[137],"approach":[139],"on":[140],"synthetic":[141],"real":[143],"life":[144],"data":[145],"sets.":[146]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":3},{"year":2017,"cited_by_count":8},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":11},{"year":2014,"cited_by_count":13},{"year":2013,"cited_by_count":5},{"year":2012,"cited_by_count":10}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
