{"id":"https://openalex.org/W2014148372","doi":"https://doi.org/10.1093/bioinformatics/9.3.343","title":"The position end-set tree: A small automaton for word recognition in biological sequences","display_name":"The position end-set tree: A small automaton for word recognition in biological sequences","publication_year":1993,"publication_date":"1993-01-01","ids":{"openalex":"https://openalex.org/W2014148372","doi":"https://doi.org/10.1093/bioinformatics/9.3.343","mag":"2014148372","pmid":"https://pubmed.ncbi.nlm.nih.gov/8324635"},"language":"en","primary_location":{"id":"doi:10.1093/bioinformatics/9.3.343","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/9.3.343","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/9/3/343/604550/9-3-343.pdf","source":{"id":"https://openalex.org/S4210188263","display_name":"Computer applications in the biosciences","issn_l":"0266-7061","issn":["0266-7061","1460-2059"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://academic.oup.com/bioinformatics/article-pdf/9/3/343/604550/9-3-343.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015331935","display_name":"Christophe Lef\u00e8vre","orcid":"https://orcid.org/0000-0002-2876-0648"},"institutions":[{"id":"https://openalex.org/I1314466530","display_name":"Tokai University","ror":"https://ror.org/01p7qe739","country_code":"JP","type":"education","lineage":["https://openalex.org/I1314466530"]},{"id":"https://openalex.org/I4210110781","display_name":"ARCH Development Corporation","ror":"https://ror.org/021wdzv30","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210110781"]}],"countries":["JP","US"],"is_corresponding":false,"raw_author_name":"Christophe Lef\u00e8vre","raw_affiliation_strings":["Genosphere Project, ERATO, JRDC, Tokai University School of Medicine, Kanagawa, Japan","Genosphere Project, ERATO, JRDC, Tokai University School of MedicineIsehara, Kanagawa 259-11, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Genosphere Project, ERATO, JRDC, Tokai University School of Medicine, Kanagawa, Japan","institution_ids":["https://openalex.org/I1314466530","https://openalex.org/I4210110781"]},{"raw_affiliation_string":"Genosphere Project, ERATO, JRDC, Tokai University School of MedicineIsehara, Kanagawa 259-11, Japan","institution_ids":["https://openalex.org/I1314466530"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5110009465","display_name":"Joh\u2010E Ikeda","orcid":null},"institutions":[{"id":"https://openalex.org/I1314466530","display_name":"Tokai University","ror":"https://ror.org/01p7qe739","country_code":"JP","type":"education","lineage":["https://openalex.org/I1314466530"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Joh-E Ikeda","raw_affiliation_strings":["Genosphere Project, ERATO, JRDC, Tokai University School of Medicine Isehara, Kanagawa 259-11, Japan","Genosphere Project, ERATO, JRDC, Tokai University School of MedicineIsehara, Kanagawa 259-11, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Genosphere Project, ERATO, JRDC, Tokai University School of Medicine Isehara, Kanagawa 259-11, Japan","institution_ids":["https://openalex.org/I1314466530"]},{"raw_affiliation_string":"Genosphere Project, ERATO, JRDC, Tokai University School of MedicineIsehara, Kanagawa 259-11, Japan","institution_ids":["https://openalex.org/I1314466530"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.7493,"has_fulltext":true,"cited_by_count":8,"citation_normalized_percentile":{"value":0.85747335,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"9","issue":"3","first_page":"343","last_page":"348"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12254","display_name":"Machine Learning in Bioinformatics","score":0.9904999732971191,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9793000221252441,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/substring","display_name":"Substring","score":0.8230117559432983},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.7199587225914001},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6602059602737427},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5753818154335022},{"id":"https://openalex.org/keywords/deterministic-finite-automaton","display_name":"Deterministic finite automaton","score":0.5736095905303955},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.5433292388916016},{"id":"https://openalex.org/keywords/automaton","display_name":"Automaton","score":0.5382888317108154},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5376016497612},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.529455840587616},{"id":"https://openalex.org/keywords/position","display_name":"Position (finance)","score":0.5075684785842896},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4968107044696808},{"id":"https://openalex.org/keywords/suffix-tree","display_name":"Suffix tree","score":0.4702547788619995},{"id":"https://openalex.org/keywords/finite-state-machine","display_name":"Finite-state machine","score":0.4615042805671692},{"id":"https://openalex.org/keywords/string-searching-algorithm","display_name":"String searching algorithm","score":0.4538584351539612},{"id":"https://openalex.org/keywords/deterministic-automaton","display_name":"Deterministic automaton","score":0.4438523054122925},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.4398486316204071},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.43790119886398315},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3029961884021759},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.28297749161720276},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2711992859840393},{"id":"https://openalex.org/keywords/pattern-matching","display_name":"Pattern matching","score":0.22692766785621643},{"id":"https://openalex.org/keywords/combinatorics","display_name":"Combinatorics","score":0.21805882453918457},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.08136293292045593}],"concepts":[{"id":"https://openalex.org/C182407805","wikidata":"https://www.wikidata.org/wiki/Q2626534","display_name":"Substring","level":3,"score":0.8230117559432983},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.7199587225914001},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6602059602737427},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5753818154335022},{"id":"https://openalex.org/C104091681","wikidata":"https://www.wikidata.org/wiki/Q837528","display_name":"Deterministic finite automaton","level":3,"score":0.5736095905303955},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.5433292388916016},{"id":"https://openalex.org/C112505250","wikidata":"https://www.wikidata.org/wiki/Q787116","display_name":"Automaton","level":2,"score":0.5382888317108154},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5376016497612},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.529455840587616},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.5075684785842896},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4968107044696808},{"id":"https://openalex.org/C2781166958","wikidata":"https://www.wikidata.org/wiki/Q1426863","display_name":"Suffix tree","level":3,"score":0.4702547788619995},{"id":"https://openalex.org/C167822520","wikidata":"https://www.wikidata.org/wiki/Q176452","display_name":"Finite-state machine","level":2,"score":0.4615042805671692},{"id":"https://openalex.org/C7757238","wikidata":"https://www.wikidata.org/wiki/Q374040","display_name":"String searching algorithm","level":3,"score":0.4538584351539612},{"id":"https://openalex.org/C194525867","wikidata":"https://www.wikidata.org/wiki/Q5265707","display_name":"Deterministic automaton","level":3,"score":0.4438523054122925},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4398486316204071},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.43790119886398315},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3029961884021759},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.28297749161720276},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2711992859840393},{"id":"https://openalex.org/C68859911","wikidata":"https://www.wikidata.org/wiki/Q1503724","display_name":"Pattern matching","level":2,"score":0.22692766785621643},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.21805882453918457},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.08136293292045593},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0}],"mesh":[{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D000465","descriptor_name":"Algorithms","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D001330","descriptor_name":"Electronic Data Processing","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001330","descriptor_name":"Electronic Data Processing","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D001330","descriptor_name":"Electronic Data Processing","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008838","descriptor_name":"Microcomputers","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008838","descriptor_name":"Microcomputers","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D008838","descriptor_name":"Microcomputers","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009862","descriptor_name":"Online Systems","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009862","descriptor_name":"Online Systems","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D009862","descriptor_name":"Online Systems","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D010363","descriptor_name":"Pattern Recognition, Automated","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011382","descriptor_name":"Programming, Linear","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011382","descriptor_name":"Programming, Linear","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D011382","descriptor_name":"Programming, Linear","qualifier_ui":null,"qualifier_name":null,"is_major_topic":false},{"descriptor_ui":"D017421","descriptor_name":"Sequence Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017421","descriptor_name":"Sequence Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true},{"descriptor_ui":"D017421","descriptor_name":"Sequence Analysis","qualifier_ui":null,"qualifier_name":null,"is_major_topic":true}],"locations_count":2,"locations":[{"id":"doi:10.1093/bioinformatics/9.3.343","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/9.3.343","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/9/3/343/604550/9-3-343.pdf","source":{"id":"https://openalex.org/S4210188263","display_name":"Computer applications in the biosciences","issn_l":"0266-7061","issn":["0266-7061","1460-2059"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},{"id":"pmid:8324635","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/8324635","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computer applications in the biosciences : CABIOS","raw_type":null}],"best_oa_location":{"id":"doi:10.1093/bioinformatics/9.3.343","is_oa":true,"landing_page_url":"https://doi.org/10.1093/bioinformatics/9.3.343","pdf_url":"https://academic.oup.com/bioinformatics/article-pdf/9/3/343/604550/9-3-343.pdf","source":{"id":"https://openalex.org/S4210188263","display_name":"Computer applications in the biosciences","issn_l":"0266-7061","issn":["0266-7061","1460-2059"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Bioinformatics","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2014148372.pdf","grobid_xml":"https://content.openalex.org/works/W2014148372.grobid-xml"},"referenced_works_count":4,"referenced_works":["https://openalex.org/W1991864975","https://openalex.org/W2010808181","https://openalex.org/W4236236547","https://openalex.org/W4302339081"],"related_works":["https://openalex.org/W2102450363","https://openalex.org/W2162655434","https://openalex.org/W1608420182","https://openalex.org/W2902482624","https://openalex.org/W2067956663","https://openalex.org/W1593730394","https://openalex.org/W52396946","https://openalex.org/W2298204719","https://openalex.org/W3022344494","https://openalex.org/W2070949798"],"abstract_inverted_index":{"We":[0,41,68],"consider":[1],"the":[2,34,39,62,84,97],"basic":[3],"function":[4],"which":[5],"locates":[6],"a":[7,13,43,47,55,66,80,90],"specific":[8],"string":[9],"of":[10,65,87,99],"symbols":[11],"within":[12],"longer":[14],"sequence.":[15,67],"When":[16],"one":[17],"is":[18,26],"expecting":[19],"to":[20,28,33,36,45],"do":[21],"many":[22],"substring":[23],"searches":[24],"it":[25],"worthwhile":[27],"build":[29],"an":[30,70],"auxiliary":[31],"index":[32,49],"sequence":[35,91,101],"aid":[37],"in":[38,76,89,96],"search.":[40],"propose":[42],"method":[44],"generate":[46],"compact":[48],"that":[50],"can":[51,93],"be":[52,94],"viewed":[53],"as":[54],"small":[56],"(partial)":[57],"deterministic":[58],"finite":[59],"automaton":[60],"recognizing":[61],"subword":[63],"structure":[64,82],"present":[69],"algorithm":[71],"for":[72],"its":[73],"construction":[74],"on-line":[75],"linear":[77],"time.":[78],"Such":[79],"data":[81],"permits":[83],"efficient":[85],"localization":[86],"subwords":[88],"and":[92],"used":[95],"development":[98],"interactive":[100],"analysis":[102],"software.":[103]},"counts_by_year":[{"year":2017,"cited_by_count":1}],"updated_date":"2026-06-16T09:24:06.705377","created_date":"2025-10-10T00:00:00"}
