{"id":"https://openalex.org/W2040254860","doi":"https://doi.org/10.1145/2590774","title":"Space-Efficient Frameworks for Top- <i>k</i> String Retrieval","display_name":"Space-Efficient Frameworks for Top- <i>k</i> String Retrieval","publication_year":2014,"publication_date":"2014-04-01","ids":{"openalex":"https://openalex.org/W2040254860","doi":"https://doi.org/10.1145/2590774","mag":"2040254860"},"language":"en","primary_location":{"id":"doi:10.1145/2590774","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2590774","pdf_url":null,"source":{"id":"https://openalex.org/S118992489","display_name":"Journal of the ACM","issn_l":"0004-5411","issn":["0004-5411","1557-735X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of the ACM","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013112058","display_name":"Wing-Kai Hon","orcid":"https://orcid.org/0000-0002-0570-2904"},"institutions":[{"id":"https://openalex.org/I25846049","display_name":"National Tsing Hua University","ror":"https://ror.org/00zdnkx70","country_code":"TW","type":"education","lineage":["https://openalex.org/I25846049"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Wing-Kai Hon","raw_affiliation_strings":["National Tsing Hua University, Taiwan, China","National Tsing Hua University, Taiwan, China#TAB#"],"affiliations":[{"raw_affiliation_string":"National Tsing Hua University, Taiwan, China","institution_ids":["https://openalex.org/I25846049"]},{"raw_affiliation_string":"National Tsing Hua University, Taiwan, China#TAB#","institution_ids":["https://openalex.org/I25846049"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5105778361","display_name":"Rahul Shah","orcid":"https://orcid.org/0000-0002-0605-5681"},"institutions":[{"id":"https://openalex.org/I121820613","display_name":"Louisiana State University","ror":"https://ror.org/05ect4e57","country_code":"US","type":"education","lineage":["https://openalex.org/I121820613"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rahul Shah","raw_affiliation_strings":["Louisiana State University, Baton Rouge, LA","Louisiana State University , Baton Rouge, LA"],"affiliations":[{"raw_affiliation_string":"Louisiana State University, Baton Rouge, LA","institution_ids":["https://openalex.org/I121820613"]},{"raw_affiliation_string":"Louisiana State University , Baton Rouge, LA","institution_ids":["https://openalex.org/I121820613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049669178","display_name":"Sharma V. Thankachan","orcid":"https://orcid.org/0000-0002-6852-1035"},"institutions":[{"id":"https://openalex.org/I121820613","display_name":"Louisiana State University","ror":"https://ror.org/05ect4e57","country_code":"US","type":"education","lineage":["https://openalex.org/I121820613"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sharma V. Thankachan","raw_affiliation_strings":["Louisiana State University, Baton Rouge, LA","Louisiana State University , Baton Rouge, LA"],"affiliations":[{"raw_affiliation_string":"Louisiana State University, Baton Rouge, LA","institution_ids":["https://openalex.org/I121820613"]},{"raw_affiliation_string":"Louisiana State University , Baton Rouge, LA","institution_ids":["https://openalex.org/I121820613"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003340402","display_name":"Jeffrey Scott Vitter","orcid":"https://orcid.org/0000-0001-7970-6118"},"institutions":[{"id":"https://openalex.org/I146416000","display_name":"University of Kansas","ror":"https://ror.org/001tmjg57","country_code":"US","type":"education","lineage":["https://openalex.org/I146416000"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jeffrey Scott Vitter","raw_affiliation_strings":["The University of Kansas, Lawrence, KS"],"affiliations":[{"raw_affiliation_string":"The University of Kansas, Lawrence, KS","institution_ids":["https://openalex.org/I146416000"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5013112058"],"corresponding_institution_ids":["https://openalex.org/I25846049"],"apc_list":null,"apc_paid":null,"fwci":6.9532,"has_fulltext":false,"cited_by_count":30,"citation_normalized_percentile":{"value":0.96895375,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"61","issue":"2","first_page":"1","last_page":"36"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6905906796455383},{"id":"https://openalex.org/keywords/inverted-index","display_name":"Inverted index","score":0.6317982077598572},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.6292915344238281},{"id":"https://openalex.org/keywords/string","display_name":"String (physics)","score":0.6202245354652405},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.6114537715911865},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6111261248588562},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6104280352592468},{"id":"https://openalex.org/keywords/phrase","display_name":"Phrase","score":0.5456893444061279},{"id":"https://openalex.org/keywords/string-searching-algorithm","display_name":"String searching algorithm","score":0.5455141067504883},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.46593016386032104},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.46393874287605286},{"id":"https://openalex.org/keywords/document-retrieval","display_name":"Document retrieval","score":0.45935606956481934},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.448337584733963},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.42835038900375366},{"id":"https://openalex.org/keywords/pattern-matching","display_name":"Pattern matching","score":0.31570467352867126},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.2522960901260376},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.24899649620056152},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.23213961720466614},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.222852885723114}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6905906796455383},{"id":"https://openalex.org/C130590232","wikidata":"https://www.wikidata.org/wiki/Q1671754","display_name":"Inverted index","level":3,"score":0.6317982077598572},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.6292915344238281},{"id":"https://openalex.org/C157486923","wikidata":"https://www.wikidata.org/wiki/Q1376436","display_name":"String (physics)","level":2,"score":0.6202245354652405},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.6114537715911865},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6111261248588562},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6104280352592468},{"id":"https://openalex.org/C2776224158","wikidata":"https://www.wikidata.org/wiki/Q187931","display_name":"Phrase","level":2,"score":0.5456893444061279},{"id":"https://openalex.org/C7757238","wikidata":"https://www.wikidata.org/wiki/Q374040","display_name":"String searching algorithm","level":3,"score":0.5455141067504883},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.46593016386032104},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.46393874287605286},{"id":"https://openalex.org/C161156560","wikidata":"https://www.wikidata.org/wiki/Q1638872","display_name":"Document retrieval","level":2,"score":0.45935606956481934},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.448337584733963},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.42835038900375366},{"id":"https://openalex.org/C68859911","wikidata":"https://www.wikidata.org/wiki/Q1503724","display_name":"Pattern matching","level":2,"score":0.31570467352867126},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.2522960901260376},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.24899649620056152},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.23213961720466614},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.222852885723114},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C37914503","wikidata":"https://www.wikidata.org/wiki/Q156495","display_name":"Mathematical physics","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/2590774","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2590774","pdf_url":null,"source":{"id":"https://openalex.org/S118992489","display_name":"Journal of the ACM","issn_l":"0004-5411","issn":["0004-5411","1557-735X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of the ACM","raw_type":"journal-article"},{"id":"pmh:oai:repository.lsu.edu:eecs_pubs-3648","is_oa":false,"landing_page_url":"https://repository.lsu.edu/eecs_pubs/2646","pdf_url":null,"source":{"id":"https://openalex.org/S4210169993","display_name":"Civil War Book Review","issn_l":"1528-6592","issn":["1528-6592"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310315936","host_organization_name":"Louisiana State University","host_organization_lineage":["https://openalex.org/P4310315936"],"host_organization_lineage_names":["Louisiana State University"],"type":"journal"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Faculty Publications","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2645501517","display_name":null,"funder_award_id":"CCF-1017623/CCF-1218904","funder_id":"https://openalex.org/F4320337387","funder_display_name":"Division of Computing and Communication Foundations"},{"id":"https://openalex.org/G4410987","display_name":null,"funder_award_id":"99-2221-E-007-123 and 102-2221-E-007-068","funder_id":"https://openalex.org/F4320321040","funder_display_name":"National Science Council"}],"funders":[{"id":"https://openalex.org/F4320321040","display_name":"National Science Council","ror":"https://ror.org/02kv4zf79"},{"id":"https://openalex.org/F4320337387","display_name":"Division of Computing and Communication Foundations","ror":"https://ror.org/01mng8331"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":72,"referenced_works":["https://openalex.org/W80537337","https://openalex.org/W92500321","https://openalex.org/W110689283","https://openalex.org/W135814361","https://openalex.org/W227213435","https://openalex.org/W297061308","https://openalex.org/W1480869033","https://openalex.org/W1504477191","https://openalex.org/W1506856932","https://openalex.org/W1509727978","https://openalex.org/W1518925092","https://openalex.org/W1520568851","https://openalex.org/W1608371561","https://openalex.org/W1672848638","https://openalex.org/W1705815624","https://openalex.org/W1752316941","https://openalex.org/W1854214752","https://openalex.org/W1860074289","https://openalex.org/W1876495223","https://openalex.org/W1965490077","https://openalex.org/W1970194312","https://openalex.org/W1974033543","https://openalex.org/W1985108724","https://openalex.org/W1986970296","https://openalex.org/W1989749956","https://openalex.org/W1996641400","https://openalex.org/W2007791040","https://openalex.org/W2013291893","https://openalex.org/W2014318353","https://openalex.org/W2027252317","https://openalex.org/W2038142281","https://openalex.org/W2044014345","https://openalex.org/W2049415039","https://openalex.org/W2051158076","https://openalex.org/W2065209187","https://openalex.org/W2072336782","https://openalex.org/W2073921136","https://openalex.org/W2080106004","https://openalex.org/W2085218027","https://openalex.org/W2085933841","https://openalex.org/W2088386938","https://openalex.org/W2090021115","https://openalex.org/W2093918274","https://openalex.org/W2095875205","https://openalex.org/W2099649694","https://openalex.org/W2107079154","https://openalex.org/W2107082304","https://openalex.org/W2111046826","https://openalex.org/W2111340560","https://openalex.org/W2114790712","https://openalex.org/W2118274795","https://openalex.org/W2121252285","https://openalex.org/W2134696992","https://openalex.org/W2137120608","https://openalex.org/W2141957180","https://openalex.org/W2144759920","https://openalex.org/W2149530645","https://openalex.org/W2151453116","https://openalex.org/W2158874082","https://openalex.org/W2159647614","https://openalex.org/W2160484851","https://openalex.org/W2165621523","https://openalex.org/W2170899819","https://openalex.org/W2173123188","https://openalex.org/W2191209163","https://openalex.org/W2533248932","https://openalex.org/W2621280964","https://openalex.org/W2912556076","https://openalex.org/W2951188822","https://openalex.org/W3124327069","https://openalex.org/W4242124034","https://openalex.org/W4292081093"],"related_works":["https://openalex.org/W118734887","https://openalex.org/W3145288231","https://openalex.org/W2371263218","https://openalex.org/W2092552144","https://openalex.org/W2354196777","https://openalex.org/W2965473297","https://openalex.org/W2108265183","https://openalex.org/W2257399947","https://openalex.org/W2248278495","https://openalex.org/W2001669800"],"abstract_inverted_index":{"The":[0,161,171,221,342],"inverted":[1],"index":[2,21,413],"is":[3,43,149,195,284,323,358],"the":[4,20,23,37,50,55,59,133,136,152,197,206,219,288,291,309,380,394],"backbone":[5],"of":[6,17,25,34,39,49,62,78,116,135,145,166,173,208,218,229,268,287,305,320,325,382,396],"modern":[7],"web":[8,18],"search":[9,41,137],"engines.":[10],"For":[11],"each":[12],"word":[13,29,80],"in":[14,122,156,274,302,412],"a":[15,32,40,46,68,89,99,140,179,249,275,285,402],"collection":[16],"documents,":[19],"records":[22],"list":[24,48],"documents":[26,53,297],"where":[27],"this":[28,272],"occurs.":[30],"Given":[31],"set":[33,100,128],"query":[35,60,142,162,340,343,384,416],"words,":[36],"job":[38],"engine":[42],"to":[44,150,196,225,299,392],"output":[45],"ranked":[47],"most":[51,294],"relevant":[52,85,191,295],"containing":[54,158],"query.":[56],"However,":[57],"if":[58,355],"consists":[61],"an":[63,126],"arbitrary":[64,327],"string\u2014which":[65],"can":[66,175,345],"be":[67,176,300,346],"partial":[69],"word,":[70],"multiword":[71],"phrase,":[72],"or":[73,168,215,415,418],"more":[74,169,277],"generally":[75],"any":[76],"sequence":[77],"characters\u2014then":[79],"boundaries":[81],"are":[82,97,205,298],"no":[83],"longer":[84],"and":[86,132,245,255,290,366],"we":[87,96,362,388],"need":[88],"different":[90],"approach.":[91],"In":[92],"string":[93],"retrieval":[94,230],"settings,":[95],"given":[98,141,233],"D":[101,114,117,157],"={":[102],"d":[103,106,109,113,185,193],"1":[104],",":[105,108,111,148,184],"2":[107],"3":[110],"\u2026,":[112],"}":[115],"strings":[118,155],"with":[119,330],"n":[120,263,265,317],"characters":[121],"total":[123],"taken":[124],"from":[125,400],"alphabet":[127],"\u03a3":[129],"=":[130],"[\u03c3],":[131],"task":[134],"engine,":[138],"for":[139,242],"pattern":[143,198,209,213],"P":[144,159,183,199],"length":[146],"p":[147,334,351],"report":[151],"\u201cmost":[153],"relevant\u201d":[154],".":[160,200],"may":[163],"also":[164,407],"consist":[165],"two":[167,240],"patterns.":[170,398],"notion":[172],"relevance":[174],"captured":[177],"by":[178,234],"function":[180],"score":[181,203,328,373],"(":[182,262,316,333,350],"r":[186,194],"),":[187],"which":[188],"indicates":[189],"how":[190],"document":[192],"Some":[201],"example":[202],"functions":[204,329],"frequency":[207,244],"occurrences,":[210,214],"proximity":[211],"between":[212],"pattern-independent":[216],"PageRank":[217],"document.":[220],"first":[222,310],"formal":[223],"framework":[224,312,391],"study":[226,271],"such":[227],"kinds":[228],"problems":[231],"was":[232],"Muthukrishnan":[235],"[SODA":[236],"2002].":[237],"He":[238,247],"considered":[239],"metrics":[241,254],"relevance:":[243],"proximity.":[246],"took":[248],"threshold-based":[250],"approach":[251],"on":[252],"these":[253],"gave":[256],"data":[257],"structures":[258],"that":[259,322],"use":[260],"O":[261,315,332,349],"log":[264,337],")":[266,318,339,354],"words":[267,319],"space.":[269],"We":[270,307],"problem":[273],"somewhat":[276],"natural":[278],"top-":[279],"k":[280,283,293,336,338,353],"framework.":[281],"Here,":[282],"part":[286],"query,":[289],"top":[292],"(highest-scoring)":[296],"reported":[301],"sorted":[303,356],"order":[304,357],"score.":[306],"present":[308],"linear-space":[311],"(i.e.,":[313],"using":[314],"space)":[321],"capable":[324],"handling":[326],"near-optimal":[331],"+":[335,352],"time.":[341,385],"time":[344,417],"made":[347],"optimal":[348],"not":[359],"necessary.":[360],"Further,":[361],"derive":[363],"compact":[364],"space":[365,368,376,414],"succinct":[367],"indexes":[369],"(for":[370],"some":[371],"specific":[372],"functions).":[374],"This":[375],"compression":[377],"comes":[378],"at":[379],"cost":[381],"higher":[383],"At":[386],"last,":[387],"extend":[389],"our":[390,405],"handle":[393],"case":[395],"multiple":[397],"Apart":[399],"providing":[401],"robust":[403],"framework,":[404],"results":[406,411],"improve":[408],"many":[409],"earlier":[410],"both.":[419]},"counts_by_year":[{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":6},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
