{"id":"https://openalex.org/W2088039650","doi":"https://doi.org/10.1145/1353343.1353408","title":"Efficient LCA based keyword search in XML data","display_name":"Efficient LCA based keyword search in XML data","publication_year":2008,"publication_date":"2008-03-25","ids":{"openalex":"https://openalex.org/W2088039650","doi":"https://doi.org/10.1145/1353343.1353408","mag":"2088039650"},"language":"en","primary_location":{"id":"doi:10.1145/1353343.1353408","is_oa":true,"landing_page_url":"https://doi.org/10.1145/1353343.1353408","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/1353343.1353408","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 11th international conference on Extending database technology: Advances in database technology","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/1353343.1353408","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101854939","display_name":"Yu Xu","orcid":"https://orcid.org/0000-0003-1498-8331"},"institutions":[{"id":"https://openalex.org/I4210158714","display_name":"Teradata (United States)","ror":"https://ror.org/04vkkat38","country_code":"US","type":"company","lineage":["https://openalex.org/I4210158714"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yu Xu","raw_affiliation_strings":["Teradata, San Diego, CA"],"affiliations":[{"raw_affiliation_string":"Teradata, San Diego, CA","institution_ids":["https://openalex.org/I4210158714"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059167302","display_name":"Yannis Papakonstantinou","orcid":"https://orcid.org/0009-0007-6360-9496"},"institutions":[{"id":"https://openalex.org/I36258959","display_name":"University of California San Diego","ror":"https://ror.org/0168r3w48","country_code":"US","type":"education","lineage":["https://openalex.org/I36258959"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yannis Papakonstantinou","raw_affiliation_strings":["University of California, San Diego, CA"],"affiliations":[{"raw_affiliation_string":"University of California, San Diego, CA","institution_ids":["https://openalex.org/I36258959"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5101854939"],"corresponding_institution_ids":["https://openalex.org/I4210158714"],"apc_list":null,"apc_paid":null,"fwci":19.2483,"has_fulltext":true,"cited_by_count":119,"citation_normalized_percentile":{"value":0.99408284,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"535","last_page":"546"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8137478828430176},{"id":"https://openalex.org/keywords/xml","display_name":"XML","score":0.7477643489837646},{"id":"https://openalex.org/keywords/stack","display_name":"Stack (abstract data type)","score":0.633596658706665},{"id":"https://openalex.org/keywords/keyword-density","display_name":"Keyword density","score":0.5867351293563843},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5523258447647095},{"id":"https://openalex.org/keywords/keyword-search","display_name":"Keyword search","score":0.5394870042800903},{"id":"https://openalex.org/keywords/core","display_name":"Core (optical fiber)","score":0.45239442586898804},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4515463709831238},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.35629552602767944},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.34901320934295654},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.34191828966140747},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.14439740777015686},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.07810118794441223}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8137478828430176},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.7477643489837646},{"id":"https://openalex.org/C9395851","wikidata":"https://www.wikidata.org/wiki/Q177929","display_name":"Stack (abstract data type)","level":2,"score":0.633596658706665},{"id":"https://openalex.org/C57560718","wikidata":"https://www.wikidata.org/wiki/Q125627","display_name":"Keyword density","level":3,"score":0.5867351293563843},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5523258447647095},{"id":"https://openalex.org/C2988412617","wikidata":"https://www.wikidata.org/wiki/Q7441656","display_name":"Keyword search","level":2,"score":0.5394870042800903},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.45239442586898804},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4515463709831238},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.35629552602767944},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.34901320934295654},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34191828966140747},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.14439740777015686},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.07810118794441223},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1353343.1353408","is_oa":true,"landing_page_url":"https://doi.org/10.1145/1353343.1353408","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/1353343.1353408","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 11th international conference on Extending database technology: Advances in database technology","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/1353343.1353408","is_oa":true,"landing_page_url":"https://doi.org/10.1145/1353343.1353408","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/1353343.1353408","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 11th international conference on Extending database technology: Advances in database technology","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2088039650.pdf","grobid_xml":"https://content.openalex.org/works/W2088039650.grobid-xml"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W1538246304","https://openalex.org/W1565494300","https://openalex.org/W1605802622","https://openalex.org/W1671881141","https://openalex.org/W1973828215","https://openalex.org/W2074863013","https://openalex.org/W2084243240","https://openalex.org/W2088499566","https://openalex.org/W2098388305","https://openalex.org/W2105819430","https://openalex.org/W2108572131","https://openalex.org/W2113112851","https://openalex.org/W2115221525","https://openalex.org/W2121350579","https://openalex.org/W2125630417","https://openalex.org/W2128034913","https://openalex.org/W2138540053","https://openalex.org/W2148126307","https://openalex.org/W2169624745","https://openalex.org/W2171874178","https://openalex.org/W6633810142","https://openalex.org/W6635724992","https://openalex.org/W6637382334"],"related_works":["https://openalex.org/W2197440050","https://openalex.org/W2614415116","https://openalex.org/W2506633375","https://openalex.org/W2265184183","https://openalex.org/W2466354565","https://openalex.org/W2128147992","https://openalex.org/W2011694694","https://openalex.org/W1496822620","https://openalex.org/W1964343189","https://openalex.org/W2103866954"],"abstract_inverted_index":{"Keyword":[0],"search":[1],"in":[2,68,90,104,122,133,165],"XML":[3],"documents":[4],"based":[5,43],"on":[6,44],"the":[7,53,64,69,73,76,82,85,91,95,101,113,118,128,148,168],"notion":[8],"of":[9,16,52,66,75,84,100,135,145,170],"lowest":[10],"common":[11],"ancestors":[12],"(LCAs)":[13],"and":[14,78,110,117,138],"modifications":[15],"it":[17],"has":[18],"recently":[19],"gained":[20],"research":[21],"interest":[22],"[10,":[23],"14,":[24],"22].":[25],"In":[26,93],"this":[27],"paper":[28],"we":[29],"propose":[30],"an":[31],"efficient":[32],"algorithm":[33,56,116,131],"called":[34],"Indexed":[35,54,114,129],"Stack":[36,55,115,130],"to":[37,40,47],"find":[38],"answers":[39],"keyword":[41,89,156],"queries":[42],"XRank's":[45],"semantics":[46],"LCA":[48],"[10].":[49,123],"The":[50,124],"complexity":[51,99],"is":[57,63,72,81,106,163],"O(kd|S1|":[58],"log":[59],"|S|)":[60],"where":[61],"k":[62],"number":[65],"keywords":[67,171],"query,":[70],"d":[71],"depth":[74],"tree":[77],"|S1|":[79],"(|S|)":[80],"occurrence":[83],"least":[86,152],"(most)":[87],"frequent":[88],"query.":[92],"comparison,":[94],"best":[96],"worst":[97],"case":[98],"core":[102,120],"algorithms":[103,121,142],"[10]":[105],"O(kd|S|).":[107],"We":[108],"analytically":[109],"experimentally":[111],"evaluate":[112],"two":[119],"results":[125],"show":[126],"that":[127],"outperforms":[132],"terms":[134],"both":[136],"CPU":[137],"I/O":[139],"costs":[140],"other":[141],"by":[143],"orders":[144],"magnitude":[146],"when":[147],"query":[149],"contains":[150],"at":[151],"one":[153],"low":[154],"frequency":[155,160],"along":[157],"with":[158],"high":[159],"keywords.":[161],"This":[162],"important":[164],"practice":[166],"since":[167],"frequencies":[169],"typically":[172],"vary":[173],"significantly.":[174]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":6},{"year":2016,"cited_by_count":8},{"year":2015,"cited_by_count":10},{"year":2014,"cited_by_count":6},{"year":2013,"cited_by_count":16},{"year":2012,"cited_by_count":15}],"updated_date":"2026-03-11T06:11:40.159057","created_date":"2025-10-10T00:00:00"}
