{"id":"https://openalex.org/W2148754732","doi":"https://doi.org/10.1109/dasfaa.2003.1192390","title":"PathGuide: an efficient clustering based indexing method for XML path expressions","display_name":"PathGuide: an efficient clustering based indexing method for XML path expressions","publication_year":2003,"publication_date":"2003-01-01","ids":{"openalex":"https://openalex.org/W2148754732","doi":"https://doi.org/10.1109/dasfaa.2003.1192390","mag":"2148754732"},"language":"en","primary_location":{"id":"doi:10.1109/dasfaa.2003.1192390","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dasfaa.2003.1192390","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Eighth International Conference on Database Systems for Advanced Applications, 2003. (DASFAA 2003). Proceedings.","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103340525","display_name":"Jiefeng Cheng","orcid":null},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiefeng Cheng","raw_affiliation_strings":["Department of Computer Science and Engineering, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100782393","display_name":"Ge Yu","orcid":"https://orcid.org/0000-0002-9359-2812"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ge Yu","raw_affiliation_strings":["Department of Computer Science and Engineering, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054991337","display_name":"Guoren Wang","orcid":"https://orcid.org/0000-0002-0181-8379"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guoren Wang","raw_affiliation_strings":["Department of Computer Science and Engineering, Northeastern University, Shenyang, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Northeastern University, Shenyang, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075642293","display_name":"Jeffrey Xu Yu","orcid":"https://orcid.org/0000-0002-9738-827X"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"J.X. Yu","raw_affiliation_strings":["Department of System Engineering and Engineering Management, Chinese University of Hong Kong, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Department of System Engineering and Engineering Management, Chinese University of Hong Kong, Hong Kong, China","institution_ids":["https://openalex.org/I177725633"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5103340525"],"corresponding_institution_ids":["https://openalex.org/I9224756"],"apc_list":null,"apc_paid":null,"fwci":0.7083,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.78112692,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"1","issue":null,"first_page":"257","last_page":"264"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8242433071136475},{"id":"https://openalex.org/keywords/joins","display_name":"Joins","score":0.7040717005729675},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.6520518660545349},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.6481441259384155},{"id":"https://openalex.org/keywords/path-expression","display_name":"Path expression","score":0.6479007005691528},{"id":"https://openalex.org/keywords/xml","display_name":"XML","score":0.6403248906135559},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.56699538230896},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5630457401275635},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.46308571100234985},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4119185209274292},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.40424054861068726},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.3703748285770416},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.2633270025253296},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.1352325975894928},{"id":"https://openalex.org/keywords/query-language","display_name":"Query language","score":0.12811297178268433},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1006123423576355},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.07625320553779602}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8242433071136475},{"id":"https://openalex.org/C2778692605","wikidata":"https://www.wikidata.org/wiki/Q4041866","display_name":"Joins","level":2,"score":0.7040717005729675},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.6520518660545349},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.6481441259384155},{"id":"https://openalex.org/C61114434","wikidata":"https://www.wikidata.org/wiki/Q7144649","display_name":"Path expression","level":3,"score":0.6479007005691528},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.6403248906135559},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.56699538230896},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5630457401275635},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.46308571100234985},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4119185209274292},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.40424054861068726},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.3703748285770416},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2633270025253296},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.1352325975894928},{"id":"https://openalex.org/C192028432","wikidata":"https://www.wikidata.org/wiki/Q845739","display_name":"Query language","level":2,"score":0.12811297178268433},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1006123423576355},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.07625320553779602},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dasfaa.2003.1192390","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dasfaa.2003.1192390","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Eighth International Conference on Database Systems for Advanced Applications, 2003. (DASFAA 2003). Proceedings.","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1520108263","https://openalex.org/W1994694191","https://openalex.org/W2025695428","https://openalex.org/W2061884758","https://openalex.org/W2087060113","https://openalex.org/W2110459974","https://openalex.org/W2113836856","https://openalex.org/W2123645388","https://openalex.org/W2134356404","https://openalex.org/W2136016195","https://openalex.org/W2139475358","https://openalex.org/W2142200612","https://openalex.org/W2152175785","https://openalex.org/W2155512447","https://openalex.org/W2158237121","https://openalex.org/W4255338640","https://openalex.org/W6676678128","https://openalex.org/W6679759574","https://openalex.org/W6680718584","https://openalex.org/W6681184881","https://openalex.org/W6682307788"],"related_works":["https://openalex.org/W2048497404","https://openalex.org/W1551052685","https://openalex.org/W2159478743","https://openalex.org/W2371944575","https://openalex.org/W2128582123","https://openalex.org/W1562549404","https://openalex.org/W2372703907","https://openalex.org/W1994219592","https://openalex.org/W4240916939","https://openalex.org/W1777047301"],"abstract_inverted_index":{"This":[0],"paper":[1],"focuses":[2],"on":[3,84],"the":[4,16,19,42,46,52,70,75,89,102,119,124,131,147,175],"performance":[5],"improvement":[6],"for":[7,28,36,91],"long-path":[8],"XML":[9,31,39,71],"query":[10],"processing.":[11],"It":[12],"is":[13,49,95],"motivated":[14],"by":[15],"fact":[17],"that":[18,172],"existing":[20,47,148],"inverted":[21,72],"index":[22,73,103,143],"and":[23,88,158,168],"join":[24,150,156],"algorithms":[25],"are":[26,34,81,112,166],"efficient":[27],"short":[29],"path":[30,38,86,93,125,137],"queries,":[32],"but":[33],"inefficient":[35],"long":[37],"queries":[40],"since":[41],"response":[43],"time":[44],"of":[45,54,104,121,133],"approaches":[48],"exponential":[50],"to":[51,114,146],"length":[53],"paths.":[55],"We":[56],"propose":[57],"a":[58,98,134],"clustering":[59,76],"based":[60,83],"indexing":[61],"method,":[62,151],"called":[63],"PathGuide,":[64,122],"in":[65,97,129,182],"this":[66],"paper,":[67],"which":[68],"enhances":[69],"with":[74],"technique.":[77],"The":[78,162],"element":[79,106],"nodes":[80],"clustered":[82],"their":[85],"patterns":[87],"summary":[90],"such":[92],"information":[94],"kept":[96],"suffix":[99],"tree":[100],"as":[101],"these":[105],"nodes.":[107],"In":[108],"addition,":[109],"new":[110],"operations":[111],"proposed":[113],"fully":[115],"utilize":[116],"PathGuide.":[117],"With":[118],"assistance":[120],"unlike":[123],"expansion":[126],"approach":[127],"used":[128],"Lore,":[130],"set":[132],"relative":[135],"location":[136],"can":[138],"be":[139],"found":[140],"via":[141],"one-step":[142],"lookup.":[144],"Compared":[145],"structural":[149,176],"PathGuide":[152,173],"significantly":[153],"reduces":[154],"both":[155],"overhead":[157],"disk":[159],"I/O":[160],"cost.":[161],"extensive":[163],"experimental":[164],"studies":[165],"conducted":[167],"our":[169],"results":[170],"show":[171],"outperforms":[174],"joins":[177],"at":[178],"least":[179],"four":[180],"times":[181],"most":[183],"cases.":[184]},"counts_by_year":[{"year":2014,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
