{"id":"https://openalex.org/W2536202408","doi":"https://doi.org/10.1109/fskd.2016.7603390","title":"Distributed XPath query processing over large XML data based on MapReduce framework","display_name":"Distributed XPath query processing over large XML data based on MapReduce framework","publication_year":2016,"publication_date":"2016-08-01","ids":{"openalex":"https://openalex.org/W2536202408","doi":"https://doi.org/10.1109/fskd.2016.7603390","mag":"2536202408"},"language":"en","primary_location":{"id":"doi:10.1109/fskd.2016.7603390","is_oa":false,"landing_page_url":"https://doi.org/10.1109/fskd.2016.7603390","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 12th International Conference on Natural Computation, Fuzzy Systems and Knowledge Discovery (ICNC-FSKD)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5040666670","display_name":"Hongjie Fan","orcid":"https://orcid.org/0000-0002-4872-8557"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hongjie Fan","raw_affiliation_strings":["School of Electronics Engineering and Computer Science, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics Engineering and Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100450581","display_name":"Dongsheng Wang","orcid":"https://orcid.org/0000-0001-7697-562X"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongsheng Wang","raw_affiliation_strings":["School of Software and Microelectronics, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Software and Microelectronics, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023014733","display_name":"Junfei Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Junfei Liu","raw_affiliation_strings":["National Engineering Research Center for Software Engineering, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center for Software Engineering, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5040666670"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.5791,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.72642385,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1447","last_page":"1453"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9850000143051147,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/xpath","display_name":"XPath","score":0.971290111541748},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8883938789367676},{"id":"https://openalex.org/keywords/xml-database","display_name":"XML database","score":0.7351411581039429},{"id":"https://openalex.org/keywords/streaming-xml","display_name":"Streaming XML","score":0.7259371280670166},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.49783968925476074},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.48037606477737427},{"id":"https://openalex.org/keywords/simple-api-for-xml","display_name":"Simple API for XML","score":0.43258464336395264},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4295041561126709},{"id":"https://openalex.org/keywords/query-optimization","display_name":"Query optimization","score":0.4104107916355133},{"id":"https://openalex.org/keywords/xml","display_name":"XML","score":0.40162524580955505},{"id":"https://openalex.org/keywords/efficient-xml-interchange","display_name":"Efficient XML Interchange","score":0.3808581233024597},{"id":"https://openalex.org/keywords/xml-signature","display_name":"XML Signature","score":0.35249125957489014},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.335548996925354},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.08905142545700073}],"concepts":[{"id":"https://openalex.org/C2780213375","wikidata":"https://www.wikidata.org/wiki/Q16340","display_name":"XPath","level":4,"score":0.971290111541748},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8883938789367676},{"id":"https://openalex.org/C183068750","wikidata":"https://www.wikidata.org/wiki/Q357393","display_name":"XML database","level":3,"score":0.7351411581039429},{"id":"https://openalex.org/C44883583","wikidata":"https://www.wikidata.org/wiki/Q7622687","display_name":"Streaming XML","level":3,"score":0.7259371280670166},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.49783968925476074},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.48037606477737427},{"id":"https://openalex.org/C8595896","wikidata":"https://www.wikidata.org/wiki/Q577094","display_name":"Simple API for XML","level":5,"score":0.43258464336395264},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4295041561126709},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.4104107916355133},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.40162524580955505},{"id":"https://openalex.org/C11508877","wikidata":"https://www.wikidata.org/wiki/Q1124477","display_name":"Efficient XML Interchange","level":3,"score":0.3808581233024597},{"id":"https://openalex.org/C34330436","wikidata":"https://www.wikidata.org/wiki/Q979532","display_name":"XML Signature","level":4,"score":0.35249125957489014},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.335548996925354},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.08905142545700073}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/fskd.2016.7603390","is_oa":false,"landing_page_url":"https://doi.org/10.1109/fskd.2016.7603390","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 12th International Conference on Natural Computation, Fuzzy Systems and Knowledge Discovery (ICNC-FSKD)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":7,"referenced_works":["https://openalex.org/W1965822699","https://openalex.org/W1966540900","https://openalex.org/W2036504249","https://openalex.org/W2051949043","https://openalex.org/W2128549389","https://openalex.org/W2173213060","https://openalex.org/W2238970349"],"related_works":["https://openalex.org/W165852420","https://openalex.org/W207633616","https://openalex.org/W3129453902","https://openalex.org/W2096927233","https://openalex.org/W4252337924","https://openalex.org/W1530834279","https://openalex.org/W252540258","https://openalex.org/W2186509186","https://openalex.org/W2142016651","https://openalex.org/W2121785123"],"abstract_inverted_index":{"The":[0,130],"volume":[1,60],"of":[2,23,61,96],"XML":[3,24,33,62,74,113],"data":[4,12,34,75,114],"is":[5,19,27,136],"tremendous":[6],"in":[7,11,36,100,107],"many":[8],"areas,":[9],"especially":[10],"logging":[13],"and":[14,121,138],"scientific":[15],"areas.":[16],"XPath":[17,48,89],"query":[18,31,49,90],"the":[20,71,80,87,97,103,111,118,128],"core":[21],"operation":[22],"process.":[25],"It":[26],"a":[28,37,58],"challenge":[29],"to":[30,69,79,92,109,126],"massive":[32,59],"stored":[35],"distributed":[38,47,81,88],"manner.":[39],"In":[40],"this":[41,141],"paper,":[42],"we":[43,85,116],"present":[44,86],"an":[45],"efficient":[46,137],"processing":[50],"using":[51,102],"MapReduce,":[52],"which":[53],"simultaneously":[54],"processes":[55],"queries":[56],"for":[57],"data.":[63],"We":[64],"first":[65],"use":[66,122],"virtual":[67],"nodes":[68],"split":[70],"large":[72,112],"scale":[73],"file":[76],"into":[77],"filesplits":[78],"storage":[82],"system.":[83],"Then":[84],"algorithm":[91],"compute":[93],"different":[94],"fragments":[95],"document":[98],"tree":[99],"parallel":[101],"MapReduce":[104],"framework.":[105],"Furthermore,":[106],"order":[108],"handle":[110],"efficiently,":[115],"build":[117],"partitional":[119],"index":[120],"random":[123],"access":[124],"mechanism":[125],"perform":[127],"query.":[129],"experimentation":[131],"shows":[132],"that":[133],"our":[134],"approach":[135],"scalable":[139],"on":[140],"issue.":[142]},"counts_by_year":[{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
