{"id":"https://openalex.org/W2566506518","doi":"https://doi.org/10.1109/tbdata.2016.2640301","title":"Toward Efficient and Flexible Metadata Indexing of Big Data Systems","display_name":"Toward Efficient and Flexible Metadata Indexing of Big Data Systems","publication_year":2016,"publication_date":"2016-12-17","ids":{"openalex":"https://openalex.org/W2566506518","doi":"https://doi.org/10.1109/tbdata.2016.2640301","mag":"2566506518"},"language":"en","primary_location":{"id":"doi:10.1109/tbdata.2016.2640301","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tbdata.2016.2640301","pdf_url":null,"source":{"id":"https://openalex.org/S2491400915","display_name":"IEEE Transactions on Big Data","issn_l":"2332-7790","issn":["2332-7790","2372-2096"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Big Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101671477","display_name":"Dongfang Zhao","orcid":"https://orcid.org/0000-0002-0677-634X"},"institutions":[{"id":"https://openalex.org/I201448701","display_name":"University of Washington","ror":"https://ror.org/00cvxb145","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Dongfang Zhao","raw_affiliation_strings":["Department of Computer Science and Engineering, University of Washington, Seattle, WA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, University of Washington, Seattle, WA","institution_ids":["https://openalex.org/I201448701"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109800827","display_name":"Kan Qiao","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kan Qiao","raw_affiliation_strings":["Google Inc., Kirkland, WA"],"affiliations":[{"raw_affiliation_string":"Google Inc., Kirkland, WA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100359931","display_name":"Zhou Zhou","orcid":"https://orcid.org/0000-0002-8637-3654"},"institutions":[{"id":"https://openalex.org/I180949307","display_name":"Illinois Institute of Technology","ror":"https://ror.org/037t3ry66","country_code":"US","type":"education","lineage":["https://openalex.org/I180949307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhou Zhou","raw_affiliation_strings":["Department of Computer Science, Illinois Institute of Technology, Chicago, IL"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Illinois Institute of Technology, Chicago, IL","institution_ids":["https://openalex.org/I180949307"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036106961","display_name":"Tonglin Li","orcid":"https://orcid.org/0000-0002-2874-8112"},"institutions":[{"id":"https://openalex.org/I1289243028","display_name":"Oak Ridge National Laboratory","ror":"https://ror.org/01qz5mb56","country_code":"US","type":"facility","lineage":["https://openalex.org/I1289243028","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I4210159294"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tonglin Li","raw_affiliation_strings":["Oak Ridge National Laboratory, Oak Ridge, TN"],"affiliations":[{"raw_affiliation_string":"Oak Ridge National Laboratory, Oak Ridge, TN","institution_ids":["https://openalex.org/I1289243028"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107853490","display_name":"Zhihan L\u00fc","orcid":null},"institutions":[{"id":"https://openalex.org/I45129253","display_name":"University College London","ror":"https://ror.org/02jx3x895","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I45129253"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Zhihan Lu","raw_affiliation_strings":["Department of Computer Science, University College London, London, United Kingdom"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University College London, London, United Kingdom","institution_ids":["https://openalex.org/I45129253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101619632","display_name":"Xiaohua Xu","orcid":"https://orcid.org/0000-0001-7770-803X"},"institutions":[{"id":"https://openalex.org/I172980758","display_name":"Kennesaw State University","ror":"https://ror.org/00jeqjx33","country_code":"US","type":"education","lineage":["https://openalex.org/I172980758"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaohua Xu","raw_affiliation_strings":["Department of Computer Science, Kennesaw State University, Kennesaw, GA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Kennesaw State University, Kennesaw, GA","institution_ids":["https://openalex.org/I172980758"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101671477"],"corresponding_institution_ids":["https://openalex.org/I201448701"],"apc_list":null,"apc_paid":null,"fwci":2.0399,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.88704662,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"3","issue":"1","first_page":"107","last_page":"117"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10742","display_name":"Peer-to-Peer Network Technologies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8595788478851318},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.839158296585083},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.6865262389183044},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.6669195294380188},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.42852553725242615},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3691822588443756},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3460730314254761},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.235792338848114}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8595788478851318},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.839158296585083},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.6865262389183044},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.6669195294380188},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.42852553725242615},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3691822588443756},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3460730314254761},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.235792338848114}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tbdata.2016.2640301","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tbdata.2016.2640301","pdf_url":null,"source":{"id":"https://openalex.org/S2491400915","display_name":"IEEE Transactions on Big Data","issn_l":"2332-7790","issn":["2332-7790","2372-2096"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Big Data","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306151","display_name":"Alfred P. Sloan Foundation","ror":"https://ror.org/052csg198"},{"id":"https://openalex.org/F4320306202","display_name":"Gordon and Betty Moore Foundation","ror":"https://ror.org/006wxqw41"},{"id":"https://openalex.org/F4320306854","display_name":"Washington Research Foundation","ror":"https://ror.org/00hasdx88"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W339752665","https://openalex.org/W1491030683","https://openalex.org/W1529205966","https://openalex.org/W1534481387","https://openalex.org/W1734799737","https://openalex.org/W1876353827","https://openalex.org/W1973462929","https://openalex.org/W1981420413","https://openalex.org/W1986447815","https://openalex.org/W1993017904","https://openalex.org/W1999984505","https://openalex.org/W2020572986","https://openalex.org/W2027758281","https://openalex.org/W2034586863","https://openalex.org/W2087946700","https://openalex.org/W2108841814","https://openalex.org/W2110020044","https://openalex.org/W2110298485","https://openalex.org/W2116079991","https://openalex.org/W2119565742","https://openalex.org/W2119738171","https://openalex.org/W2131645490","https://openalex.org/W2136009376","https://openalex.org/W2153704625","https://openalex.org/W2165329839","https://openalex.org/W2168067900","https://openalex.org/W2465447462","https://openalex.org/W2999097477","https://openalex.org/W3138135046","https://openalex.org/W4249823756","https://openalex.org/W4250390143","https://openalex.org/W6611599856","https://openalex.org/W6631739990","https://openalex.org/W6632020668","https://openalex.org/W6637631891","https://openalex.org/W6650418438","https://openalex.org/W6657560871","https://openalex.org/W6676560735","https://openalex.org/W6679471073","https://openalex.org/W6719751959"],"related_works":["https://openalex.org/W4322629366","https://openalex.org/W2808989540","https://openalex.org/W2397053934","https://openalex.org/W1039292361","https://openalex.org/W2731626691","https://openalex.org/W2551093110","https://openalex.org/W2148016376","https://openalex.org/W4237919137","https://openalex.org/W3184179822","https://openalex.org/W3095362084"],"abstract_inverted_index":{"In":[0],"Big":[1],"Data":[2],"era,":[3],"applications":[4],"are":[5,34],"generating":[6],"orders":[7],"of":[8,145,157],"magnitude":[9],"more":[10],"data":[11,24,90],"in":[12,67,73,106],"both":[13,63],"volume":[14],"and":[15,65,148,178],"quantity.":[16],"While":[17],"many":[18],"systems":[19],"emerge":[20],"to":[21,43,50,61,112,118,124,180,194],"address":[22,44,129],"such":[23],"explosion,":[25],"the":[26,45,83,96,155],"fact":[27],"that":[28,154,187],"these":[29],"data's":[30],"descriptors,":[31],"i.e.,":[32],"metadata,":[33],"also":[35],"\u201cbig\u201d":[36],"is":[37,49,58,92,100,160],"often":[38],"overlooked.":[39],"The":[40],"conventional":[41],"approach":[42],"big":[46],"metadata":[47,52,190],"issue":[48],"disperse":[51],"into":[53],"multiple":[54],"machines.":[55],"However,":[56],"it":[57],"extremely":[59],"difficult":[60],"preserve":[62],"load-balance":[64,99],"data-locality":[66],"this":[68,71,74,107],"approach.":[69],"To":[70,128],"end,":[72],"work":[75],"we":[76,132],"propose":[77],"hierarchical":[78],"indirection":[79,97],"layers":[80],"for":[81,139],"indexing":[82,137],"underlying":[84],"distributed":[85,136,175,183],"metadata.":[86,140],"By":[87],"doing":[88],"this,":[89],"locality":[91],"achieved":[93],"efficiently":[94],"by":[95,162,172,192],"while":[98],"preserved.":[101],"Three":[102],"key":[103],"challenges":[104],"exist":[105],"approach,":[108],"however:":[109],"first,":[110],"how":[111,117,123],"achieve":[113],"high":[114],"resilience;":[115],"second,":[116],"ensure":[119],"flexible":[120],"granularity;":[121],"third,":[122],"restrain":[125],"performance":[126],"overhead.":[127,200],"above":[130],"challenges,":[131],"design":[133],"Dindex,":[134],"a":[135,143,173,181,198],"service":[138],"Dindex":[141,159,168,188],"incorporates":[142],"hierarchy":[144],"coarse-grained":[146],"aggregation":[147],"horizontal":[149],"key-coalition.":[150],"Theoretical":[151],"analysis":[152],"shows":[153],"overhead":[156],"building":[158],"compensated":[161],"only":[163],"two":[164],"or":[165],"three":[166],"queries.":[167],"has":[169],"been":[170],"implemented":[171],"lightweight":[174],"key-value":[176],"store":[177],"integrated":[179],"fully-fledged":[182],"filesystem.":[184],"Experiments":[185],"demonstrated":[186],"accelerated":[189],"queries":[191],"up":[193],"60":[195],"percent":[196],"with":[197],"negligible":[199]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
