{"id":"https://openalex.org/W2783639050","doi":"https://doi.org/10.1109/bigdata.2017.8257927","title":"A semantics-aware storage framework for scalable processing of knowledge graphs on Hadoop","display_name":"A semantics-aware storage framework for scalable processing of knowledge graphs on Hadoop","publication_year":2017,"publication_date":"2017-12-01","ids":{"openalex":"https://openalex.org/W2783639050","doi":"https://doi.org/10.1109/bigdata.2017.8257927","mag":"2783639050"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2017.8257927","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2017.8257927","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032645513","display_name":"HyeongSik Kim","orcid":"https://orcid.org/0009-0001-7040-0152"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"HyeongSik Kim","raw_affiliation_strings":["North Carolina State University, Raleigh, USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, USA","institution_ids":["https://openalex.org/I137902535"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062666005","display_name":"Padmashree Ravindra","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Padmashree Ravindra","raw_affiliation_strings":["Microsoft Corporation, Redmond, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft Corporation, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060624981","display_name":"Kemafor Anyanwu","orcid":"https://orcid.org/0000-0002-9528-061X"},"institutions":[{"id":"https://openalex.org/I137902535","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06","country_code":"US","type":"education","lineage":["https://openalex.org/I137902535"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kemafor Anyanwu","raw_affiliation_strings":["North Carolina State University, Raleigh, USA"],"affiliations":[{"raw_affiliation_string":"North Carolina State University, Raleigh, USA","institution_ids":["https://openalex.org/I137902535"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5032645513"],"corresponding_institution_ids":["https://openalex.org/I137902535"],"apc_list":null,"apc_paid":null,"fwci":0.195,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.64808308,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":"4","issue":null,"first_page":"193","last_page":"202"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8429821133613586},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7237457633018494},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.6402640342712402},{"id":"https://openalex.org/keywords/knowledge-graph","display_name":"Knowledge graph","score":0.5328624248504639},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.42809635400772095},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.34814804792404175},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.25086796283721924}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8429821133613586},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7237457633018494},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.6402640342712402},{"id":"https://openalex.org/C2987255567","wikidata":"https://www.wikidata.org/wiki/Q33002955","display_name":"Knowledge graph","level":2,"score":0.5328624248504639},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.42809635400772095},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.34814804792404175},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.25086796283721924}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata.2017.8257927","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2017.8257927","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6000000238418579,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320310013","display_name":"North Carolina State University","ror":"https://ror.org/04tj63d06"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W60117112","https://openalex.org/W102708294","https://openalex.org/W1561490215","https://openalex.org/W1810256132","https://openalex.org/W1964903741","https://openalex.org/W1982177147","https://openalex.org/W1987822482","https://openalex.org/W1989009626","https://openalex.org/W2036959307","https://openalex.org/W2102440263","https://openalex.org/W2124564928","https://openalex.org/W2140613126","https://openalex.org/W2154139219","https://openalex.org/W2171539317","https://openalex.org/W2247735372","https://openalex.org/W2250093878","https://openalex.org/W2280869227","https://openalex.org/W2293919922","https://openalex.org/W2507920278","https://openalex.org/W2584112015","https://openalex.org/W2604978036","https://openalex.org/W2751095725","https://openalex.org/W6602443812","https://openalex.org/W6638548207","https://openalex.org/W6659739653","https://openalex.org/W6680805174","https://openalex.org/W6697236245","https://openalex.org/W6732869681"],"related_works":["https://openalex.org/W2389214306","https://openalex.org/W4235240664","https://openalex.org/W2965083567","https://openalex.org/W1838576100","https://openalex.org/W2095886385","https://openalex.org/W2889616422","https://openalex.org/W2089704382","https://openalex.org/W1983399550","https://openalex.org/W97075385","https://openalex.org/W64303689"],"abstract_inverted_index":{"Knowledge":[0],"graphs":[1,34,106,150,187,217],"are":[2,56,120],"graph-based":[3],"data":[4,22,49,66,116,197,245,249,256,284,314,317,325,342],"models":[5,50,67,253,319,340],"which":[6,55,159],"employ":[7],"named":[8],"nodes":[9],"and":[10,17,42,76,132,154,170,323,353],"edges":[11,153],"to":[12,39,59,123,165,206,220,281,305,362],"capture":[13],"differentiation":[14],"among":[15],"entities":[16],"relationships":[18],"in":[19,26,44,115,299,310],"richly":[20],"diverse":[21],"collections":[23,38,101,246],"such":[24,81,94,129,255,320],"as":[25,82,95,107,109,130,321],"the":[27,69,96,178,192,202,209,295,307],"biomedical":[28,97],"domain.":[29],"The":[30,199,268,302],"flexibility":[31],"of":[32,78,102,145,180,191,194,201,212,216,223,226,244,292,297,332],"knowledge":[33,156,186,227,308],"allows":[35],"for":[36,63,91,142,148,185,254,260,315,341],"heterogeneous":[37],"be":[40,166],"linked":[41],"integrated":[43],"precise":[45],"ways.":[46],"However,":[47,134],"resulting":[48],"often":[51,160],"have":[52,87,99,140],"irregular":[53],"structures":[54],"not":[57],"easy":[58],"manage":[60],"using":[61],"platforms":[62,128,139],"structured,":[64],"schema-first":[65],"like":[68],"relational":[70],"model.":[71],"To":[72,112],"facilitate":[73],"exchange,":[74],"inter-operability":[75],"reuse":[77],"data,":[79],"standards":[80],"Resource":[83],"Description":[84],"Framework":[85],"(RDF)":[86],"been":[88],"increasingly":[89],"adopted":[90],"representation.":[92],"Domains":[93],"now":[98],"large":[100],"publicly":[103],"available":[104],"RDF":[105,196],"well":[108],"benchmark":[110,355],"workloads.":[111],"achieve":[113],"scalability":[114,169],"processing,":[117,158],"some":[118,136,190],"efforts":[119],"being":[121],"made":[122],"build":[124],"on":[125,287,351],"distributed":[126,137],"processing":[127],"Hadoop":[131],"Spark.":[133],"while":[135,218],"graph":[138,157],"emerged":[141],"certain":[143],"classes":[144],"mining":[146],"workloads":[147],"non-semantic":[149],"(without":[151],"typed":[152],"nodes),":[155],"involves":[161],"ontological":[162],"inferencing,":[163],"continues":[164],"plagued":[167],"by":[168],"efficiency":[171],"challenges.":[172],"In":[173],"this":[174],"paper,":[175],"we":[176],"present":[177],"design":[179,203],"a":[181,233,276],"Hadoop-based":[182,234],"storage":[183,243,252,300,318,339],"architecture":[184],"that":[188,240,312,335,358],"overcomes":[189],"challenges":[193],"big":[195],"processing.":[198],"rationale":[200],"strategy":[204],"is":[205,232,272,294,304,334,360],"go":[207],"beyond":[208],"traditional":[210,264],"approach":[211],"exploiting":[213],"structural":[214],"properties":[215,225],"storing":[219],"include":[221],"exploitation":[222],"semantic":[224],"graphs.":[228],"Our":[229],"system":[230],"SemStorm":[231,293,333,359],"indexed,":[235],"polymorphic,":[236],"signatured":[237],"file":[238,270,279],"organization":[239,271],"supports":[241],"efficient":[242],"with":[247,275],"significant":[248],"heterogeneity.":[250],"Naive":[251],"place":[257],"more":[258],"demands":[259],"meta-data":[261],"management":[262],"than":[263,365],"systems":[265],"can":[266],"support.":[267],"polymorphic":[269],"further":[273],"coupled":[274],"nested,":[277],"column-oriented":[278],"format":[280],"enable":[282],"discriminatory":[283],"access":[285],"based":[286],"queries.":[288],"A":[289],"major":[290,330],"hallmark":[291],"enabling":[296],"semantic-awareness":[298],"framework.":[301],"idea":[303],"exploit":[306],"represented":[309],"ontologies":[311],"accompany":[313],"optimizing":[316],"identifying":[322],"managing":[324],"(sometimes":[326],"implicit)":[327],"redundancies.":[328],"Another":[329],"advantage":[331],"it":[336],"derives":[337],"optimized":[338],"autonomically,":[343],"i.e.,":[344],"without":[345],"user":[346],"input.":[347],"Extensive":[348],"experiments":[349],"conducted":[350],"real-world":[352],"synthetic":[354],"datasets":[356],"show":[357],"up":[361],"10X":[363],"faster":[364],"existing":[366],"approaches.":[367]},"counts_by_year":[{"year":2021,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
