{"id":"https://openalex.org/W2585128637","doi":"https://doi.org/10.1109/bigdata.2016.7840949","title":"Visualization and diagnosis of earth science data through Hadoop and Spark","display_name":"Visualization and diagnosis of earth science data through Hadoop and Spark","publication_year":2016,"publication_date":"2016-12-01","ids":{"openalex":"https://openalex.org/W2585128637","doi":"https://doi.org/10.1109/bigdata.2016.7840949","mag":"2585128637"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata.2016.7840949","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2016.7840949","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103531132","display_name":"Shujia Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I2948394018","display_name":"Northrop Grumman (United States)","ror":"https://ror.org/05kewds18","country_code":"US","type":"company","lineage":["https://openalex.org/I2948394018"]},{"id":"https://openalex.org/I1306266525","display_name":"Goddard Space Flight Center","ror":"https://ror.org/0171mag52","country_code":"US","type":"facility","lineage":["https://openalex.org/I1306266525","https://openalex.org/I4210124779"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Shujia Zhou","raw_affiliation_strings":["NASA Goddard Space Flight Center, Greenbelt, MD","Northrop Grumman Information Technology, McLean, VA"],"affiliations":[{"raw_affiliation_string":"NASA Goddard Space Flight Center, Greenbelt, MD","institution_ids":["https://openalex.org/I1306266525"]},{"raw_affiliation_string":"Northrop Grumman Information Technology, McLean, VA","institution_ids":["https://openalex.org/I2948394018"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100717701","display_name":"Xiaowen Li","orcid":"https://orcid.org/0000-0001-8660-3387"},"institutions":[{"id":"https://openalex.org/I1306266525","display_name":"Goddard Space Flight Center","ror":"https://ror.org/0171mag52","country_code":"US","type":"facility","lineage":["https://openalex.org/I1306266525","https://openalex.org/I4210124779"]},{"id":"https://openalex.org/I83909951","display_name":"Morgan State University","ror":"https://ror.org/017d8gk22","country_code":"US","type":"education","lineage":["https://openalex.org/I83909951"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaowen Li","raw_affiliation_strings":["Morgan State University, Baltimore, MD","NASA Goddard Space Flight Center, Greenbelt, MD"],"affiliations":[{"raw_affiliation_string":"Morgan State University, Baltimore, MD","institution_ids":["https://openalex.org/I83909951"]},{"raw_affiliation_string":"NASA Goddard Space Flight Center, Greenbelt, MD","institution_ids":["https://openalex.org/I1306266525"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030005836","display_name":"Toshihisa Matsui","orcid":"https://orcid.org/0000-0001-7581-0268"},"institutions":[{"id":"https://openalex.org/I66946132","display_name":"University of Maryland, College Park","ror":"https://ror.org/047s2c258","country_code":"US","type":"education","lineage":["https://openalex.org/I66946132"]},{"id":"https://openalex.org/I1306266525","display_name":"Goddard Space Flight Center","ror":"https://ror.org/0171mag52","country_code":"US","type":"facility","lineage":["https://openalex.org/I1306266525","https://openalex.org/I4210124779"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Toshihisa Matsui","raw_affiliation_strings":["NASA Goddard Space Flight Center, Greenbelt, MD","University of Maryland, College Park, MD"],"affiliations":[{"raw_affiliation_string":"NASA Goddard Space Flight Center, Greenbelt, MD","institution_ids":["https://openalex.org/I1306266525"]},{"raw_affiliation_string":"University of Maryland, College Park, MD","institution_ids":["https://openalex.org/I66946132"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035325921","display_name":"Wei\u2010Kuo Tao","orcid":"https://orcid.org/0000-0003-0183-0930"},"institutions":[{"id":"https://openalex.org/I1306266525","display_name":"Goddard Space Flight Center","ror":"https://ror.org/0171mag52","country_code":"US","type":"facility","lineage":["https://openalex.org/I1306266525","https://openalex.org/I4210124779"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Weikuo Tao","raw_affiliation_strings":["NASA Goddard Space Flight Center, Greenbelt, MD"],"affiliations":[{"raw_affiliation_string":"NASA Goddard Space Flight Center, Greenbelt, MD","institution_ids":["https://openalex.org/I1306266525"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5103531132"],"corresponding_institution_ids":["https://openalex.org/I1306266525","https://openalex.org/I2948394018"],"apc_list":null,"apc_paid":null,"fwci":3.3175,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.93714296,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"99","issue":null,"first_page":"2974","last_page":"2980"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/terabyte","display_name":"Terabyte","score":0.781783938407898},{"id":"https://openalex.org/keywords/netcdf","display_name":"NetCDF","score":0.7660325765609741},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.764271080493927},{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.7580591440200806},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.704063355922699},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.6021920442581177},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.5360121726989746},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.48551464080810547},{"id":"https://openalex.org/keywords/data-visualization","display_name":"Data visualization","score":0.4655293822288513},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.4536636471748352},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.23728930950164795},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.19889390468597412},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.0813169777393341}],"concepts":[{"id":"https://openalex.org/C199683683","wikidata":"https://www.wikidata.org/wiki/Q8799","display_name":"Terabyte","level":2,"score":0.781783938407898},{"id":"https://openalex.org/C11090531","wikidata":"https://www.wikidata.org/wiki/Q1361922","display_name":"NetCDF","level":2,"score":0.7660325765609741},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.764271080493927},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.7580591440200806},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.704063355922699},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.6021920442581177},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.5360121726989746},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.48551464080810547},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.4655293822288513},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.4536636471748352},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.23728930950164795},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.19889390468597412},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0813169777393341}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata.2016.7840949","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata.2016.7840949","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W26797728","https://openalex.org/W1988203515","https://openalex.org/W2041811270","https://openalex.org/W2110086534","https://openalex.org/W2119738171","https://openalex.org/W2131645490","https://openalex.org/W2189465200","https://openalex.org/W2209882883","https://openalex.org/W2220600462","https://openalex.org/W2298833372","https://openalex.org/W2562482716","https://openalex.org/W2751095725","https://openalex.org/W6679471073","https://openalex.org/W6687322159","https://openalex.org/W6697540089"],"related_works":["https://openalex.org/W2766461310","https://openalex.org/W4247566972","https://openalex.org/W2936171637","https://openalex.org/W1586214342","https://openalex.org/W4388692845","https://openalex.org/W3091344841","https://openalex.org/W2260589296","https://openalex.org/W3202731209","https://openalex.org/W3157828377","https://openalex.org/W3211874991"],"abstract_inverted_index":{"Large":[0],"data":[1,41,83,91,109,134],"(over":[2],"Terabyte)":[3],"are":[4,42,135],"produced":[5],"by":[6,50,105],"ultra":[7],"high-resolution":[8],"Earth":[9,39,81],"science":[10,40,82],"simulations":[11],"with":[12,65],"a":[13,20,75],"long":[14],"period":[15],"of":[16,95,129,143],"time.":[17],"This":[18],"creates":[19],"challenge":[21],"to":[22,97,111,137],"distribute":[23],"and":[24,30,53,60,79,87,107,123,127,139],"analyze":[25],"in":[26,44],"an":[27],"effective,":[28],"efficient,":[29],"scalable":[31],"way.":[32],"One":[33],"key":[34],"reason":[35],"is":[36,47,103],"that":[37,102],"typical":[38],"represented":[43],"NetCDF,":[45],"which":[46],"not":[48],"supported":[49,104],"the":[51,93,141],"popular":[52],"powerful":[54],"Hadoop":[55,86],"Distribute":[56],"File":[57],"System":[58],"(HDFS)":[59],"consequently":[61],"cannot":[62],"be":[63],"analyzed":[64],"tools":[66],"based":[67,84],"on":[68,85],"HDFS.":[69],"In":[70],"this":[71,144],"paper,":[72],"we":[73],"report":[74],"system":[76],"for":[77],"visualizing":[78],"analyzing":[80],"Spark.":[88],"It":[89],"transforms":[90],"from":[92],"format":[94],"NetCDF":[96],"CSV":[98],"(Comma":[99],"Separated":[100],"Value)":[101],"HDFS":[106],"indexes":[108],"appropriately":[110],"save":[112],"storage":[113],"space":[114],"as":[115,117],"well":[116],"manipulate":[118],"flexibly":[119],"through":[120],"HIVE,":[121],"Impala,":[122],"SparkSQL.":[124],"Adaptive":[125],"subsetting":[126],"visualization":[128],"cloud":[130],"resolve":[131],"model":[132],"simulation":[133],"used":[136],"validate":[138],"demonstrate":[140],"features":[142],"system.":[145]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
