{"id":"https://openalex.org/W2874988644","doi":"https://doi.org/10.1145/3219104.3229288","title":"Building Big Data Processing and Visualization Pipeline through Apache Zeppelin","display_name":"Building Big Data Processing and Visualization Pipeline through Apache Zeppelin","publication_year":2018,"publication_date":"2018-07-12","ids":{"openalex":"https://openalex.org/W2874988644","doi":"https://doi.org/10.1145/3219104.3229288","mag":"2874988644"},"language":"en","primary_location":{"id":"doi:10.1145/3219104.3229288","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3219104.3229288","pdf_url":null,"source":{"id":"https://openalex.org/S4306524298","display_name":"Proceedings of the Practice and Experience on Advanced Research Computing","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Practice and Experience on Advanced Research Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017304873","display_name":"Yanzhe Cheng","orcid":null},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yanzhe Cheng","raw_affiliation_strings":["School of Computer Science and Technology, Dalian University of Technology, Dalian, Liaoning Province, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Dalian University of Technology, Dalian, Liaoning Province, China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100453054","display_name":"Fang Liu","orcid":"https://orcid.org/0000-0002-3383-2191"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fang Cherry Liu","raw_affiliation_strings":["Partnership for an Advanced Computing Environment (PACE), Georgia Institute of Technology, Atlanta, GA"],"affiliations":[{"raw_affiliation_string":"Partnership for an Advanced Computing Environment (PACE), Georgia Institute of Technology, Atlanta, GA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068545751","display_name":"Shan Jing","orcid":"https://orcid.org/0000-0003-1763-8417"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shan Jing","raw_affiliation_strings":["School of Chemistry and Biochemistry, Georgia Institute of Technology, Atlanta, GA"],"affiliations":[{"raw_affiliation_string":"School of Chemistry and Biochemistry, Georgia Institute of Technology, Atlanta, GA","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101883722","display_name":"Weijia Xu","orcid":"https://orcid.org/0000-0002-5134-6381"},"institutions":[{"id":"https://openalex.org/I4388891828","display_name":"Texas Advanced Computing Center","ror":"https://ror.org/00xg4bh43","country_code":null,"type":"facility","lineage":["https://openalex.org/I4388891828","https://openalex.org/I86519309"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Weijia Xu","raw_affiliation_strings":["Texas Advanced Computing Center, University of Texas, Austin, TX"],"affiliations":[{"raw_affiliation_string":"Texas Advanced Computing Center, University of Texas, Austin, TX","institution_ids":["https://openalex.org/I4388891828"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020153026","display_name":"Duen Horng Chau","orcid":"https://orcid.org/0000-0001-9824-3323"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Duen Horng Chau","raw_affiliation_strings":["School of Computational Science and Engineering, Georgia Institute of Technology, Atlanta, GA"],"affiliations":[{"raw_affiliation_string":"School of Computational Science and Engineering, Georgia Institute of Technology, Atlanta, GA","institution_ids":["https://openalex.org/I130701444"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5017304873"],"corresponding_institution_ids":["https://openalex.org/I27357992"],"apc_list":null,"apc_paid":null,"fwci":5.105,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.95869205,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.984499990940094,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.984499990940094,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9707000255584717,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9685999751091003,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.7631534934043884},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7247337102890015},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.6960773468017578},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.6904494166374207},{"id":"https://openalex.org/keywords/data-visualization","display_name":"Data visualization","score":0.6117842793464661},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.40764105319976807},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.34162068367004395},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.33098945021629333},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2854664921760559},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.20621821284294128}],"concepts":[{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.7631534934043884},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7247337102890015},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.6960773468017578},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.6904494166374207},{"id":"https://openalex.org/C172367668","wikidata":"https://www.wikidata.org/wiki/Q6504956","display_name":"Data visualization","level":3,"score":0.6117842793464661},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.40764105319976807},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.34162068367004395},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.33098945021629333},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2854664921760559},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.20621821284294128}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3219104.3229288","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3219104.3229288","pdf_url":null,"source":{"id":"https://openalex.org/S4306524298","display_name":"Proceedings of the Practice and Experience on Advanced Research Computing","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Practice and Experience on Advanced Research Computing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.46000000834465027,"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W1499772760","https://openalex.org/W2114353347","https://openalex.org/W2126539515","https://openalex.org/W2135415614","https://openalex.org/W2155461593","https://openalex.org/W2189465200","https://openalex.org/W2912500072","https://openalex.org/W6687322159"],"related_works":["https://openalex.org/W2013728941","https://openalex.org/W4225274103","https://openalex.org/W2579659702","https://openalex.org/W2154046714","https://openalex.org/W1965329638","https://openalex.org/W1574055964","https://openalex.org/W2923661510","https://openalex.org/W2189613078","https://openalex.org/W2586219255","https://openalex.org/W2547096368"],"abstract_inverted_index":{"Big":[0],"data":[1,9,18,20,22,25,39,61,79,104,113,234,239],"analytics":[2,23],"pipeline":[3,115,235],"becomes":[4],"popular":[5],"for":[6,17,95,106,123,219],"large":[7],"volume":[8],"processing,":[10],"Apache":[11],"Zeppelin":[12,92,142,194,227],"provides":[13,196],"an":[14,30,75,129],"integrated":[15],"environment":[16],"ingestion,":[19],"discovery,":[21],"and":[24,27,38,54,68,77,98,191,236,241],"visualization":[26,203,217],"collaboration":[28],"with":[29,87,101,147],"extended":[31],"framework":[32],"which":[33],"allows":[34],"different":[35],"programming":[36,89],"languages":[37,49],"processing":[40,62,114],"back":[41,63],"ends":[42,64],"to":[43,126,140,200,211,231],"be":[44,82,173,187],"plugged":[45],"in.":[46],"The":[47,183],"supported":[48],"include":[50],"Scala,":[51],"Python,":[52],"SQL,":[53],"Shell":[55],"script":[56],"as":[57,59],"well":[58],"big":[60,233],"including":[65],"Hadoop,":[66],"Spark":[67],"Hive.":[69],"With":[70,221],"the":[71,85,112,117,169,177,202,213],"necessary":[72],"tool":[73,139],"sets,":[74],"interactive":[76,99],"dynamic":[78],"analysis":[80,100],"can":[81,153,172,186,228],"done":[83],"on":[84,176],"fly":[86],"heterogeneous":[88],"interfaces.":[90],"Although":[91],"is":[93,120,210],"great":[94],"code":[96,171],"development":[97],"small":[102],"scale":[103],"set":[105,149],"proof-of-concept":[107],"or":[108],"use-case":[109],"presentations,":[110],"running":[111,165],"in":[116,128,132,155],"batch":[118,157],"mode":[119,158],"still":[121],"needed":[122],"performance,":[124],"robustness":[125],"fit":[127],"automated":[130],"workflow":[131,146,185],"some":[133],"cases.":[134],"We":[135],"are":[136],"developing":[137],"a":[138,145,148,156,197],"convert":[141],"notebook":[143],"into":[144],"of":[150,207],"codes":[151],"that":[152,168],"run":[154,192],"through":[159],"command":[160],"line":[161],"interface":[162],"without":[163],"requiring":[164],"Zeppelin,":[166],"so":[167],"prototype":[170],"seamlessly":[174],"deployed":[175],"production":[178],"cluster":[179],"after":[180],"demo":[181],"stage.":[182],"entire":[184],"preserved,":[188],"configured":[189],"manually":[190],"automatically.":[193],"also":[195],"flexible":[198],"way":[199],"integrate":[201],"functionality,":[204],"another":[205],"contribution":[206],"this":[208],"paper":[209],"extend":[212],"Zeppelin's":[214],"existing":[215],"built-in":[216],"component":[218],"D3Network.":[220],"two":[222],"added":[223],"features":[224],"described":[225],"above,":[226],"help":[229],"users":[230],"develop":[232],"visualizing":[237],"graph":[238],"quickly":[240],"efficiently.":[242]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":7},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
