{"id":"https://openalex.org/W2049954235","doi":"https://doi.org/10.1109/icde.2013.6544911","title":"SASH: Enabling continuous incremental analytic workflows on Hadoop","display_name":"SASH: Enabling continuous incremental analytic workflows on Hadoop","publication_year":2013,"publication_date":"2013-04-01","ids":{"openalex":"https://openalex.org/W2049954235","doi":"https://doi.org/10.1109/icde.2013.6544911","mag":"2049954235"},"language":"en","primary_location":{"id":"doi:10.1109/icde.2013.6544911","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icde.2013.6544911","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE 29th International Conference on Data Engineering (ICDE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110047220","display_name":"Manish Sethi","orcid":null},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]},{"id":"https://openalex.org/I4210103279","display_name":"IBM Research - India","ror":"https://ror.org/014wt7r80","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210103279","https://openalex.org/I4210114115"]}],"countries":["IN","US"],"is_corresponding":true,"raw_author_name":"M. Sethi","raw_affiliation_strings":["IBM India Research Laboratory, Bangalore, India","[IBM India Res. Lab., Bangalore, India]"],"affiliations":[{"raw_affiliation_string":"IBM India Research Laboratory, Bangalore, India","institution_ids":["https://openalex.org/I4210103279"]},{"raw_affiliation_string":"[IBM India Res. Lab., Bangalore, India]","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046918342","display_name":"Narendran Sachindran","orcid":null},"institutions":[{"id":"https://openalex.org/I4210103279","display_name":"IBM Research - India","ror":"https://ror.org/014wt7r80","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210103279","https://openalex.org/I4210114115"]},{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["IN","US"],"is_corresponding":false,"raw_author_name":"N. Sachindran","raw_affiliation_strings":["IBM India Research Laboratory, Bangalore, India","[IBM India Res. Lab., Bangalore, India]"],"affiliations":[{"raw_affiliation_string":"IBM India Research Laboratory, Bangalore, India","institution_ids":["https://openalex.org/I4210103279"]},{"raw_affiliation_string":"[IBM India Res. Lab., Bangalore, India]","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015609009","display_name":"S. V. Raghavan","orcid":"https://orcid.org/0009-0001-0283-0310"},"institutions":[{"id":"https://openalex.org/I4210103279","display_name":"IBM Research - India","ror":"https://ror.org/014wt7r80","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210103279","https://openalex.org/I4210114115"]},{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["IN","US"],"is_corresponding":false,"raw_author_name":"S. Raghavan","raw_affiliation_strings":["IBM India Research Laboratory, Bangalore, India","[IBM India Res. Lab., Bangalore, India]"],"affiliations":[{"raw_affiliation_string":"IBM India Research Laboratory, Bangalore, India","institution_ids":["https://openalex.org/I4210103279"]},{"raw_affiliation_string":"[IBM India Res. Lab., Bangalore, India]","institution_ids":["https://openalex.org/I1341412227"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110047220"],"corresponding_institution_ids":["https://openalex.org/I1341412227","https://openalex.org/I4210103279"],"apc_list":null,"apc_paid":null,"fwci":2.4268,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.91066966,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"32","issue":null,"first_page":"1219","last_page":"1230"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8379176259040833},{"id":"https://openalex.org/keywords/nosql","display_name":"NoSQL","score":0.8086296916007996},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.7942301034927368},{"id":"https://openalex.org/keywords/analytics","display_name":"Analytics","score":0.6704365611076355},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6378804445266724},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.5645564198493958},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.5181506872177124},{"id":"https://openalex.org/keywords/intranet","display_name":"Intranet","score":0.48519232869148254},{"id":"https://openalex.org/keywords/stream-processing","display_name":"Stream processing","score":0.47167855501174927},{"id":"https://openalex.org/keywords/ibm","display_name":"IBM","score":0.4502432346343994},{"id":"https://openalex.org/keywords/workload","display_name":"Workload","score":0.42306041717529297},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3571041226387024},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2655664086341858},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.10405999422073364}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8379176259040833},{"id":"https://openalex.org/C2779599972","wikidata":"https://www.wikidata.org/wiki/Q82231","display_name":"NoSQL","level":3,"score":0.8086296916007996},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.7942301034927368},{"id":"https://openalex.org/C79158427","wikidata":"https://www.wikidata.org/wiki/Q485396","display_name":"Analytics","level":2,"score":0.6704365611076355},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6378804445266724},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.5645564198493958},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.5181506872177124},{"id":"https://openalex.org/C2778059363","wikidata":"https://www.wikidata.org/wiki/Q483426","display_name":"Intranet","level":3,"score":0.48519232869148254},{"id":"https://openalex.org/C107027933","wikidata":"https://www.wikidata.org/wiki/Q2006448","display_name":"Stream processing","level":2,"score":0.47167855501174927},{"id":"https://openalex.org/C70388272","wikidata":"https://www.wikidata.org/wiki/Q5968558","display_name":"IBM","level":2,"score":0.4502432346343994},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.42306041717529297},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3571041226387024},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2655664086341858},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.10405999422073364},{"id":"https://openalex.org/C171250308","wikidata":"https://www.wikidata.org/wiki/Q11468","display_name":"Nanotechnology","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icde.2013.6544911","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icde.2013.6544911","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE 29th International Conference on Data Engineering (ICDE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5400000214576721,"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W10197252","https://openalex.org/W1575324001","https://openalex.org/W1795645138","https://openalex.org/W1845494277","https://openalex.org/W1981420413","https://openalex.org/W1998477918","https://openalex.org/W2010929544","https://openalex.org/W2013373704","https://openalex.org/W2033565095","https://openalex.org/W2098935637","https://openalex.org/W2102458936","https://openalex.org/W2110367654","https://openalex.org/W2116440993","https://openalex.org/W2135927143","https://openalex.org/W2144002928","https://openalex.org/W2146635036","https://openalex.org/W2206204485","https://openalex.org/W2262278669","https://openalex.org/W6638819420","https://openalex.org/W6688217013","https://openalex.org/W6692986867"],"related_works":["https://openalex.org/W2374107376","https://openalex.org/W4241047679","https://openalex.org/W2799973158","https://openalex.org/W562045822","https://openalex.org/W2419153746","https://openalex.org/W3089119258","https://openalex.org/W4230978433","https://openalex.org/W2893963003","https://openalex.org/W2920657135","https://openalex.org/W2953080867"],"abstract_inverted_index":{"There":[0],"is":[1,101],"an":[2,91,102],"emerging":[3],"class":[4],"of":[5,27,76,114,147,159,183],"enterprise":[6],"applications":[7,33],"in":[8,186],"areas":[9],"such":[10,115],"as":[11],"log":[12],"data":[13,58,62],"analysis,":[14],"information":[15],"discovery,":[16],"and":[17,29,44,136,178],"social":[18],"media":[19],"marketing":[20],"that":[21,90,110,153,172],"involve":[22],"analytics":[23,37,103,151],"over":[24],"large":[25],"volumes":[26],"unstructured":[28],"semi-structured":[30],"data.":[31],"These":[32],"are":[34],"leveraging":[35],"new":[36],"platforms":[38],"based":[39],"on":[40,56,157],"the":[41,74,112,145,166],"MapReduce":[42],"framework":[43],"its":[45],"open":[46],"source":[47],"Hadoop":[48],"implementation.":[49],"While":[50],"this":[51,86],"trend":[52],"has":[53,68],"engendered":[54],"work":[55],"high-level":[57],"analysis":[59],"languages,":[60],"NoSQL":[61],"stores,":[63],"workflow":[64,171],"engines":[65],"etc.,":[66],"there":[67],"been":[69],"very":[70],"little":[71],"attention":[72],"to":[73,161],"challenges":[75],"deploying":[77],"analytic":[78,99],"workflows":[79,100],"into":[80],"production":[81,98,170],"for":[82,95,126,139],"continuous":[83,97],"operation.":[84],"In":[85],"paper,":[87],"we":[88,154,180],"argue":[89],"essential":[92],"platform":[93],"component":[94],"enabling":[96],"store.":[104],"We":[105,143],"highlight":[106],"five":[107],"key":[108],"requirements":[109],"impact":[111],"design":[113,146],"a":[116,149,169],"store:":[117],"(i)":[118],"efficient":[119],"incremental":[120,134],"operations,":[121],"(ii)":[122],"flexible":[123],"storage":[124],"model":[125],"hierarchical":[127],"data,":[128],"(iii)":[129],"snapshot":[130],"support":[131,138],"(iv)":[132],"object-level":[133],"updates,":[135],"(v)":[137],"handling":[140],"change":[141],"sets.":[142],"describe":[144],"SASH,":[148],"scalable":[150],"store":[152],"have":[155],"developed":[156],"top":[158],"HBase":[160],"address":[162],"these":[163],"requirements.":[164],"Using":[165],"workload":[167],"from":[168],"powers":[173],"search":[174],"within":[175],"IBM's":[176],"intranet":[177],"extranet,":[179],"demonstrate":[181],"orders":[182],"magnitude":[184],"improvement":[185],"IO":[187],"performance":[188],"using":[189],"SASH.":[190]},"counts_by_year":[{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
