{"id":"https://openalex.org/W1989215876","doi":"https://doi.org/10.1145/2737817.2737829","title":"Exploring Big Data with Helix","display_name":"Exploring Big Data with Helix","publication_year":2015,"publication_date":"2015-02-18","ids":{"openalex":"https://openalex.org/W1989215876","doi":"https://doi.org/10.1145/2737817.2737829","mag":"1989215876"},"language":"en","primary_location":{"id":"doi:10.1145/2737817.2737829","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2737817.2737829","pdf_url":null,"source":{"id":"https://openalex.org/S47508943","display_name":"ACM SIGMOD Record","issn_l":"0163-5808","issn":["0163-5808","1943-5835"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGMOD Record","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038223145","display_name":"Jason Ellis","orcid":null},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Jason Ellis","raw_affiliation_strings":["IBM Research","IBM Research, -"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research","institution_ids":[]},{"raw_affiliation_string":"IBM Research, -","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062643837","display_name":"Achille Fokoue","orcid":"https://orcid.org/0000-0003-1137-1344"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Achille Fokoue","raw_affiliation_strings":["IBM Research","IBM Research, -"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research","institution_ids":[]},{"raw_affiliation_string":"IBM Research, -","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068065546","display_name":"Oktie Hassanzadeh","orcid":"https://orcid.org/0000-0001-5307-9857"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Oktie Hassanzadeh","raw_affiliation_strings":["IBM Research","IBM Research, -"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research","institution_ids":[]},{"raw_affiliation_string":"IBM Research, -","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014087838","display_name":"Anastasios Kementsietsidis","orcid":null},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anastasios Kementsietsidis","raw_affiliation_strings":["IBM Research","IBM Research, -"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research","institution_ids":[]},{"raw_affiliation_string":"IBM Research, -","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085594669","display_name":"Kavitha Srinivas","orcid":"https://orcid.org/0000-0003-4610-967X"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kavitha Srinivas","raw_affiliation_strings":["IBM Research","IBM Research, -"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research","institution_ids":[]},{"raw_affiliation_string":"IBM Research, -","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057715845","display_name":"Michael J. Ward","orcid":"https://orcid.org/0000-0002-4561-2946"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael J. Ward","raw_affiliation_strings":["IBM Research","IBM Research, -"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research","institution_ids":[]},{"raw_affiliation_string":"IBM Research, -","institution_ids":["https://openalex.org/I1341412227"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5038223145"],"corresponding_institution_ids":["https://openalex.org/I1341412227"],"apc_list":null,"apc_paid":null,"fwci":3.2924,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.9196742,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"43","issue":"4","first_page":"43","last_page":"54"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8694092631340027},{"id":"https://openalex.org/keywords/rdf","display_name":"RDF","score":0.6327911019325256},{"id":"https://openalex.org/keywords/xml","display_name":"XML","score":0.593082070350647},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.5641458630561829},{"id":"https://openalex.org/keywords/semi-structured-data","display_name":"Semi-structured data","score":0.5267103314399719},{"id":"https://openalex.org/keywords/relational-database","display_name":"Relational database","score":0.5139521956443787},{"id":"https://openalex.org/keywords/schema","display_name":"Schema (genetic algorithms)","score":0.4650847315788269},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.45010727643966675},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.43546026945114136},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.42921045422554016},{"id":"https://openalex.org/keywords/linked-data","display_name":"Linked data","score":0.42509543895721436},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.42040300369262695},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.41452500224113464},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.2534160017967224},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.1371903419494629}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8694092631340027},{"id":"https://openalex.org/C147497476","wikidata":"https://www.wikidata.org/wiki/Q54872","display_name":"RDF","level":3,"score":0.6327911019325256},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.593082070350647},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.5641458630561829},{"id":"https://openalex.org/C40077939","wikidata":"https://www.wikidata.org/wiki/Q2336004","display_name":"Semi-structured data","level":3,"score":0.5267103314399719},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.5139521956443787},{"id":"https://openalex.org/C52146309","wikidata":"https://www.wikidata.org/wiki/Q7431116","display_name":"Schema (genetic algorithms)","level":2,"score":0.4650847315788269},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.45010727643966675},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.43546026945114136},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.42921045422554016},{"id":"https://openalex.org/C69075417","wikidata":"https://www.wikidata.org/wiki/Q515701","display_name":"Linked data","level":3,"score":0.42509543895721436},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.42040300369262695},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.41452500224113464},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2534160017967224},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.1371903419494629}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2737817.2737829","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2737817.2737829","pdf_url":null,"source":{"id":"https://openalex.org/S47508943","display_name":"ACM SIGMOD Record","issn_l":"0163-5808","issn":["0163-5808","1943-5835"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGMOD Record","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4399999976158142,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W20290297","https://openalex.org/W180847788","https://openalex.org/W195679761","https://openalex.org/W1426690399","https://openalex.org/W1981578383","https://openalex.org/W1988674507","https://openalex.org/W1998282059","https://openalex.org/W2008896880","https://openalex.org/W2012833704","https://openalex.org/W2028716971","https://openalex.org/W2029554959","https://openalex.org/W2031250218","https://openalex.org/W2036260704","https://openalex.org/W2037802158","https://openalex.org/W2093189534","https://openalex.org/W2098179152","https://openalex.org/W2116391761","https://openalex.org/W2122483056","https://openalex.org/W2124391840","https://openalex.org/W2130865062","https://openalex.org/W2132069633","https://openalex.org/W2148524305","https://openalex.org/W2156580346","https://openalex.org/W2168846860","https://openalex.org/W2171244245","https://openalex.org/W2295108729","https://openalex.org/W2399597710","https://openalex.org/W6679663036"],"related_works":["https://openalex.org/W2283287182","https://openalex.org/W1485690712","https://openalex.org/W82112649","https://openalex.org/W2058923328","https://openalex.org/W2776293731","https://openalex.org/W2610919777","https://openalex.org/W2965230088","https://openalex.org/W4293389049","https://openalex.org/W1534806717","https://openalex.org/W1977140384"],"abstract_inverted_index":{"While":[0],"much":[1],"work":[2,12],"has":[3],"focused":[4],"on":[5],"efficient":[6],"processing":[7],"of":[8,29,37,70,75,114],"Big":[9,30],"Data,":[10],"little":[11],"considers":[13],"how":[14],"to":[15,51],"understand":[16],"them.":[17],"In":[18],"this":[19],"paper,":[20],"we":[21],"describe":[22],"Helix,":[23,109],"a":[24,34,68,97,112],"system":[25],"for":[26],"guided":[27],"exploration":[28],"Data.":[31],"Helix":[32,60],"provides":[33],"unified":[35],"view":[36],"sources,":[38],"ranging":[39],"from":[40],"spreadsheets":[41],"and":[42,54,73,89,93,118],"XML":[43],"files":[44],"with":[45,57,111],"no":[46],"schema,":[47],"all":[48],"the":[49,83,100,103,119],"way":[50],"RDF":[52],"graphs":[53],"relational":[55],"data":[56,65,88],"well-defined":[58],"schemas.":[59],"users":[61],"explore":[62],"these":[63],"heterogeneous":[64],"sources":[66],"through":[67],"combination":[69],"keyword":[71],"searches":[72],"navigation":[74],"linked":[76],"web":[77],"pages":[78],"that":[79],"include":[80],"information":[81],"about":[82],"schemas,":[84],"as":[85,87],"well":[86],"semantic":[90],"links":[91],"within":[92],"across":[94],"sources.":[95],"At":[96],"technical":[98],"level,":[99],"paper":[101],"describes":[102],"research":[104],"challenges":[105],"involved":[106],"in":[107],"developing":[108],"along":[110],"set":[113],"real-world":[115],"usage":[116],"scenarios":[117],"lessons":[120],"learned.":[121]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":1}],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
