{"id":"https://openalex.org/W1994212309","doi":"https://doi.org/10.1145/1458432.1458442","title":"Estimating and bounding aggregations in databases with referential integrity errors","display_name":"Estimating and bounding aggregations in databases with referential integrity errors","publication_year":2008,"publication_date":"2008-10-30","ids":{"openalex":"https://openalex.org/W1994212309","doi":"https://doi.org/10.1145/1458432.1458442","mag":"1994212309"},"language":"en","primary_location":{"id":"doi:10.1145/1458432.1458442","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1458432.1458442","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM 11th international workshop on Data warehousing and OLAP","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038679061","display_name":"Javier Garc\u0131\u0301a-Garc\u0131\u0301a","orcid":"https://orcid.org/0000-0001-9539-2606"},"institutions":[{"id":"https://openalex.org/I8961855","display_name":"Universidad Nacional Aut\u00f3noma de M\u00e9xico","ror":"https://ror.org/01tmp8f25","country_code":"MX","type":"education","lineage":["https://openalex.org/I8961855"]}],"countries":["MX"],"is_corresponding":true,"raw_author_name":"Javier Garc\u00eda-Garc\u00eda","raw_affiliation_strings":["Universidad Nacional Aut\u00f3noma de M\u00e9xico, Mexico City, Mexico"],"affiliations":[{"raw_affiliation_string":"Universidad Nacional Aut\u00f3noma de M\u00e9xico, Mexico City, Mexico","institution_ids":["https://openalex.org/I8961855"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031610238","display_name":"Carlos Ordo\u0144\u1ebdz","orcid":"https://orcid.org/0009-0005-1135-9726"},"institutions":[{"id":"https://openalex.org/I44461941","display_name":"University of Houston","ror":"https://ror.org/048sx0r50","country_code":"US","type":"education","lineage":["https://openalex.org/I44461941"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Carlos Ordonez","raw_affiliation_strings":["University of Houston, Houston, TX, USA"],"affiliations":[{"raw_affiliation_string":"University of Houston, Houston, TX, USA","institution_ids":["https://openalex.org/I44461941"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5038679061"],"corresponding_institution_ids":["https://openalex.org/I8961855"],"apc_list":null,"apc_paid":null,"fwci":0.7332,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.74377004,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"49","last_page":"56"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/data-integrity","display_name":"Data integrity","score":0.8043897151947021},{"id":"https://openalex.org/keywords/tuple","display_name":"Tuple","score":0.7739893794059753},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7681803703308105},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.6979841589927673},{"id":"https://openalex.org/keywords/online-analytical-processing","display_name":"Online analytical processing","score":0.6227015852928162},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.5787644386291504},{"id":"https://openalex.org/keywords/aggregate","display_name":"Aggregate (composite)","score":0.5439706444740295},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5218400359153748},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.49267250299453735},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.48351576924324036},{"id":"https://openalex.org/keywords/data-warehouse","display_name":"Data warehouse","score":0.46780824661254883},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1108563244342804},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.10885092616081238}],"concepts":[{"id":"https://openalex.org/C33762810","wikidata":"https://www.wikidata.org/wiki/Q461671","display_name":"Data integrity","level":2,"score":0.8043897151947021},{"id":"https://openalex.org/C118930307","wikidata":"https://www.wikidata.org/wiki/Q600590","display_name":"Tuple","level":2,"score":0.7739893794059753},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7681803703308105},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.6979841589927673},{"id":"https://openalex.org/C201932085","wikidata":"https://www.wikidata.org/wiki/Q642514","display_name":"Online analytical processing","level":3,"score":0.6227015852928162},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.5787644386291504},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.5439706444740295},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5218400359153748},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.49267250299453735},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.48351576924324036},{"id":"https://openalex.org/C135572916","wikidata":"https://www.wikidata.org/wiki/Q193351","display_name":"Data warehouse","level":2,"score":0.46780824661254883},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1108563244342804},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.10885092616081238},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1458432.1458442","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1458432.1458442","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the ACM 11th international workshop on Data warehousing and OLAP","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.5099999904632568,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W1593468624","https://openalex.org/W1968461475","https://openalex.org/W1972933296","https://openalex.org/W2016704849","https://openalex.org/W2045054164","https://openalex.org/W2045630074","https://openalex.org/W2062796915","https://openalex.org/W2098333994","https://openalex.org/W2108658789","https://openalex.org/W2134516133","https://openalex.org/W2140151132","https://openalex.org/W2146581901","https://openalex.org/W2616737215"],"related_works":["https://openalex.org/W2378213774","https://openalex.org/W2357522326","https://openalex.org/W2363019959","https://openalex.org/W6138692","https://openalex.org/W1535822977","https://openalex.org/W23190051","https://openalex.org/W2367419170","https://openalex.org/W2377387014","https://openalex.org/W2382180329","https://openalex.org/W2375394542"],"abstract_inverted_index":{"Database":[0],"integration":[1],"builds":[2],"on":[3,140],"tables":[4,45,83,90,96,135],"coming":[5],"from":[6,218],"multiple":[7],"databases":[8,28,142],"by":[9,76,195],"creating":[10],"a":[11,35,53,114,171,207,224],"single":[12],"view":[13],"of":[14,64,178],"all":[15],"these":[16],"data.":[17],"Each":[18],"database":[19,40,225],"has":[20],"different":[21,30],"tables,":[22],"columns":[23,47],"with":[24,48,91,105,136,192],"similar":[25],"content":[26],"across":[27],"and":[29,46,99],"referential":[31,49,66,92,137,227],"integrity":[32,50,67,138,228],"constraints.":[33,229],"Thus,":[34],"query":[36],"in":[37,69,80,113,127,148,183,221],"an":[38,106,165,202],"integrated":[39],"is":[41,73,154,181,187],"likely":[42],"to":[43,85,87,143,158,189],"involve":[44],"errors.":[51,93],"In":[52],"data":[54],"warehouse":[55],"environment,":[56],"even":[57],"though":[58],"the":[59,65,81,88,103,149,162,199],"ETL":[60],"processes":[61],"take":[62],"care":[63],"errors,":[68],"many":[70],"scenarios":[71],"this":[72],"generally":[74],"done":[75],"including":[77],"'dummy'":[78],"records":[79],"dimension":[82],"used":[84],"relate":[86],"fact":[89],"When":[94],"two":[95],"are":[97,101,111,216],"joined,":[98],"aggregations":[100],"computed,":[102],"tuples":[104,191],"undefined":[107,118],"foreign":[108],"key":[109],"value":[110],"aggregated":[112],"group":[115],"marked":[116],"as":[117],"effectively":[119],"discarding":[120],"potentially":[121],"valuable":[122],"information.":[123],"With":[124],"that":[125,151,164,182,201],"motivation":[126],"mind,":[128],"we":[129],"extend":[130],"aggregate":[131,219],"functions":[132],"computed":[133],"over":[134],"errors":[139],"OLAP":[141],"return":[144],"complete":[145],"answer":[146,214],"sets":[147,215],"sense":[150],"no":[152],"tuple":[153],"excluded.":[155],"We":[156],"associate":[157],"each":[159],"valid":[160],"reference,":[161],"probability":[163,200],"invalid":[166,193,203],"reference":[167,204],"may":[168],"actually":[169,205],"be":[170,206],"certain":[172,184,208],"correct":[173,209],"reference.":[174,210],"The":[175],"main":[176],"idea":[177],"our":[179],"work":[180],"contexts,":[185],"it":[186],"possible":[188],"use":[190],"references":[194],"taking":[196],"into":[197],"account":[198],"This":[211],"way,":[212],"improved":[213],"obtained":[217],"queries":[220],"settings":[222],"where":[223],"violates":[226]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
