{"id":"https://openalex.org/W2112129552","doi":"https://doi.org/10.14778/1920841.1920944","title":"On multi-column foreign key discovery","display_name":"On multi-column foreign key discovery","publication_year":2010,"publication_date":"2010-09-01","ids":{"openalex":"https://openalex.org/W2112129552","doi":"https://doi.org/10.14778/1920841.1920944","mag":"2112129552"},"language":"en","primary_location":{"id":"doi:10.14778/1920841.1920944","is_oa":false,"landing_page_url":"https://doi.org/10.14778/1920841.1920944","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086550982","display_name":"Meihui Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Meihui Zhang","raw_affiliation_strings":["National University of Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National University of Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058831095","display_name":"Marios Hadjieleftheriou","orcid":null},"institutions":[{"id":"https://openalex.org/I1283103587","display_name":"AT&T (United States)","ror":"https://ror.org/02bbd5539","country_code":"US","type":"company","lineage":["https://openalex.org/I1283103587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Marios Hadjieleftheriou","raw_affiliation_strings":["AT&amp;T Labs - Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AT&amp;T Labs - Research","institution_ids":["https://openalex.org/I1283103587"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024892041","display_name":"Beng Chin Ooi","orcid":"https://orcid.org/0000-0003-4446-1100"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Beng Chin Ooi","raw_affiliation_strings":["National University of Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National University of Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071763795","display_name":"Cecilia M. Procopiuc","orcid":null},"institutions":[{"id":"https://openalex.org/I1283103587","display_name":"AT&T (United States)","ror":"https://ror.org/02bbd5539","country_code":"US","type":"company","lineage":["https://openalex.org/I1283103587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Cecilia M. Procopiuc","raw_affiliation_strings":["AT&amp;T Labs - Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AT&amp;T Labs - Research","institution_ids":["https://openalex.org/I1283103587"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088315797","display_name":"Divesh Srivastava","orcid":"https://orcid.org/0000-0002-7609-9217"},"institutions":[{"id":"https://openalex.org/I1283103587","display_name":"AT&T (United States)","ror":"https://ror.org/02bbd5539","country_code":"US","type":"company","lineage":["https://openalex.org/I1283103587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Divesh Srivastava","raw_affiliation_strings":["AT&amp;T Labs - Research"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AT&amp;T Labs - Research","institution_ids":["https://openalex.org/I1283103587"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":6.0222,"has_fulltext":false,"cited_by_count":89,"citation_normalized_percentile":{"value":0.96078,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"3","issue":"1-2","first_page":"805","last_page":"814"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/column","display_name":"Column (typography)","score":0.8477252721786499},{"id":"https://openalex.org/keywords/randomness","display_name":"Randomness","score":0.8194782137870789},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7523515224456787},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.6916316151618958},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.6653279662132263},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5991407036781311},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.4608859717845917},{"id":"https://openalex.org/keywords/relational-database","display_name":"Relational database","score":0.4428223967552185},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.36643186211586},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1646409034729004},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1484522521495819},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.060627371072769165},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.05976611375808716}],"concepts":[{"id":"https://openalex.org/C2780551164","wikidata":"https://www.wikidata.org/wiki/Q2306599","display_name":"Column (typography)","level":3,"score":0.8477252721786499},{"id":"https://openalex.org/C125112378","wikidata":"https://www.wikidata.org/wiki/Q176640","display_name":"Randomness","level":2,"score":0.8194782137870789},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7523515224456787},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.6916316151618958},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.6653279662132263},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5991407036781311},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.4608859717845917},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.4428223967552185},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.36643186211586},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1646409034729004},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1484522521495819},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.060627371072769165},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.05976611375808716},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.14778/1920841.1920944","is_oa":false,"landing_page_url":"https://doi.org/10.14778/1920841.1920944","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},{"id":"pmh:oai:scholarbank.nus.edu.sg:10635/39479","is_oa":false,"landing_page_url":"http://scholarbank.nus.edu.sg/handle/10635/39479","pdf_url":null,"source":{"id":"https://openalex.org/S7407052290","display_name":"National University of Singapore","issn_l":null,"issn":[],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Scopus","raw_type":"Article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.174.438","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.174.438","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.comp.nus.edu.sg/%7Evldb2010/proceedings/files/papers/R72.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.222.7732","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.222.7732","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.comp.nus.edu.sg/%7Ecospace/pub/vldb10-pkfk.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.8100000023841858,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1964312191","https://openalex.org/W1972848834","https://openalex.org/W1984566373","https://openalex.org/W1992363839","https://openalex.org/W1994945255","https://openalex.org/W2002664886","https://openalex.org/W2042389627","https://openalex.org/W2094407133","https://openalex.org/W2096461223","https://openalex.org/W2099725016","https://openalex.org/W2104648049","https://openalex.org/W2112452856","https://openalex.org/W2120587290","https://openalex.org/W2132069633","https://openalex.org/W2140313762","https://openalex.org/W2140523882","https://openalex.org/W2159186077","https://openalex.org/W2168846860","https://openalex.org/W2752885492","https://openalex.org/W3145128584","https://openalex.org/W4285719527","https://openalex.org/W6679663036","https://openalex.org/W7021264618","https://openalex.org/W7029321148"],"related_works":["https://openalex.org/W3034924094","https://openalex.org/W1488708774","https://openalex.org/W3094954546","https://openalex.org/W2981906196","https://openalex.org/W4391100477","https://openalex.org/W4327779705","https://openalex.org/W1513698804","https://openalex.org/W4310560702","https://openalex.org/W2029712093","https://openalex.org/W1590541736"],"abstract_inverted_index":{"A":[0],"foreign/primary":[1],"key":[2,42],"relationship":[3],"between":[4],"relational":[5],"tables":[6],"is":[7,25],"one":[8],"of":[9,100,123],"the":[10,34,48,65,140],"most":[11],"important":[12],"constraints":[13,43],"in":[14,29,47,64],"a":[15,18,26,78,98,113,121],"database.":[16],"From":[17],"data":[19,73],"analysis":[20],"perspective,":[21],"discovering":[22,82,93],"foreign":[23,41,86,95],"keys":[24,96],"crucial":[27],"step":[28],"understanding":[30],"and":[31,84,107,152],"working":[32],"with":[33],"data.":[35,141],"Nevertheless,":[36],"more":[37],"often":[38],"than":[39],"not,":[40],"are":[44,56,62],"not":[45,57],"specified":[46],"data,":[49,66],"for":[50,81,132],"various":[51],"reasons;":[52],"e.g.,":[53],"some":[54],"associations":[55],"known":[58],"to":[59,72],"designers":[60],"but":[61],"inherent":[63],"while":[67],"others":[68],"become":[69],"invalid":[70],"due":[71],"inconsistencies.":[74],"This":[75],"work":[76,89],"proposes":[77],"robust":[79],"algorithm":[80],"single-column":[83,94],"multi-column":[85],"keys.":[87],"Previous":[88],"concentrated":[90],"mostly":[91],"on":[92],"using":[97,135,150],"variety":[99,122],"rules,":[101],"like":[102],"inclusion":[103],"dependencies,":[104],"column":[105],"names,":[106],"minimum/maximum":[108],"values.":[109],"We":[110,126],"first":[111],"propose":[112],"general":[114],"rule,":[115],"termed":[116],"Randomness":[117],",":[118],"that":[119],"subsumes":[120],"other":[124],"rules.":[125],"then":[127],"develop":[128],"efficient":[129],"approximation":[130],"algorithms":[131],"evaluating":[133],"randomness,":[134],"only":[136],"two":[137],"passes":[138],"over":[139],"Finally,":[142],"we":[143],"validate":[144],"our":[145],"approach":[146],"via":[147],"extensive":[148],"experiments":[149],"real":[151],"synthetic":[153],"datasets.":[154]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":8},{"year":2018,"cited_by_count":11},{"year":2017,"cited_by_count":5},{"year":2016,"cited_by_count":7},{"year":2015,"cited_by_count":10},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":7},{"year":2012,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
