{"id":"https://openalex.org/W2962207144","doi":"https://doi.org/10.31577/cai_2019_3_621","title":"Discovering Foreign Keys on Web Tables with the Crowd","display_name":"Discovering Foreign Keys on Web Tables with the Crowd","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2962207144","doi":"https://doi.org/10.31577/cai_2019_3_621","mag":"2962207144"},"language":"en","primary_location":{"id":"doi:10.31577/cai_2019_3_621","is_oa":true,"landing_page_url":"https://doi.org/10.31577/cai_2019_3_621","pdf_url":null,"source":{"id":"https://openalex.org/S4210200093","display_name":"Computing and Informatics","issn_l":"1335-9150","issn":["1335-9150","2585-8807"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computing and Informatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.31577/cai_2019_3_621","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100357651","display_name":"Xiaoyu Wu","orcid":"https://orcid.org/0000-0003-3481-7820"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiaoyu Wu","raw_affiliation_strings":["School of Computer and Information Technology, Beijing Jiaotong University, Beijing 100044"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Beijing Jiaotong University, Beijing 100044","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100387096","display_name":"Ning Wang","orcid":"https://orcid.org/0000-0001-8903-8790"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ning Wang","raw_affiliation_strings":["School of Computer and Information Technology, Beijing Jiaotong University, Beijing 100044"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Beijing Jiaotong University, Beijing 100044","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006435045","display_name":"Huaxi Liu","orcid":"https://orcid.org/0000-0002-8583-3698"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huaxi Liu","raw_affiliation_strings":["School of Computer and Information Technology, Beijing Jiaotong University, Beijing 100044"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Technology, Beijing Jiaotong University, Beijing 100044","institution_ids":["https://openalex.org/I21193070"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100357651"],"corresponding_institution_ids":["https://openalex.org/I21193070"],"apc_list":null,"apc_paid":null,"fwci":0.28,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.64928652,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"38","issue":"3","first_page":"621","last_page":"646"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11598","display_name":"Internet Traffic Analysis and Secure E-voting","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11598","display_name":"Internet Traffic Analysis and Secure E-voting","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11045","display_name":"Privacy, Security, and Data Protection","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.551689088344574},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5418459177017212},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.3778000473976135},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3763052523136139},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3466927409172058}],"concepts":[{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.551689088344574},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5418459177017212},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.3778000473976135},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3763052523136139},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3466927409172058}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.31577/cai_2019_3_621","is_oa":true,"landing_page_url":"https://doi.org/10.31577/cai_2019_3_621","pdf_url":null,"source":{"id":"https://openalex.org/S4210200093","display_name":"Computing and Informatics","issn_l":"1335-9150","issn":["1335-9150","2585-8807"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computing and Informatics","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.31577/cai_2019_3_621","is_oa":true,"landing_page_url":"https://doi.org/10.31577/cai_2019_3_621","pdf_url":null,"source":{"id":"https://openalex.org/S4210200093","display_name":"Computing and Informatics","issn_l":"1335-9150","issn":["1335-9150","2585-8807"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computing and Informatics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.7099999785423279}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2478288626","https://openalex.org/W4391913857","https://openalex.org/W2350741829","https://openalex.org/W2530322880"],"abstract_inverted_index":{"Foreign-key":[0],"relationship":[1,29],"is":[2,30,50,123,150],"one":[3],"of":[4,43,46,88,103,156],"the":[5,101,104,108,132,154,160],"most":[6,133],"important":[7],"constraints":[8],"between":[9],"two":[10],"tables.":[11,40,80],"Previous":[12],"works":[13],"focused":[14],"on":[15,60,78,117,166,182],"detecting":[16],"inclusion":[17,121],"dependencies":[18],"(INDs)":[19],"or":[20],"foreign":[21,54,76,91,178],"keys":[22,55,77,92],"in":[23,38],"relational":[24],"database.":[25],"To":[26,106],"discover":[27,53],"foreign-key":[28],"obviously":[31,176],"helpful":[32],"for":[33],"analyzing":[34],"and":[35,84,120,130,146,169,189],"integrating":[36],"data":[37],"web":[39,47,79,183],"However,":[41],"because":[42],"poor":[44],"quality":[45],"tables,":[48],"it":[49],"difficult":[51],"to":[52,74,136,139,152,159],"by":[56,93],"existing":[57],"techniques":[58],"based":[59,116],"checking":[61],"basic":[62],"integrity":[63],"constraints.":[64],"In":[65],"this":[66],"paper,":[67],"we":[68,96],"propose":[69],"a":[70,111],"hybrid":[71],"human-machine":[72],"framework":[73,174],"detect":[75],"After":[81],"discovering":[82],"candidates":[83,99],"evaluating":[85],"their":[86],"confidence":[87],"being":[89],"true":[90],"machine":[94],"algorithm,":[95],"verify":[97],"those":[98],"leveraging":[100],"power":[102],"crowd.":[105,161],"reduce":[107],"monetary":[109,187],"cost,":[110],"dynamical":[112],"task":[113],"selection":[114],"technique":[115],"conflict":[118],"detection":[119,180],"dependency":[122],"proposed,":[124],"which":[125],"could":[126],"eliminate":[127],"redundant":[128],"tasks":[129,135,143],"assign":[131],"valuable":[134],"workers.":[137],"Additionally,":[138],"make":[140],"workers":[141],"complete":[142],"more":[144],"effectively":[145],"efficiently,":[147],"sampling":[148],"strategy":[149],"applied":[151],"minimize":[153],"number":[155],"tuples":[157],"posed":[158],"We":[162],"conducted":[163],"extensive":[164],"experiments":[165],"real-world":[167],"datasets":[168],"results":[170],"show":[171],"that":[172],"our":[173],"can":[175],"improve":[177],"key":[179],"accuracy":[181],"tables":[184],"with":[185],"lower":[186],"cost":[188],"time":[190],"cost.":[191]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
