{"id":"https://openalex.org/W4412377066","doi":"https://doi.org/10.1145/3726302.3730296","title":"<scp>nlcTables:</scp> A Dataset for Marrying Natural Language Conditions with Table Discovery","display_name":"<scp>nlcTables:</scp> A Dataset for Marrying Natural Language Conditions with Table Discovery","publication_year":2025,"publication_date":"2025-07-13","ids":{"openalex":"https://openalex.org/W4412377066","doi":"https://doi.org/10.1145/3726302.3730296"},"language":"en","primary_location":{"id":"doi:10.1145/3726302.3730296","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3726302.3730296","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3726302.3730296","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 48th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3726302.3730296","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5108965069","display_name":"Lingxi Cui","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Lingxi Cui","raw_affiliation_strings":["The State Key Laboratory of Blockchain and Data Security, Zhejiang University, Hangzhou, China and Hangzhou High-Tech Zone (Binjiang) Institute of Blockchain and Data Security, Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0002-6314-9104","affiliations":[{"raw_affiliation_string":"The State Key Laboratory of Blockchain and Data Security, Zhejiang University, Hangzhou, China and Hangzhou High-Tech Zone (Binjiang) Institute of Blockchain and Data Security, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100319234","display_name":"Huan Li","orcid":"https://orcid.org/0000-0003-0084-1662"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huan Li","raw_affiliation_strings":["The State Key Laboratory of Blockchain and Data Security, Zhejiang University, Hangzhou, China and Hangzhou High-Tech Zone (Binjiang) Institute of Blockchain and Data Security, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-0084-1662","affiliations":[{"raw_affiliation_string":"The State Key Laboratory of Blockchain and Data Security, Zhejiang University, Hangzhou, China and Hangzhou High-Tech Zone (Binjiang) Institute of Blockchain and Data Security, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100451997","display_name":"Ke Chen","orcid":"https://orcid.org/0000-0002-3062-0900"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ke Chen","raw_affiliation_strings":["The State Key Laboratory of Blockchain and Data Security, Zhejiang University, Hangzhou, China and Hangzhou High-Tech Zone (Binjiang) Institute of Blockchain and Data Security, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-3062-0900","affiliations":[{"raw_affiliation_string":"The State Key Laboratory of Blockchain and Data Security, Zhejiang University, Hangzhou, China and Hangzhou High-Tech Zone (Binjiang) Institute of Blockchain and Data Security, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103017455","display_name":"Lidan Shou","orcid":"https://orcid.org/0000-0001-8062-8356"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lidan Shou","raw_affiliation_strings":["The State Key Laboratory of Blockchain and Data Security, Zhejiang University, Hangzhou, China and Hangzhou High-Tech Zone (Binjiang) Institute of Blockchain and Data Security, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-8062-8356","affiliations":[{"raw_affiliation_string":"The State Key Laboratory of Blockchain and Data Security, Zhejiang University, Hangzhou, China and Hangzhou High-Tech Zone (Binjiang) Institute of Blockchain and Data Security, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100389286","display_name":"Gang Chen","orcid":"https://orcid.org/0000-0002-7483-0045"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gang Chen","raw_affiliation_strings":["The State Key Laboratory of Blockchain and Data Security, Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-7483-0045","affiliations":[{"raw_affiliation_string":"The State Key Laboratory of Blockchain and Data Security, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5108965069"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.07994146,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"3638","last_page":"3647"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9901000261306763,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.7208045125007629},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7050355076789856},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.5731539726257324},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4413870573043823},{"id":"https://openalex.org/keywords/natural","display_name":"Natural (archaeology)","score":0.42326152324676514},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35378068685531616},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.33566147089004517},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.22973495721817017},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.12397173047065735}],"concepts":[{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.7208045125007629},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7050355076789856},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.5731539726257324},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4413870573043823},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.42326152324676514},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35378068685531616},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.33566147089004517},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.22973495721817017},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.12397173047065735},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3726302.3730296","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3726302.3730296","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3726302.3730296","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 48th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3726302.3730296","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3726302.3730296","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3726302.3730296","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 48th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.4300000071525574,"display_name":"Gender equality","id":"https://metadata.un.org/sdg/5"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320338464","display_name":"Natural Science Foundation of Zhejiang Province","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4412377066.pdf","grobid_xml":"https://content.openalex.org/works/W4412377066.grobid-xml"},"referenced_works_count":41,"referenced_works":["https://openalex.org/W1996505782","https://openalex.org/W2092364718","https://openalex.org/W2140116426","https://openalex.org/W2740592503","https://openalex.org/W2788550262","https://openalex.org/W2798664493","https://openalex.org/W2899286282","https://openalex.org/W2948163032","https://openalex.org/W2963469388","https://openalex.org/W3014616325","https://openalex.org/W3016473712","https://openalex.org/W3026889466","https://openalex.org/W3034944976","https://openalex.org/W3037852608","https://openalex.org/W3099839495","https://openalex.org/W3099965312","https://openalex.org/W3102264439","https://openalex.org/W3153032435","https://openalex.org/W3157891451","https://openalex.org/W3161215821","https://openalex.org/W3174637548","https://openalex.org/W4205922070","https://openalex.org/W4221009220","https://openalex.org/W4224951911","https://openalex.org/W4289533971","https://openalex.org/W4289533982","https://openalex.org/W4365456672","https://openalex.org/W4375928372","https://openalex.org/W4379390735","https://openalex.org/W4380433117","https://openalex.org/W4385653220","https://openalex.org/W4385893866","https://openalex.org/W4387332921","https://openalex.org/W4389609672","https://openalex.org/W4399208200","https://openalex.org/W4400528676","https://openalex.org/W4401306679","https://openalex.org/W4403322892","https://openalex.org/W4404181035","https://openalex.org/W4404181101","https://openalex.org/W4414633497"],"related_works":["https://openalex.org/W4394360958","https://openalex.org/W2948670949","https://openalex.org/W4288047943","https://openalex.org/W4394193569","https://openalex.org/W1797990060","https://openalex.org/W4232484699","https://openalex.org/W2473636215","https://openalex.org/W4226226396","https://openalex.org/W3153750606","https://openalex.org/W4308854837"],"abstract_inverted_index":{"With":[0],"the":[1,114],"growing":[2],"abundance":[3],"of":[4,101],"repositories":[5],"containing":[6],"tabular":[7],"data,":[8],"discovering":[9],"relevant":[10],"tables":[11,25],"for":[12,116],"in-depth":[13],"analysis":[14],"remains":[15],"a":[16,28,48,58,78],"challenging":[17,122],"task.Existing":[18],"table":[19,30,52,60,104],"discovery":[20,53,105],"methods":[21,106],"primarily":[22],"retrieve":[23],"desired":[24],"based":[26],"on":[27,107],"query":[29,59],"or":[31],"several":[32],"vague":[33],"keywords,":[34],"leaving":[35],"users":[36,56],"to":[37,66,119,136],"manually":[38],"filter":[39],"large":[40],"result":[41],"sets.To":[42],"address":[43],"this":[44,73,121],"limitation,":[45],"we":[46,75],"propose":[47],"new":[49],"task:":[50],"NL-conditional":[51],"(nlcTD),":[54],"where":[55],"combine":[57],"with":[61],"natural":[62],"language":[63],"(NL)":[64],"requirements":[65],"refine":[67],"search":[68],"results.To":[69],"advance":[70],"research":[71],"in":[72],"area,":[74],"present":[76],"nlcTables,":[77],"comprehensive":[79],"benchmark":[80],"dataset":[81],"comprising":[82],"627":[83],"diverse":[84],"queries":[85],"spanning":[86],"NL-only,":[87],"union,":[88],"join,":[89],"and":[90,96,128],"fuzzy":[91],"conditions,":[92],"22,080":[93],"candidate":[94],"tables,":[95],"21,200":[97],"relevance":[98],"annotations.Our":[99],"evaluation":[100],"six":[102],"state-ofthe-art":[103],"nlcTables":[108],"reveals":[109],"substantial":[110],"performance":[111],"gaps,":[112],"highlighting":[113],"need":[115],"advanced":[117],"techniques":[118],"tackle":[120],"nlcTD":[123],"scenario.The":[124],"dataset,":[125],"construction":[126],"framework,":[127],"baseline":[129],"implementations":[130],"are":[131],"publicly":[132],"available":[133],"at":[134],"https://github.com/SuDIS-ZJU/nlcTables":[135],"foster":[137],"future":[138],"research.":[139]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
