{"id":"https://openalex.org/W7154170117","doi":"https://doi.org/10.1145/3772318.3791449","title":"SemTabla: A Human-in-the-Loop Framework for Semantic Enrichment and Validation of Data Tables","display_name":"SemTabla: A Human-in-the-Loop Framework for Semantic Enrichment and Validation of Data Tables","publication_year":2026,"publication_date":"2026-04-13","ids":{"openalex":"https://openalex.org/W7154170117","doi":"https://doi.org/10.1145/3772318.3791449"},"language":null,"primary_location":{"id":"doi:10.1145/3772318.3791449","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3772318.3791449","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 CHI Conference on Human Factors in Computing Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3772318.3791449","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5012157105","display_name":"Zhuochen Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhuochen Jin","raw_affiliation_strings":["Tongji Universiy, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-7246-3923","affiliations":[{"raw_affiliation_string":"Tongji Universiy, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133491174","display_name":"Yingjie Mi","orcid":"https://orcid.org/0009-0008-7466-7031"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingjie Mi","raw_affiliation_strings":["School of intelligence Science and Technology, Nanjing University, Nanjing, China and Huawei Cloud, Hangzhou, China"],"raw_orcid":"https://orcid.org/0009-0008-7466-7031","affiliations":[{"raw_affiliation_string":"School of intelligence Science and Technology, Nanjing University, Nanjing, China and Huawei Cloud, Hangzhou, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yehang Zhu","orcid":"https://orcid.org/0009-0003-0886-0128"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yehang Zhu","raw_affiliation_strings":["School of Intelligent Software and Engineering, Nanjing University, Nanjing, China"],"raw_orcid":"https://orcid.org/0009-0003-0886-0128","affiliations":[{"raw_affiliation_string":"School of Intelligent Software and Engineering, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133532745","display_name":"yichen yao","orcid":"https://orcid.org/0009-0006-4344-3903"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"yichen yao","raw_affiliation_strings":["School of Intelligent Software and Engineering, Nanjing University, Nanjing, China"],"raw_orcid":"https://orcid.org/0009-0006-4344-3903","affiliations":[{"raw_affiliation_string":"School of Intelligent Software and Engineering, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133487698","display_name":"Chongyang Yu","orcid":"https://orcid.org/0009-0009-0579-0244"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chongyang Yu","raw_affiliation_strings":["School of Intelligence Science and Technology, Nanjing University, Nanjing, China"],"raw_orcid":"https://orcid.org/0009-0009-0579-0244","affiliations":[{"raw_affiliation_string":"School of Intelligence Science and Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5133536138","display_name":"Ke Xu","orcid":"https://orcid.org/0000-0001-6481-3770"},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ke Xu","raw_affiliation_strings":["School of Intelligence Science and Technology, Nanjing University, Nanjing, China"],"raw_orcid":"https://orcid.org/0000-0001-6481-3770","affiliations":[{"raw_affiliation_string":"School of Intelligence Science and Technology, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I36399199"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5012157105"],"corresponding_institution_ids":["https://openalex.org/I116953780"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.85718937,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"22"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.8827000260353088,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.8827000260353088,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.05299999937415123,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.008700000122189522,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.6682999730110168},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.6514000296592712},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.5906999707221985},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4447000026702881},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.42879998683929443},{"id":"https://openalex.org/keywords/interface","display_name":"Interface (matter)","score":0.40230000019073486}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8416000008583069},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.6682999730110168},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.6514000296592712},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.5906999707221985},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4447000026702881},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.42879998683929443},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.40230000019073486},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.39809998869895935},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37139999866485596},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.36390000581741333},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.3626999855041504},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.35190001130104065},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.288100004196167},{"id":"https://openalex.org/C2778828372","wikidata":"https://www.wikidata.org/wiki/Q5283209","display_name":"Distributional semantics","level":3,"score":0.2718000113964081},{"id":"https://openalex.org/C511149849","wikidata":"https://www.wikidata.org/wiki/Q7449051","display_name":"Semantic computing","level":3,"score":0.26809999346733093},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.25949999690055847},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.2556999921798706}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3772318.3791449","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3772318.3791449","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 CHI Conference on Human Factors in Computing Systems","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3772318.3791449","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3772318.3791449","pdf_url":null,"source":null,"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2026 CHI Conference on Human Factors in Computing Systems","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.7529737949371338,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W2023718005","https://openalex.org/W2064766209","https://openalex.org/W2122949840","https://openalex.org/W2135415614","https://openalex.org/W2145154883","https://openalex.org/W2166549982","https://openalex.org/W2168270139","https://openalex.org/W2266772167","https://openalex.org/W2526501380","https://openalex.org/W2551119071","https://openalex.org/W2753739212","https://openalex.org/W2952611840","https://openalex.org/W2973366514","https://openalex.org/W3001838726","https://openalex.org/W3035461111","https://openalex.org/W3158303960","https://openalex.org/W3159054342","https://openalex.org/W4210312918","https://openalex.org/W4297459242","https://openalex.org/W4309735497","https://openalex.org/W4312600202","https://openalex.org/W4321393171","https://openalex.org/W4377104732","https://openalex.org/W4381950474","https://openalex.org/W4384563086","https://openalex.org/W4387138412","https://openalex.org/W4391709246","https://openalex.org/W4393317678","https://openalex.org/W4396832076","https://openalex.org/W4399175313","https://openalex.org/W4399435163","https://openalex.org/W4399670658","https://openalex.org/W4408564929","https://openalex.org/W4409747213","https://openalex.org/W4409749522"],"related_works":[],"abstract_inverted_index":{"Data":[0],"tables":[1],"are":[2],"widely":[3],"used":[4],"to":[5,11,29,41,47,77],"record":[6],"critical":[7,105],"information,":[8],"enabling":[9],"decision-makers":[10],"derive":[12],"insights":[13],"through":[14],"table":[15,24,124],"question":[16],"answering":[17],"(Table":[18],"QA).":[19],"However,":[20],"the":[21,31,37,122,130,138,143],"metadata":[22],"from":[23,83],"schemas":[25],"alone":[26],"often":[27],"fail":[28],"capture":[30],"underlying":[32],"business":[33],"semantics":[34,82,140],"embedded":[35],"in":[36,52],"tabular":[38,84],"data,":[39],"leading":[40],"reasoning":[42,144],"errors.":[43],"Existing":[44],"automated":[45],"approaches":[46],"semantic":[48,96],"enrichment":[49],"face":[50],"challenges":[51],"insufficient":[53],"data":[54],"utilization,":[55],"narrow":[56],"feature":[57],"coverage,":[58],"and":[59,80,110,119,133],"limited":[60],"interpretability.":[61],"To":[62],"overcome":[63],"these":[64],"limitations,":[65],"we":[66],"propose":[67],"SemTabla,":[68],"an":[69,112],"interactive":[70,113],"system":[71],"that":[72,103,115,137],"employs":[73],"a":[74,91,99],"human-in-the-loop":[75],"mechanism":[76],"extract":[78],"comprehensive":[79],"interpretable":[81],"data.":[85],"Our":[86],"key":[87],"contributions":[88],"include:":[89],"(1)":[90],"hierarchical":[92],"framework":[93],"for":[94],"extracting":[95],"attributes;":[97],"(2)":[98],"novel":[100],"sampling":[101],"method":[102],"identifies":[104],"but":[106],"rare":[107],"row":[108],"instances;":[109],"(3)":[111],"interface":[114],"supports":[116],"visualization,":[117],"validation,":[118],"refinement":[120],"of":[121,146],"extracted":[123,139],"semantics.":[125],"A":[126],"user":[127],"study":[128],"confirmed":[129],"system\u2019s":[131],"usability,":[132],"quantitative":[134],"experiments":[135],"demonstrate":[136],"significantly":[141],"enhance":[142],"capabilities":[145],"large":[147],"language":[148],"models.":[149]},"counts_by_year":[],"updated_date":"2026-04-25T08:17:42.794288","created_date":"2026-04-14T00:00:00"}
