{"id":"https://openalex.org/W4318820499","doi":"https://doi.org/10.1007/978-3-031-17030-0_6","title":"Improving the\u00a0Usability of\u00a0Tabular Data Through Data Annotation, Repair and\u00a0Augmentation","display_name":"Improving the\u00a0Usability of\u00a0Tabular Data Through Data Annotation, Repair and\u00a0Augmentation","publication_year":2022,"publication_date":"2022-01-01","ids":{"openalex":"https://openalex.org/W4318820499","doi":"https://doi.org/10.1007/978-3-031-17030-0_6"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-031-17030-0_6","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-031-17030-0_6","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-3-031-17030-0_6.pdf","source":{"id":"https://openalex.org/S2764900261","display_name":"Communications in computer and information science","issn_l":"1865-0929","issn":["1865-0929","1865-0937"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Computer and Information Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/978-3-031-17030-0_6.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074172674","display_name":"Rabeb Abida","orcid":"https://orcid.org/0000-0003-4005-2633"},"institutions":[{"id":"https://openalex.org/I149768937","display_name":"University of Namur","ror":"https://ror.org/03d1maw17","country_code":"BE","type":"education","lineage":["https://openalex.org/I149768937"]}],"countries":["BE"],"is_corresponding":true,"raw_author_name":"Rabeb Abida","raw_affiliation_strings":["PReCISE, NaDI, Faculty of Computer Science, University of Namur, Namur, Belgium"],"raw_orcid":"https://orcid.org/0000-0003-4005-2633","affiliations":[{"raw_affiliation_string":"PReCISE, NaDI, Faculty of Computer Science, University of Namur, Namur, Belgium","institution_ids":["https://openalex.org/I149768937"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5070165042","display_name":"Anthony Cleve","orcid":null},"institutions":[{"id":"https://openalex.org/I149768937","display_name":"University of Namur","ror":"https://ror.org/03d1maw17","country_code":"BE","type":"education","lineage":["https://openalex.org/I149768937"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Anthony Cleve","raw_affiliation_strings":["PReCISE, NaDI, Faculty of Computer Science, University of Namur, Namur, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"PReCISE, NaDI, Faculty of Computer Science, University of Namur, Namur, Belgium","institution_ids":["https://openalex.org/I149768937"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5074172674"],"corresponding_institution_ids":["https://openalex.org/I149768937"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.58403709,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"65","last_page":"77"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8080800771713257},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.7756204009056091},{"id":"https://openalex.org/keywords/metadata","display_name":"Metadata","score":0.769885778427124},{"id":"https://openalex.org/keywords/missing-data","display_name":"Missing data","score":0.7219231724739075},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6598864793777466},{"id":"https://openalex.org/keywords/usable","display_name":"USable","score":0.6593440771102905},{"id":"https://openalex.org/keywords/usability","display_name":"Usability","score":0.593838632106781},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5879703760147095},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5203661322593689},{"id":"https://openalex.org/keywords/bridge","display_name":"Bridge (graph theory)","score":0.46866095066070557},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.45814889669418335},{"id":"https://openalex.org/keywords/data-quality","display_name":"Data quality","score":0.45416077971458435},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.31839966773986816},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1600877046585083},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.134794682264328},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07442629337310791}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8080800771713257},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.7756204009056091},{"id":"https://openalex.org/C93518851","wikidata":"https://www.wikidata.org/wiki/Q180160","display_name":"Metadata","level":2,"score":0.769885778427124},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.7219231724739075},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6598864793777466},{"id":"https://openalex.org/C2780615836","wikidata":"https://www.wikidata.org/wiki/Q2471869","display_name":"USable","level":2,"score":0.6593440771102905},{"id":"https://openalex.org/C170130773","wikidata":"https://www.wikidata.org/wiki/Q216378","display_name":"Usability","level":2,"score":0.593838632106781},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5879703760147095},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5203661322593689},{"id":"https://openalex.org/C100776233","wikidata":"https://www.wikidata.org/wiki/Q2532492","display_name":"Bridge (graph theory)","level":2,"score":0.46866095066070557},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.45814889669418335},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.45416077971458435},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.31839966773986816},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1600877046585083},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.134794682264328},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07442629337310791},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.0},{"id":"https://openalex.org/C126322002","wikidata":"https://www.wikidata.org/wiki/Q11180","display_name":"Internal medicine","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1007/978-3-031-17030-0_6","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-031-17030-0_6","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-3-031-17030-0_6.pdf","source":{"id":"https://openalex.org/S2764900261","display_name":"Communications in computer and information science","issn_l":"1865-0929","issn":["1865-0929","1865-0937"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Computer and Information Science","raw_type":"book-chapter"},{"id":"pmh:oai:pure.unamur.be:openaire_cris_publications/e5b2428d-6a56-4d8e-a7d5-6a7b1030b8c5","is_oa":false,"landing_page_url":"https://researchportal.unamur.be/en/publications/e5b2428d-6a56-4d8e-a7d5-6a7b1030b8c5","pdf_url":null,"source":{"id":"https://openalex.org/S4406922457","display_name":"Repository of the University of Namur","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Abida, R & Cleve, A 2023, Improving the Usability of Tabular Data through Data Annotation, Repair and Augmentation. in 2022 Symposium of the Norwegian AI Society. Communications in Computer and Information Science, Springer.","raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":{"id":"doi:10.1007/978-3-031-17030-0_6","is_oa":true,"landing_page_url":"https://doi.org/10.1007/978-3-031-17030-0_6","pdf_url":"https://link.springer.com/content/pdf/10.1007/978-3-031-17030-0_6.pdf","source":{"id":"https://openalex.org/S2764900261","display_name":"Communications in computer and information science","issn_l":"1865-0929","issn":["1865-0929","1865-0937"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Communications in Computer and Information Science","raw_type":"book-chapter"},"sustainable_development_goals":[{"score":0.5199999809265137,"display_name":"No poverty","id":"https://metadata.un.org/sdg/1"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320335302","display_name":"Universit\u00e9 de Namur","ror":"https://ror.org/03d1maw17"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4318820499.pdf"},"referenced_works_count":11,"referenced_works":["https://openalex.org/W102708294","https://openalex.org/W2080133951","https://openalex.org/W2581324571","https://openalex.org/W2788550262","https://openalex.org/W2898796029","https://openalex.org/W2965875055","https://openalex.org/W3013003636","https://openalex.org/W3023371140","https://openalex.org/W3099839495","https://openalex.org/W3114574485","https://openalex.org/W6608497737"],"related_works":["https://openalex.org/W2982321410","https://openalex.org/W2392768766","https://openalex.org/W2058118494","https://openalex.org/W2361861616","https://openalex.org/W95465806","https://openalex.org/W2392004567","https://openalex.org/W2095118173","https://openalex.org/W2382021449","https://openalex.org/W2183692821","https://openalex.org/W4213040784"],"abstract_inverted_index":{"Abstract":[0],"In":[1,86],"recent":[2],"years,":[3],"a":[4,63,151],"rapidly":[5],"increasing":[6],"amount":[7],"of":[8,22,65,143,159],"information":[9],"has":[10],"been":[11,48],"made":[12],"publicly":[13],"available":[14],"in":[15,50,157],"tabular":[16],"form":[17],"on":[18,148],"the":[19,51,106,139,144],"Web.":[20],"Many":[21],"these":[23,55,82],"data":[24,56,83,109,118,127],"are":[25],"not":[26],"usable":[27],"due":[28],"to":[29,53,76,80,100,138],"their":[30],"poor":[31],"quality":[32,57,84],"(e.g.,":[33],"misspelled":[34,113],"or":[35,39],"missing":[36,38,43,122],"values,":[37],"incomplete":[40,115],"metadata,":[41],"and":[42,93,114,126,134,161],"meaningful":[44,132],"columns).":[45],"Solutions":[46],"have":[47],"proposed":[49],"literature":[52],"address":[54,112,121],"issues,":[58],"but":[59],"there":[60],"is":[61],"still":[62],"lack":[64],"all-in-one":[66,92],"approaches":[67],"that":[68,98],"can":[69],"fully":[70],"solve":[71,81],"them.":[72],"Therefore,":[73],"users":[74],"need":[75],"use":[77],"several":[78],"methods":[79],"issues.":[85],"this":[87,102],"paper,":[88],"we":[89],"present":[90],"an":[91],"automatic":[94],"approach":[95,146],"called":[96],"SINATRA":[97,145],"helps":[99],"bridge":[101],"gaps":[103],"by":[104],"providing":[105],"following":[107],"features:":[108],"annotation":[110],"(to":[111,120,129],"metadata":[116],"issues),":[117,125],"repair":[119],"values":[123,137],"(data)":[124],"augmentation":[128],"dynamically":[130],"add":[131],"columns":[133],"corresponding":[135],"cell":[136],"dataset).":[140],"An":[141],"evaluation":[142],"based":[147],"datasets":[149],"from":[150],"state-of-the-art":[152],"benchmark":[153],"shows":[154],"promising":[155],"results":[156],"terms":[158],"F1-measure":[160],"precision.":[162]},"counts_by_year":[],"updated_date":"2026-06-13T06:13:01.061226","created_date":"2025-10-10T00:00:00"}
