{"id":"https://openalex.org/W4297816490","doi":"https://doi.org/10.1145/3555349","title":"Classification of Layout vs. Relational Tables\u00a0on the Web: Machine Learning with Rendered Pages","display_name":"Classification of Layout vs. Relational Tables\u00a0on the Web: Machine Learning with Rendered Pages","publication_year":2022,"publication_date":"2022-08-09","ids":{"openalex":"https://openalex.org/W4297816490","doi":"https://doi.org/10.1145/3555349"},"language":"en","primary_location":{"id":"doi:10.1145/3555349","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3555349","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3555349","source":{"id":"https://openalex.org/S131231701","display_name":"ACM Transactions on the Web","issn_l":"1559-1131","issn":["1559-1131","1559-114X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on the Web","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3555349","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028892816","display_name":"Waqar Haider","orcid":"https://orcid.org/0000-0001-7108-6989"},"institutions":[{"id":"https://openalex.org/I201799495","display_name":"Middle East Technical University","ror":"https://ror.org/014weej12","country_code":"TR","type":"education","lineage":["https://openalex.org/I201799495"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Waqar Haider","raw_affiliation_strings":["Middle East Technical University Northern Cyprus Campus, Mersin, Turkey"],"affiliations":[{"raw_affiliation_string":"Middle East Technical University Northern Cyprus Campus, Mersin, Turkey","institution_ids":["https://openalex.org/I201799495"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006201403","display_name":"Yeliz Ye\u015filada","orcid":"https://orcid.org/0000-0001-8501-0205"},"institutions":[{"id":"https://openalex.org/I201799495","display_name":"Middle East Technical University","ror":"https://ror.org/014weej12","country_code":"TR","type":"education","lineage":["https://openalex.org/I201799495"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"Yeliz Yesilada","raw_affiliation_strings":["Middle East Technical University Northern Cyprus Campus, Mersin, Turkey"],"affiliations":[{"raw_affiliation_string":"Middle East Technical University Northern Cyprus Campus, Mersin, Turkey","institution_ids":["https://openalex.org/I201799495"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5028892816"],"corresponding_institution_ids":["https://openalex.org/I201799495"],"apc_list":null,"apc_paid":null,"fwci":1.5162,"has_fulltext":true,"cited_by_count":6,"citation_normalized_percentile":{"value":0.86538673,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"17","issue":"1","first_page":"1","last_page":"23"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9879000186920166,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9753999710083008,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8167593479156494},{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.6939268112182617},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.6286442875862122},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6067521572113037},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.58278489112854},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5789046287536621},{"id":"https://openalex.org/keywords/table-of-contents","display_name":"Table of contents","score":0.504499077796936},{"id":"https://openalex.org/keywords/relational-database","display_name":"Relational database","score":0.4428291916847229},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.40580421686172485},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.36698734760284424},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33526498079299927},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3323433995246887}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8167593479156494},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.6939268112182617},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.6286442875862122},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6067521572113037},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.58278489112854},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5789046287536621},{"id":"https://openalex.org/C68476402","wikidata":"https://www.wikidata.org/wiki/Q1456936","display_name":"Table of contents","level":2,"score":0.504499077796936},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.4428291916847229},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.40580421686172485},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36698734760284424},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33526498079299927},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3323433995246887},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3555349","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3555349","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3555349","source":{"id":"https://openalex.org/S131231701","display_name":"ACM Transactions on the Web","issn_l":"1559-1131","issn":["1559-1131","1559-114X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on the Web","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3555349","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3555349","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3555349","source":{"id":"https://openalex.org/S131231701","display_name":"ACM Transactions on the Web","issn_l":"1559-1131","issn":["1559-1131","1559-114X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on the Web","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.46000000834465027}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4297816490.pdf","grobid_xml":"https://content.openalex.org/works/W4297816490.grobid-xml"},"referenced_works_count":48,"referenced_works":["https://openalex.org/W155236017","https://openalex.org/W981727710","https://openalex.org/W1493235501","https://openalex.org/W1691409177","https://openalex.org/W1967774582","https://openalex.org/W1988217119","https://openalex.org/W2004193186","https://openalex.org/W2022351003","https://openalex.org/W2046710396","https://openalex.org/W2052198547","https://openalex.org/W2062783131","https://openalex.org/W2078206655","https://openalex.org/W2093559286","https://openalex.org/W2096496923","https://openalex.org/W2102189859","https://openalex.org/W2124576009","https://openalex.org/W2133669904","https://openalex.org/W2134708958","https://openalex.org/W2138556038","https://openalex.org/W2155243985","https://openalex.org/W2290320465","https://openalex.org/W2340354588","https://openalex.org/W2341748398","https://openalex.org/W2342096063","https://openalex.org/W2398606196","https://openalex.org/W2490420619","https://openalex.org/W2571832859","https://openalex.org/W2618530766","https://openalex.org/W2765370481","https://openalex.org/W2785494106","https://openalex.org/W2786162033","https://openalex.org/W2787523828","https://openalex.org/W2788550262","https://openalex.org/W2971470875","https://openalex.org/W2982377694","https://openalex.org/W3004442222","https://openalex.org/W3008881932","https://openalex.org/W3021275915","https://openalex.org/W3021344331","https://openalex.org/W3048516901","https://openalex.org/W3080211177","https://openalex.org/W3099839495","https://openalex.org/W3100314869","https://openalex.org/W3102616888","https://openalex.org/W4224982663","https://openalex.org/W4239044025","https://openalex.org/W4248184695","https://openalex.org/W6748296288"],"related_works":["https://openalex.org/W4293226380","https://openalex.org/W2948670949","https://openalex.org/W4288047943","https://openalex.org/W4232484699","https://openalex.org/W4313906399","https://openalex.org/W4321487865","https://openalex.org/W4321444604","https://openalex.org/W2990655940","https://openalex.org/W2535940710","https://openalex.org/W4255439234"],"abstract_inverted_index":{"Table":[0],"mining":[1,96,117],"on":[2,23,118],"the":[3,12,24,27,33,38,101,106,110,119,164,174,187,205,226,239,244,254,258],"web":[4,120,146],"is":[5,41,121,182,246],"an":[6,215],"open":[7],"problem,":[8],"and":[9,35,86,128,237,242,252],"none":[10],"of":[11,26,32,37,60,189,217],"previously":[13],"proposed":[14],"techniques":[15],"provides":[16],"a":[17,43,57,91,158,235],"complete":[18],"solution.":[19],"Most":[20],"research":[21],"focuses":[22],"structure":[25,36],"HTML":[28,102],"document,":[29],"but":[30,66,104],"because":[31],"nature":[34],"web,":[39],"it":[40,232],"still":[42,81],"challenging":[44],"problem":[45],"to":[46,83,94,122,250],"detect":[47],"relational":[48,124,177],"tables.":[49,151,178],"Web":[50],"Content":[51],"Accessibility":[52],"Guidelines":[53],"(WCAG)":[54],"also":[55,75],"cover":[56],"wide":[58],"range":[59],"recommendations":[61,73],"for":[62,135],"making":[63,257],"tables":[64,79,200,259],"accessible,":[65],"our":[67,141],"previous":[68],"work":[69,222],"shows":[70,224],"that":[71,136,225],"these":[72],"are":[74,80],"not":[76,98],"followed;":[77],"therefore,":[78],"inaccessible":[82],"disabled":[84],"people":[85],"automated":[87],"processing.":[88],"We":[89,138],"propose":[90,131],"new":[92],"approach":[93,154,198],"table":[95,116],"by":[97,109,163],"looking":[99],"at":[100],"structure,":[103],"rather,":[105],"rendered":[107,162,240],"pages":[108,147,241],"browser.":[111],"The":[112,179],"first":[113,139,153],"task":[114],"in":[115,172,256],"classify":[123],"vs.":[125,176],"layout":[126,175],"tables,":[127,243],"here,":[129],"we":[130],"two":[132],"alternative":[133],"approaches":[134],"task.":[137],"introduce":[140],"dataset,":[142],"which":[143,213],"includes":[144],"725":[145],"with":[148,183,186,193],"9,957":[149],"extracted":[150],"Our":[152,196,221],"extracts":[155],"features":[156],"from":[157,204],"page":[159],"after":[160,231],"being":[161],"browser,":[165],"then":[166],"applies":[167],"several":[168],"machine":[169],"learning":[170],"algorithms":[171],"classifying":[173],"best":[180],"result":[181],"Random":[184],"Forest":[185],"accuracy":[188,216],"97.2%":[190],"(F1-score:":[191,219],"0.955)":[192],"10-fold":[194],"cross-validation.":[195],"second":[197],"classifies":[199],"using":[201,208,238],"images":[202],"taken":[203],"same":[206],"sources":[207],"Convolutional":[209],"Neural":[210],"Network":[211],"(CNN),":[212],"gives":[214],"95%":[218],"0.95).":[220],"here":[223],"web\u2019s":[227],"true":[228],"essence":[229],"comes":[230],"goes":[233],"through":[234],"browser":[236],"classification":[245],"more":[247,260],"accurate":[248],"compared":[249],"literature":[251],"paves":[253],"way":[255],"accessible.":[261]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
