{"id":"https://openalex.org/W2107092590","doi":"https://doi.org/10.1177/0165551514551903","title":"On methods and tools of table detection, extraction and annotation in PDF documents","display_name":"On methods and tools of table detection, extraction and annotation in PDF documents","publication_year":2014,"publication_date":"2014-10-03","ids":{"openalex":"https://openalex.org/W2107092590","doi":"https://doi.org/10.1177/0165551514551903","mag":"2107092590"},"language":"en","primary_location":{"id":"doi:10.1177/0165551514551903","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0165551514551903","pdf_url":null,"source":{"id":"https://openalex.org/S68913162","display_name":"Journal of Information Science","issn_l":"0165-5515","issn":["0165-5515","1741-6485"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074454844","display_name":"Shah Khusro","orcid":"https://orcid.org/0000-0002-7734-7243"},"institutions":[{"id":"https://openalex.org/I36001604","display_name":"University of Peshawar","ror":"https://ror.org/02t2qwf81","country_code":"PK","type":"education","lineage":["https://openalex.org/I36001604"]}],"countries":["PK"],"is_corresponding":true,"raw_author_name":"Shah Khusro","raw_affiliation_strings":["Department of Computer Science, University of Peshawar, Pakistan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Peshawar, Pakistan","institution_ids":["https://openalex.org/I36001604"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110201683","display_name":"Asima Latif","orcid":null},"institutions":[{"id":"https://openalex.org/I36001604","display_name":"University of Peshawar","ror":"https://ror.org/02t2qwf81","country_code":"PK","type":"education","lineage":["https://openalex.org/I36001604"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Asima Latif","raw_affiliation_strings":["Department of Computer Science, University of Peshawar, Pakistan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Peshawar, Pakistan","institution_ids":["https://openalex.org/I36001604"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108013133","display_name":"Irfan Ullah","orcid":"https://orcid.org/0000-0003-0693-5467"},"institutions":[{"id":"https://openalex.org/I36001604","display_name":"University of Peshawar","ror":"https://ror.org/02t2qwf81","country_code":"PK","type":"education","lineage":["https://openalex.org/I36001604"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Irfan Ullah","raw_affiliation_strings":["Department of Computer Science, University of Peshawar, Pakistan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of Peshawar, Pakistan","institution_ids":["https://openalex.org/I36001604"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5074454844"],"corresponding_institution_ids":["https://openalex.org/I36001604"],"apc_list":null,"apc_paid":null,"fwci":2.7237,"has_fulltext":false,"cited_by_count":65,"citation_normalized_percentile":{"value":0.92589603,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"41","issue":"1","first_page":"41","last_page":"57"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/table","display_name":"Table (database)","score":0.8802011013031006},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.8680018186569214},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8281521201133728},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6778175234794617},{"id":"https://openalex.org/keywords/information-extraction","display_name":"Information extraction","score":0.5823488235473633},{"id":"https://openalex.org/keywords/data-extraction","display_name":"Data extraction","score":0.44741904735565186},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.38904523849487305},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.37135589122772217},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.25187334418296814}],"concepts":[{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.8802011013031006},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.8680018186569214},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8281521201133728},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6778175234794617},{"id":"https://openalex.org/C195807954","wikidata":"https://www.wikidata.org/wiki/Q1662562","display_name":"Information extraction","level":2,"score":0.5823488235473633},{"id":"https://openalex.org/C2777466982","wikidata":"https://www.wikidata.org/wiki/Q5227287","display_name":"Data extraction","level":3,"score":0.44741904735565186},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.38904523849487305},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.37135589122772217},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25187334418296814},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C2779473830","wikidata":"https://www.wikidata.org/wiki/Q1540899","display_name":"MEDLINE","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1177/0165551514551903","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0165551514551903","pdf_url":null,"source":{"id":"https://openalex.org/S68913162","display_name":"Journal of Information Science","issn_l":"0165-5515","issn":["0165-5515","1741-6485"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information Science","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8299999833106995,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":126,"referenced_works":["https://openalex.org/W30902120","https://openalex.org/W95284390","https://openalex.org/W158800878","https://openalex.org/W161140159","https://openalex.org/W178986155","https://openalex.org/W214170106","https://openalex.org/W603935256","https://openalex.org/W1495062271","https://openalex.org/W1501251778","https://openalex.org/W1503330383","https://openalex.org/W1506666816","https://openalex.org/W1509330973","https://openalex.org/W1511986666","https://openalex.org/W1529144909","https://openalex.org/W1534481981","https://openalex.org/W1546430096","https://openalex.org/W1552246388","https://openalex.org/W1555624686","https://openalex.org/W1557790983","https://openalex.org/W1562673218","https://openalex.org/W1564103265","https://openalex.org/W1568702397","https://openalex.org/W1569639771","https://openalex.org/W1595439448","https://openalex.org/W1605010801","https://openalex.org/W1605633529","https://openalex.org/W1774363252","https://openalex.org/W1967830139","https://openalex.org/W1970549718","https://openalex.org/W1971336721","https://openalex.org/W1974346290","https://openalex.org/W1981453410","https://openalex.org/W1981920506","https://openalex.org/W1984130280","https://openalex.org/W1988217119","https://openalex.org/W1993035437","https://openalex.org/W2000569744","https://openalex.org/W2009659675","https://openalex.org/W2015432638","https://openalex.org/W2022166150","https://openalex.org/W2026153548","https://openalex.org/W2033547624","https://openalex.org/W2034075507","https://openalex.org/W2034797903","https://openalex.org/W2046441607","https://openalex.org/W2048135704","https://openalex.org/W2051265407","https://openalex.org/W2052198547","https://openalex.org/W2056797079","https://openalex.org/W2058875874","https://openalex.org/W2066636486","https://openalex.org/W2069028640","https://openalex.org/W2072944755","https://openalex.org/W2074966879","https://openalex.org/W2076437101","https://openalex.org/W2077630735","https://openalex.org/W2078206655","https://openalex.org/W2082056382","https://openalex.org/W2086677639","https://openalex.org/W2091042506","https://openalex.org/W2092364718","https://openalex.org/W2092772700","https://openalex.org/W2093390569","https://openalex.org/W2093559286","https://openalex.org/W2096004021","https://openalex.org/W2096782419","https://openalex.org/W2096820050","https://openalex.org/W2098218583","https://openalex.org/W2102189859","https://openalex.org/W2102672399","https://openalex.org/W2104586313","https://openalex.org/W2105693220","https://openalex.org/W2106170438","https://openalex.org/W2106863921","https://openalex.org/W2111869785","https://openalex.org/W2119476919","https://openalex.org/W2121061496","https://openalex.org/W2121457610","https://openalex.org/W2127578890","https://openalex.org/W2128235325","https://openalex.org/W2129123248","https://openalex.org/W2130186082","https://openalex.org/W2130649712","https://openalex.org/W2131131934","https://openalex.org/W2132083030","https://openalex.org/W2134164043","https://openalex.org/W2135678693","https://openalex.org/W2136134253","https://openalex.org/W2136379584","https://openalex.org/W2137998699","https://openalex.org/W2141099517","https://openalex.org/W2142809404","https://openalex.org/W2147877524","https://openalex.org/W2147880316","https://openalex.org/W2150652226","https://openalex.org/W2150673968","https://openalex.org/W2151462415","https://openalex.org/W2151825758","https://openalex.org/W2151846280","https://openalex.org/W2153225416","https://openalex.org/W2154643148","https://openalex.org/W2155361294","https://openalex.org/W2156515921","https://openalex.org/W2163041183","https://openalex.org/W2165382068","https://openalex.org/W2166323498","https://openalex.org/W2168459394","https://openalex.org/W2185450495","https://openalex.org/W2229562501","https://openalex.org/W2315919170","https://openalex.org/W2331489044","https://openalex.org/W2470734433","https://openalex.org/W2504234218","https://openalex.org/W2623111293","https://openalex.org/W2671954119","https://openalex.org/W2886362482","https://openalex.org/W2912439978","https://openalex.org/W2912817377","https://openalex.org/W2913000315","https://openalex.org/W2913589968","https://openalex.org/W3142746689","https://openalex.org/W4206765718","https://openalex.org/W4229912654","https://openalex.org/W4229964943","https://openalex.org/W4285719527","https://openalex.org/W4401149522"],"related_works":["https://openalex.org/W2361861616","https://openalex.org/W2263699433","https://openalex.org/W2377979023","https://openalex.org/W2218034408","https://openalex.org/W2392921965","https://openalex.org/W2358755282","https://openalex.org/W2625833328","https://openalex.org/W1533177136","https://openalex.org/W2251519152","https://openalex.org/W4380994516"],"abstract_inverted_index":{"Table":[0],"detection,":[1,52,116],"extraction":[2,53,108,117],"and":[3,37,54,81,88,118],"annotation":[4,55],"have":[5,19],"been":[6,20],"an":[7],"important":[8],"research":[9,72],"problem":[10],"for":[11,22,35,84,93,96],"years.":[12],"To":[13],"handle":[14],"this":[15],"issue,":[16],"different":[17,23,39,106],"approaches":[18,77],"designed":[21],"types":[24,40],"of":[25,41,47,60,67,76],"documents.":[26,42,58],"Among":[27],"these":[28,126],"PDF":[29,57,133],"is":[30,102,136],"a":[31,74,151,154],"widely":[32],"used":[33,113],"format":[34],"preserving":[36],"presenting":[38],"We":[43,120],"investigate":[44],"the":[45,48,65,68],"state":[46,66],"art":[49,69],"in":[50,56,70,114,128,132,153],"table":[51,62,115,152],"Because":[59],"varying":[61],"structural":[63],"anatomy,":[64],"table-related":[71],"enumerates":[73],"number":[75],"that":[78,104,110,140,146],"are":[79,147],"critically":[80],"analytically":[82],"investigated":[83],"identifying":[85],"their":[86],"strengths":[87],"limitations":[89],"as":[90,92],"well":[91],"making":[94],"recommendations":[95],"further":[97],"improvement.":[98],"An":[99],"evaluation":[100],"framework":[101],"contributed":[103],"compares":[105],"information":[107],"tools":[109],"may":[111],"be":[112],"annotation.":[119],"found":[121],"very":[122],"limited":[123],"attention":[124],"towards":[125],"aspects":[127],"books,":[129],"especially":[130],"books":[131,143],"format.":[134],"There":[135],"no":[137],"searching":[138],"solution":[139],"can":[141],"find":[142],"having":[144],"tables":[145],"semantically":[148],"related":[149],"to":[150],"given":[155],"book.":[156]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":15},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":4},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":3}],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2025-10-10T00:00:00"}
