{"id":"https://openalex.org/W2146708062","doi":"https://doi.org/10.1080/08839510701252551","title":"RELATIONAL DATA MINING AND ILP FOR DOCUMENT IMAGE UNDERSTANDING","display_name":"RELATIONAL DATA MINING AND ILP FOR DOCUMENT IMAGE UNDERSTANDING","publication_year":2007,"publication_date":"2007-04-25","ids":{"openalex":"https://openalex.org/W2146708062","doi":"https://doi.org/10.1080/08839510701252551","mag":"2146708062"},"language":"en","primary_location":{"id":"doi:10.1080/08839510701252551","is_oa":true,"landing_page_url":"https://doi.org/10.1080/08839510701252551","pdf_url":"https://www.tandfonline.com/doi/pdf/10.1080/08839510701252551?download=true","source":{"id":"https://openalex.org/S125501549","display_name":"Applied Artificial Intelligence","issn_l":"0883-9514","issn":["0883-9514","1087-6545"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://www.tandfonline.com/doi/pdf/10.1080/08839510701252551?download=true","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073750332","display_name":"Michelangelo Ceci","orcid":"https://orcid.org/0000-0002-6690-7583"},"institutions":[{"id":"https://openalex.org/I5561750","display_name":"University of Bari Aldo Moro","ror":"https://ror.org/027ynra39","country_code":"IT","type":"education","lineage":["https://openalex.org/I5561750"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Michelangelo Ceci","raw_affiliation_strings":["\n                   \n               Dipartimento di Informatica, Universit\u00e0 degli Studi di Bari, Bari, Italy","Dipartimento di Informatica - Universit\u00e0 degli Studi di Bari - Bari, Italy"],"affiliations":[{"raw_affiliation_string":"\n                   \n               Dipartimento di Informatica, Universit\u00e0 degli Studi di Bari, Bari, Italy","institution_ids":["https://openalex.org/I5561750"]},{"raw_affiliation_string":"Dipartimento di Informatica - Universit\u00e0 degli Studi di Bari - Bari, Italy","institution_ids":["https://openalex.org/I5561750"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041745569","display_name":"Margherita Berardi","orcid":null},"institutions":[{"id":"https://openalex.org/I5561750","display_name":"University of Bari Aldo Moro","ror":"https://ror.org/027ynra39","country_code":"IT","type":"education","lineage":["https://openalex.org/I5561750"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Margherita Berardi","raw_affiliation_strings":["\n                   \n               Dipartimento di Informatica, Universit\u00e0 degli Studi di Bari, Bari, Italy","Dipartimento di Informatica - Universit\u00e0 degli Studi di Bari - Bari, Italy"],"affiliations":[{"raw_affiliation_string":"\n                   \n               Dipartimento di Informatica, Universit\u00e0 degli Studi di Bari, Bari, Italy","institution_ids":["https://openalex.org/I5561750"]},{"raw_affiliation_string":"Dipartimento di Informatica - Universit\u00e0 degli Studi di Bari - Bari, Italy","institution_ids":["https://openalex.org/I5561750"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5035789137","display_name":"Donato Malerba","orcid":"https://orcid.org/0000-0001-8432-4608"},"institutions":[{"id":"https://openalex.org/I5561750","display_name":"University of Bari Aldo Moro","ror":"https://ror.org/027ynra39","country_code":"IT","type":"education","lineage":["https://openalex.org/I5561750"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Donato Malerba","raw_affiliation_strings":["\n                   \n               Dipartimento di Informatica, Universit\u00e0 degli Studi di Bari, Bari, Italy","Dipartimento di Informatica - Universit\u00e0 degli Studi di Bari - Bari, Italy"],"affiliations":[{"raw_affiliation_string":"\n                   \n               Dipartimento di Informatica, Universit\u00e0 degli Studi di Bari, Bari, Italy","institution_ids":["https://openalex.org/I5561750"]},{"raw_affiliation_string":"Dipartimento di Informatica - Universit\u00e0 degli Studi di Bari - Bari, Italy","institution_ids":["https://openalex.org/I5561750"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5035789137"],"corresponding_institution_ids":["https://openalex.org/I5561750"],"apc_list":{"value":2195,"currency":"USD","value_usd":2195},"apc_paid":null,"fwci":1.8716,"has_fulltext":true,"cited_by_count":18,"citation_normalized_percentile":{"value":0.86233193,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"21","issue":"4-5","first_page":"317","last_page":"342"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11063","display_name":"Rough Sets and Fuzzy Logic","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11063","display_name":"Rough Sets and Fuzzy Logic","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9900000095367432,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9843000173568726,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8535061478614807},{"id":"https://openalex.org/keywords/inductive-logic-programming","display_name":"Inductive logic programming","score":0.8326079845428467},{"id":"https://openalex.org/keywords/relational-database","display_name":"Relational database","score":0.5504414439201355},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5159302949905396},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.497576504945755},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.4724041819572449},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.4515768587589264},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.4417104125022888},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42468297481536865},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.38335585594177246},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3493651747703552},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3326668441295624}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8535061478614807},{"id":"https://openalex.org/C2779382394","wikidata":"https://www.wikidata.org/wiki/Q1464197","display_name":"Inductive logic programming","level":2,"score":0.8326079845428467},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.5504414439201355},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5159302949905396},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.497576504945755},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.4724041819572449},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.4515768587589264},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.4417104125022888},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42468297481536865},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.38335585594177246},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3493651747703552},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3326668441295624},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1080/08839510701252551","is_oa":true,"landing_page_url":"https://doi.org/10.1080/08839510701252551","pdf_url":"https://www.tandfonline.com/doi/pdf/10.1080/08839510701252551?download=true","source":{"id":"https://openalex.org/S125501549","display_name":"Applied Artificial Intelligence","issn_l":"0883-9514","issn":["0883-9514","1087-6545"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Artificial Intelligence","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.108.3424","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.108.3424","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.di.uniba.it/~ceci/micFiles/papers/ceci et AAI 2007.pdf","raw_type":"text"},{"id":"pmh:oai:ricerca.uniba.it:11586/127806","is_oa":false,"landing_page_url":"http://hdl.handle.net/11586/127806","pdf_url":null,"source":{"id":"https://openalex.org/S4377196296","display_name":"CINECA IRIS Institutional Research Information System (University of Bari Aldo Moro)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I5561750","host_organization_name":"University of Bari Aldo Moro","host_organization_lineage":["https://openalex.org/I5561750"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"doi:10.1080/08839510701252551","is_oa":true,"landing_page_url":"https://doi.org/10.1080/08839510701252551","pdf_url":"https://www.tandfonline.com/doi/pdf/10.1080/08839510701252551?download=true","source":{"id":"https://openalex.org/S125501549","display_name":"Applied Artificial Intelligence","issn_l":"0883-9514","issn":["0883-9514","1087-6545"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Applied Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.4000000059604645,"id":"https://metadata.un.org/sdg/17","display_name":"Partnerships for the goals"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2146708062.pdf","grobid_xml":"https://content.openalex.org/works/W2146708062.grobid-xml"},"referenced_works_count":40,"referenced_works":["https://openalex.org/W31561947","https://openalex.org/W1486717255","https://openalex.org/W1491691765","https://openalex.org/W1497943029","https://openalex.org/W1541434994","https://openalex.org/W1548367482","https://openalex.org/W1549887922","https://openalex.org/W1598033630","https://openalex.org/W1611920884","https://openalex.org/W1801594279","https://openalex.org/W1979622972","https://openalex.org/W1983284692","https://openalex.org/W2013866009","https://openalex.org/W2062226968","https://openalex.org/W2071415224","https://openalex.org/W2090393796","https://openalex.org/W2096942889","https://openalex.org/W2103116581","https://openalex.org/W2116509046","https://openalex.org/W2120543825","https://openalex.org/W2121906195","https://openalex.org/W2131043005","https://openalex.org/W2131715999","https://openalex.org/W2135085165","https://openalex.org/W2139689856","https://openalex.org/W2140785063","https://openalex.org/W2141756865","https://openalex.org/W2146904366","https://openalex.org/W2161484642","https://openalex.org/W2164727403","https://openalex.org/W2169042011","https://openalex.org/W2172223321","https://openalex.org/W2520858206","https://openalex.org/W2526346152","https://openalex.org/W2962735828","https://openalex.org/W3023264106","https://openalex.org/W3149838063","https://openalex.org/W4206370914","https://openalex.org/W4206727053","https://openalex.org/W4237171445"],"related_works":["https://openalex.org/W2978856588","https://openalex.org/W2995623605","https://openalex.org/W2118775997","https://openalex.org/W320292658","https://openalex.org/W2001007279","https://openalex.org/W2009141112","https://openalex.org/W3181676408","https://openalex.org/W2596625410","https://openalex.org/W1523236614","https://openalex.org/W2079674650"],"abstract_inverted_index":{"&":[0],"Document":[1],"image":[2,172,179,219],"understanding":[3,253],"denotes":[4],"the":[5,12,55,105,109,126,129,138,155,159,167,175,231,243,250],"recognition":[6,19],"of":[7,38,78,120,128,150,158,170,177,230,242,254,261],"semantically":[8,263],"relevant":[9,264],"components":[10,229,266,279],"in":[11,45,82,117],"layout":[13,40,246,265,278],"extracted":[14],"from":[15],"a":[16,121,146,201],"document":[17,185,218,255],"image.This":[18],"process":[20,203],"is":[21,91,174,200,220,259],"based":[22],"on":[23,72],"domain-specific":[24],"knowledge":[25,241],"that":[26,98,137,181,260],"can":[27],"be":[28,143],"acquired":[29],"automatically":[30],"by":[31],"applying":[32],"data":[33,52,75,115],"mining":[34,53],"techniques.The":[35],"spatial":[36,130],"dimension":[37,131],"page":[39],"makes":[41],"classification":[42],"methods":[43],"developed":[44],"inductive":[46],"logic":[47],"programming":[48],"(ILP)":[49],"and":[50,69,86,135,195,216,269],"multi-relational":[51],"(MRDM)":[54],"most":[56],"suitable":[57],"candidates":[58],"for":[59,132,190],"this":[60,63,133],"specific":[61,244],"task.In":[62],"paper,":[64],"both":[65],"approaches":[66],"are":[67],"considered":[68],"empirically":[70],"compared":[71],"three":[73],"different":[74],"sets":[76],"consisting":[77],"multi-page":[79],"articles":[80],"published":[81],"an":[83],"international":[84],"journal":[85],"historical":[87],"documents.The":[88],"ILP":[89,139],"method":[90,107,140,161],"able":[92],"to":[93,114,142,164,183,187],"learn":[94],"recursive":[95],"logical":[96,102],"theories":[97],"express":[99],"dependencies":[100],"between":[101,166,277],"components,":[103],"while":[104,154],"MRDM":[106,160],"extends":[108],"na":[110],"ve":[111],"Bayesian":[112],"classifier":[113],"stored":[116],"multiple":[118],"tables":[119],"relational":[122],"database.Experimental":[123],"results":[124],"confirm":[125],"importance":[127],"application":[134],"show":[136],"tends":[141],"conservative":[144],"with":[145],"high":[147],"(low)":[148],"percentage":[149],"omission":[151],"(commission)":[152],"errors,":[153],"probabilistic":[156],"nature":[157],"allows":[162],"us":[163],"tradeoff":[165],"two":[168],"types":[169],"error.Document":[171],"analysis":[173,247],"subfield":[176],"digital":[178],"processing":[180,208],"aims":[182],"convert":[184],"images":[186],"symbolic":[188],"form":[189],"modification,":[191],"storage,":[192],"retrieval,":[193],"reuse,":[194],"transmission":[196],"(Nagy":[197],"2000).This":[198],"conversion":[199],"complex":[202],"articulated":[204],"into":[205,222],"several":[206,223],"stages.Initial":[207],"steps":[209],"include":[210],"binarization,":[211],"skew":[212],"detection,":[213],"noise":[214],"filtering,":[215],"segmentation.Then":[217],"decomposed":[221],"constituent":[224],"items":[225],"which":[226],"represent":[227],"coherent":[228],"documents":[232],"(e.g.,":[233,267,280],"text":[234],"lines":[235],"or":[236,252],"halftone":[237],"images),":[238],"without":[239],"any":[240],"format.This":[245],"step":[248],"precedes":[249],"interpretation":[251],"images,":[256],"whose":[257],"aim":[258],"recognizing":[262],"title":[268],"abstract)":[270],"as":[271,273],"well":[272],"extracting":[274],"abstract":[275],"relationships":[276],"reading":[281],"order).":[282]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
