{"id":"https://openalex.org/W2827722876","doi":"https://doi.org/10.2352/issn.2470-1173.2018.2.vipc-253","title":"Text/Figure Separation in Document Images Using Docstrum Descriptor and Two-Level Clustering","display_name":"Text/Figure Separation in Document Images Using Docstrum Descriptor and Two-Level Clustering","publication_year":2018,"publication_date":"2018-01-28","ids":{"openalex":"https://openalex.org/W2827722876","doi":"https://doi.org/10.2352/issn.2470-1173.2018.2.vipc-253","mag":"2827722876"},"language":"en","primary_location":{"id":"doi:10.2352/issn.2470-1173.2018.2.vipc-253","is_oa":false,"landing_page_url":"https://doi.org/10.2352/issn.2470-1173.2018.2.vipc-253","pdf_url":null,"source":{"id":"https://openalex.org/S4210227276","display_name":"Electronic Imaging","issn_l":"2470-1173","issn":["2470-1173"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Electronic Imaging","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086730767","display_name":"Valery Anisimovskiy","orcid":"https://orcid.org/0000-0001-9134-1078"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Valery Anisimovskiy","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037152117","display_name":"Ilya V. Kurilin","orcid":"https://orcid.org/0009-0002-9015-4005"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ilya Kurilin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030242472","display_name":"Andrey Shcherbinin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Andrey Shcherbinin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5042565874","display_name":"Petr Pohl","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Petr Pohl","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5086730767"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0645067,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"30","issue":"2","first_page":"253","last_page":"1"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7508141994476318},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7025583982467651},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6636728048324585},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.600699245929718},{"id":"https://openalex.org/keywords/centroid","display_name":"Centroid","score":0.5471906661987305},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.5105458498001099},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.482723206281662},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4740840196609497},{"id":"https://openalex.org/keywords/unsupervised-learning","display_name":"Unsupervised learning","score":0.44555380940437317},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4282873272895813},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3637859523296356},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11642995476722717}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7508141994476318},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7025583982467651},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6636728048324585},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.600699245929718},{"id":"https://openalex.org/C146599234","wikidata":"https://www.wikidata.org/wiki/Q511093","display_name":"Centroid","level":2,"score":0.5471906661987305},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.5105458498001099},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.482723206281662},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4740840196609497},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.44555380940437317},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4282873272895813},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3637859523296356},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11642995476722717},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.2352/issn.2470-1173.2018.2.vipc-253","is_oa":false,"landing_page_url":"https://doi.org/10.2352/issn.2470-1173.2018.2.vipc-253","pdf_url":null,"source":{"id":"https://openalex.org/S4210227276","display_name":"Electronic Imaging","issn_l":"2470-1173","issn":["2470-1173"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Electronic Imaging","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2381926679","https://openalex.org/W2007009951","https://openalex.org/W2082644203","https://openalex.org/W2350539780","https://openalex.org/W3165040664","https://openalex.org/W3122652148","https://openalex.org/W1583866266","https://openalex.org/W4242386713","https://openalex.org/W2996505764","https://openalex.org/W3088649123"],"abstract_inverted_index":{"We":[0,110],"propose":[1],"a":[2],"novel":[3],"algorithm":[4,168],"for":[5,9,30,93,144],"text/figure":[6,58],"separation":[7,65],"tailored":[8],"binary":[10],"document":[11,70],"images":[12,71],"containing":[13],"line":[14],"drawings,":[15],"block":[16],"diagrams,":[17],"charts,":[18],"schemes":[19],"and":[20,46,80,99,127,161,176],"other":[21],"kinds":[22],"of":[23,27,38,56,77,96,101,125,138,180,189],"business":[24],"graphics.":[25],"Most":[26],"the":[28,51,190],"approaches":[29,61],"this":[31,112],"task":[32],"rely":[33],"either":[34,103],"on":[35,50],"clever":[36],"design":[37],"visual":[39],"descriptor":[40],"allowing":[41],"to":[42,69,119,158,172],"easily":[43],"distinguish":[44],"text":[45],"graphics":[47],"regions":[48,124],"or":[49,107,132],"supervised":[52],"learning":[53,116],"using":[54],"dataset":[55],"labeled":[57,84],"regions.":[59],"Such":[60],"often":[62],"provide":[63],"moderate":[64],"accuracy":[66],"when":[67],"applied":[68,118,157,171],"which":[72,149],"contain":[73],"very":[74],"diverse":[75],"set":[76],"figure":[78,97],"classes":[79,98],"lack":[81],"sufficiently":[82],"representative":[83],"training":[85],"dataset.":[86],"In":[87],"contrast,":[88],"our":[89,139],"method":[90,140],"is":[91,141,150,169,184],"well-suited":[92],"vast":[94],"variety":[95],"capable":[100],"operating":[102],"in":[104],"semi-supervised":[105,129],"mode":[106],"unsupervised":[108,115,133],"mode.":[109],"achieve":[111],"by":[113,187],"leveraging":[114],"algorithms":[117],"Docstrum":[120,159],"descriptors":[121,160],"extracted":[122],"from":[123],"interest":[126],"subsequent":[128],"label":[130,134],"propagation":[131],"inference.":[135],"Another":[136],"advantage":[137],"its":[142],"suitability":[143],"large":[145,173],"scale":[146,174],"data":[147,175],"processing":[148],"achieved":[151],"through":[152],"efficient":[153],"kernel-approximating":[154],"feature":[155],"mapping":[156],"two-level":[162],"clustering":[163,193],"where":[164],"fast":[165],"mini-batch":[166],"K-means":[167],"first":[170],"only":[177],"small":[178],"number":[179],"resulting":[181],"cluster":[182],"centroids":[183],"subsequently":[185],"processed":[186],"one":[188],"more":[191],"sophisticated":[192],"algorithms.":[194]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
