{"id":"https://openalex.org/W2066988702","doi":"https://doi.org/10.1002/(sici)1098-1098(199624)7:4<330::aid-ima8>3.0.co;2-9","title":"An integrated approach to document decomposition and structural analysis","display_name":"An integrated approach to document decomposition and structural analysis","publication_year":1996,"publication_date":"1996-01-01","ids":{"openalex":"https://openalex.org/W2066988702","doi":"https://doi.org/10.1002/(sici)1098-1098(199624)7:4<330::aid-ima8>3.0.co;2-9","mag":"2066988702"},"language":"en","primary_location":{"id":"doi:10.1002/(sici)1098-1098(199624)7:4<330::aid-ima8>3.0.co;2-9","is_oa":false,"landing_page_url":"https://doi.org/10.1002/(sici)1098-1098(199624)7:4<330::aid-ima8>3.0.co;2-9","pdf_url":null,"source":{"id":"https://openalex.org/S15952048","display_name":"International Journal of Imaging Systems and Technology","issn_l":"0899-9457","issn":["0899-9457","1098-1098"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Imaging Systems and Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055941869","display_name":"Debashish Niyogi","orcid":null},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Debashish Niyogi","raw_affiliation_strings":["Center of Excellence for Document Analysis and Recognition, State University of New York at Buffalo, UB Commons, 520 Lee Entrance, Suite 202, Amherst, NY 14228-2567","Center of Excellence for Document Analysis and Recognition, State University of New York at Buffalo, UB Commons, 520 Lee Entrance, Suite 202, Amherst, NY 14228\u20102567"],"affiliations":[{"raw_affiliation_string":"Center of Excellence for Document Analysis and Recognition, State University of New York at Buffalo, UB Commons, 520 Lee Entrance, Suite 202, Amherst, NY 14228-2567","institution_ids":["https://openalex.org/I63190737"]},{"raw_affiliation_string":"Center of Excellence for Document Analysis and Recognition, State University of New York at Buffalo, UB Commons, 520 Lee Entrance, Suite 202, Amherst, NY 14228\u20102567","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102711181","display_name":"Sargur N. Srihari","orcid":null},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sargur N. Srihari","raw_affiliation_strings":["Center of Excellence for Document Analysis and Recognition, State University of New York at Buffalo, UB Commons, 520 Lee Entrance, Suite 202, Amherst, NY 14228-2567","Center of Excellence for Document Analysis and Recognition, State University of New York at Buffalo, UB Commons, 520 Lee Entrance, Suite 202, Amherst, NY 14228\u20102567"],"affiliations":[{"raw_affiliation_string":"Center of Excellence for Document Analysis and Recognition, State University of New York at Buffalo, UB Commons, 520 Lee Entrance, Suite 202, Amherst, NY 14228-2567","institution_ids":["https://openalex.org/I63190737"]},{"raw_affiliation_string":"Center of Excellence for Document Analysis and Recognition, State University of New York at Buffalo, UB Commons, 520 Lee Entrance, Suite 202, Amherst, NY 14228\u20102567","institution_ids":["https://openalex.org/I63190737"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5055941869"],"corresponding_institution_ids":["https://openalex.org/I63190737"],"apc_list":{"value":3450,"currency":"USD","value_usd":3450},"apc_paid":null,"fwci":0.4984,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.6966559,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"7","issue":"4","first_page":"330","last_page":"342"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9861999750137329,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9854000210762024,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/document-layout-analysis","display_name":"Document layout analysis","score":0.8594088554382324},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7761696577072144},{"id":"https://openalex.org/keywords/facsimile","display_name":"Facsimile","score":0.6129976511001587},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6113264560699463},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6005608439445496},{"id":"https://openalex.org/keywords/well-formed-document","display_name":"Well-formed document","score":0.5293921828269958},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5259806513786316},{"id":"https://openalex.org/keywords/document-processing","display_name":"Document processing","score":0.5050771832466125},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.4822288453578949},{"id":"https://openalex.org/keywords/document-clustering","display_name":"Document clustering","score":0.4733721613883972},{"id":"https://openalex.org/keywords/document-structure-description","display_name":"Document Structure Description","score":0.4567800760269165},{"id":"https://openalex.org/keywords/document-management-system","display_name":"Document management system","score":0.45535802841186523},{"id":"https://openalex.org/keywords/decomposition","display_name":"Decomposition","score":0.44496726989746094},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.43427574634552},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35554957389831543},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.33959275484085083},{"id":"https://openalex.org/keywords/document-type-definition","display_name":"Document type definition","score":0.24987906217575073},{"id":"https://openalex.org/keywords/xml","display_name":"XML","score":0.21820667386054993},{"id":"https://openalex.org/keywords/transmission","display_name":"Transmission (telecommunications)","score":0.142676442861557},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.12696272134780884},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09110301733016968}],"concepts":[{"id":"https://openalex.org/C72773152","wikidata":"https://www.wikidata.org/wiki/Q5287629","display_name":"Document layout analysis","level":3,"score":0.8594088554382324},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7761696577072144},{"id":"https://openalex.org/C2778310199","wikidata":"https://www.wikidata.org/wiki/Q194070","display_name":"Facsimile","level":3,"score":0.6129976511001587},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6113264560699463},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6005608439445496},{"id":"https://openalex.org/C137441365","wikidata":"https://www.wikidata.org/wiki/Q7981054","display_name":"Well-formed document","level":5,"score":0.5293921828269958},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5259806513786316},{"id":"https://openalex.org/C67905146","wikidata":"https://www.wikidata.org/wiki/Q5287646","display_name":"Document processing","level":2,"score":0.5050771832466125},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.4822288453578949},{"id":"https://openalex.org/C177937566","wikidata":"https://www.wikidata.org/wiki/Q4223102","display_name":"Document clustering","level":3,"score":0.4733721613883972},{"id":"https://openalex.org/C68699486","wikidata":"https://www.wikidata.org/wiki/Q265904","display_name":"Document Structure Description","level":3,"score":0.4567800760269165},{"id":"https://openalex.org/C2278759","wikidata":"https://www.wikidata.org/wiki/Q831677","display_name":"Document management system","level":2,"score":0.45535802841186523},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.44496726989746094},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.43427574634552},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35554957389831543},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33959275484085083},{"id":"https://openalex.org/C84314905","wikidata":"https://www.wikidata.org/wiki/Q212327","display_name":"Document type definition","level":4,"score":0.24987906217575073},{"id":"https://openalex.org/C8797682","wikidata":"https://www.wikidata.org/wiki/Q2115","display_name":"XML","level":2,"score":0.21820667386054993},{"id":"https://openalex.org/C761482","wikidata":"https://www.wikidata.org/wiki/Q118093","display_name":"Transmission (telecommunications)","level":2,"score":0.142676442861557},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.12696272134780884},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09110301733016968},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1002/(sici)1098-1098(199624)7:4<330::aid-ima8>3.0.co;2-9","is_oa":false,"landing_page_url":"https://doi.org/10.1002/(sici)1098-1098(199624)7:4<330::aid-ima8>3.0.co;2-9","pdf_url":null,"source":{"id":"https://openalex.org/S15952048","display_name":"International Journal of Imaging Systems and Technology","issn_l":"0899-9457","issn":["0899-9457","1098-1098"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Imaging Systems and Technology","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.43.5369","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.43.5369","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cedar.buffalo.edu/~niyogi/papers/IJIST/IJIST.ps","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4399999976158142,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2296417820","https://openalex.org/W217414027","https://openalex.org/W2089356193","https://openalex.org/W2079569022","https://openalex.org/W3151136357","https://openalex.org/W3217329329","https://openalex.org/W4255926577","https://openalex.org/W4387846611","https://openalex.org/W4238415164","https://openalex.org/W2359653062"],"abstract_inverted_index":{"A":[0,96],"document":[1,43,56,70,86],"image":[2,30,49,71],"is":[3,114],"a":[4,8,13,17,33,42,128],"visual":[5],"representation":[6],"of":[7,20,37,64,76,85,127,146,154],"paper":[9],"document,":[10,129],"such":[11],"as":[12,32],"journal":[14],"article":[15,54],"page,":[16],"cover":[18],"page":[19],"facsimile":[21],"transmission,":[22],"office":[23],"correspondence,":[24],"an":[25],"application":[26],"form,":[27],"etc.":[28],"Document":[29],"understanding":[31],"research":[34],"endeavor":[35],"consists":[36],"developing":[38],"processes":[39,67],"for":[40],"taking":[41],"through":[44],"various":[45],"representations,":[46],"from":[47],"scanned":[48],"to":[50,122,133],"semantic":[51],"representation.":[52],"This":[53,116],"describes":[55],"decomposition":[57,100],"and":[58,79,90,101,107,130,135,159],"structural":[59,102],"analysis,":[60,89],"which":[61],"constitutes":[62],"one":[63],"the":[65,77,83,124,147,152],"major":[66],"involved":[68],"in":[69,82],"understanding.":[72],"The":[73],"current":[74],"state":[75],"art":[78],"future":[80],"directions":[81],"areas":[84],"segmentation,":[87],"layout":[88,131],"logical":[91,105,140],"block":[92,125],"grouping":[93,106],"are":[94,157],"indicated.":[95],"system":[97,117],"that":[98,142],"performs":[99],"analysis":[103],"(including":[104],"read-order":[108],"determination)":[109],"on":[110],"complex":[111],"multiarticled":[112],"documents":[113],"presented.":[115],"uses":[118],"bottom-up":[119],"segmentation":[120],"techniques":[121],"identify":[123],"structure":[126],"rules":[132],"classify":[134],"group":[136],"these":[137],"blocks":[138],"into":[139],"units":[141],"represent":[143],"meaningful":[144],"subdivisions":[145],"document.":[148],"Experimental":[149],"results":[150],"showing":[151],"efficiency":[153],"this":[155],"approach":[156],"presented":[158],"discussed.":[160],"\u00a9":[161],"1996":[162],"John":[163],"Wiley":[164],"&":[165],"Sons,":[166],"Inc.":[167]},"counts_by_year":[{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
