{"id":"https://openalex.org/W2110212011","doi":"https://doi.org/10.1109/cvpr.2009.5206606","title":"Robust unsupervised segmentation of degraded document images with topic models","display_name":"Robust unsupervised segmentation of degraded document images with topic models","publication_year":2009,"publication_date":"2009-06-01","ids":{"openalex":"https://openalex.org/W2110212011","doi":"https://doi.org/10.1109/cvpr.2009.5206606","mag":"2110212011"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr.2009.5206606","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2009.5206606","pdf_url":null,"source":{"id":"https://openalex.org/S4363607795","display_name":"2009 IEEE Conference on Computer Vision and Pattern Recognition","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE Conference on Computer Vision and Pattern Recognition","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079677615","display_name":"Timothy J. Burns","orcid":"https://orcid.org/0000-0002-7201-6437"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Timothy J. Burns","raw_affiliation_strings":["Computer Science and Engineering, Suny at Buffalo, Buffalo, NY, USA","Computer Science and Engineering, SUNY at Buffalo, Buffalo, NY, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Suny at Buffalo, Buffalo, NY, USA","institution_ids":["https://openalex.org/I63190737"]},{"raw_affiliation_string":"Computer Science and Engineering, SUNY at Buffalo, Buffalo, NY, USA","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079301873","display_name":"Jason J. Corso","orcid":"https://orcid.org/0000-0001-6454-9594"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jason J. Corso","raw_affiliation_strings":["Computer Science and Engineering, Suny at Buffalo, Buffalo, NY, USA","Computer Science and Engineering, SUNY at Buffalo, Buffalo, NY, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science and Engineering, Suny at Buffalo, Buffalo, NY, USA","institution_ids":["https://openalex.org/I63190737"]},{"raw_affiliation_string":"Computer Science and Engineering, SUNY at Buffalo, Buffalo, NY, USA","institution_ids":["https://openalex.org/I63190737"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5079677615"],"corresponding_institution_ids":["https://openalex.org/I63190737"],"apc_list":null,"apc_paid":null,"fwci":0.7465,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.76421305,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1287","last_page":"1294"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8214017152786255},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6931442022323608},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6828065514564514},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5796513557434082},{"id":"https://openalex.org/keywords/heuristics","display_name":"Heuristics","score":0.578449547290802},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5782160758972168},{"id":"https://openalex.org/keywords/codebook","display_name":"Codebook","score":0.5493379831314087},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.49460408091545105},{"id":"https://openalex.org/keywords/scale-space-segmentation","display_name":"Scale-space segmentation","score":0.48506441712379456},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.48206740617752075},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.420917809009552},{"id":"https://openalex.org/keywords/document-layout-analysis","display_name":"Document layout analysis","score":0.4136779308319092},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.40384650230407715},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.37241625785827637},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.30628710985183716}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8214017152786255},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6931442022323608},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6828065514564514},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5796513557434082},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.578449547290802},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5782160758972168},{"id":"https://openalex.org/C127759330","wikidata":"https://www.wikidata.org/wiki/Q637416","display_name":"Codebook","level":2,"score":0.5493379831314087},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.49460408091545105},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.48506441712379456},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.48206740617752075},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.420917809009552},{"id":"https://openalex.org/C72773152","wikidata":"https://www.wikidata.org/wiki/Q5287629","display_name":"Document layout analysis","level":3,"score":0.4136779308319092},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40384650230407715},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.37241625785827637},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.30628710985183716},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/cvpr.2009.5206606","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr.2009.5206606","pdf_url":null,"source":{"id":"https://openalex.org/S4363607795","display_name":"2009 IEEE Conference on Computer Vision and Pattern Recognition","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE Conference on Computer Vision and Pattern Recognition","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.188.7517","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.188.7517","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cse.buffalo.edu/%7Ejcorso/pubs/cvpr2009_docs.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.211.5015","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.211.5015","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cse.buffalo.edu/~tjburns/1019.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1487718662","https://openalex.org/W1572666543","https://openalex.org/W1592774159","https://openalex.org/W1625255723","https://openalex.org/W1880262756","https://openalex.org/W2016847844","https://openalex.org/W2096210305","https://openalex.org/W2106919699","https://openalex.org/W2107034620","https://openalex.org/W2112050062","https://openalex.org/W2116013899","https://openalex.org/W2120685492","https://openalex.org/W2134383396","https://openalex.org/W2134636339","https://openalex.org/W2140124448","https://openalex.org/W2141303268","https://openalex.org/W2141376824","https://openalex.org/W2144209937","https://openalex.org/W2150920547","https://openalex.org/W2151259137","https://openalex.org/W2162031011","https://openalex.org/W2163220086","https://openalex.org/W2165463593","https://openalex.org/W2169402356","https://openalex.org/W4254997627","https://openalex.org/W4300407400","https://openalex.org/W6635368981","https://openalex.org/W6636494156","https://openalex.org/W6639619044","https://openalex.org/W6836242169"],"related_works":["https://openalex.org/W4365211920","https://openalex.org/W3014948380","https://openalex.org/W4380551139","https://openalex.org/W2280377497","https://openalex.org/W3174044702","https://openalex.org/W4238433571","https://openalex.org/W2967848559","https://openalex.org/W4283803360","https://openalex.org/W4317695495","https://openalex.org/W4387506531"],"abstract_inverted_index":{"Segmentation":[0],"of":[1,18,78,173],"document":[2,10,71,90,129,156],"images":[3,11,72],"remains":[4,45],"a":[5,13,46,66,89,93,120,153,169],"challenging":[6],"vision":[7],"problem.":[8],"Although":[9],"have":[12],"structured":[14],"layout,":[15],"capturing":[16],"enough":[17],"it":[19],"for":[20,33,70],"segmentation":[21,150],"can":[22],"be":[23],"difficult.":[24],"Most":[25],"current":[26],"methods":[27,58],"combine":[28],"text":[29,36,100],"extraction":[30,37],"and":[31,42,147],"heuristics":[32],"segmentation,":[34],"but":[35,102],"is":[38,119],"prone":[39],"to":[40,75,109,143],"failure":[41],"measuring":[43],"accuracy":[44],"difficult":[47],"challenge.":[48],"Furthermore,":[49],"when":[50],"presented":[51],"with":[52,131],"significant":[53],"degradation":[54],"many":[55],"common":[56],"heuristic":[57],"fall":[59],"apart.":[60],"In":[61],"this":[62],"paper,":[63],"we":[64],"propose":[65],"Bayesian":[67],"generative":[68],"model":[69,82],"which":[73],"seeks":[74],"overcome":[76],"some":[77],"these":[79,123],"drawbacks.":[80],"Our":[81],"automatically":[83],"discovers":[84],"different":[85],"regions":[86],"present":[87],"in":[88,92],"image":[91,157],"completely":[94],"unsupervised":[95],"fashion.":[96],"We":[97,126,136,160],"attempt":[98],"no":[99],"extraction,":[101],"rather":[103],"use":[104],"discrete":[105],"patch-based":[106],"codebook":[107],"learning":[108],"make":[110],"our":[111,162,174],"probabilistic":[112],"representation":[113],"feasible.":[114],"Each":[115],"latent":[116],"region":[117],"topic":[118],"distribution":[121],"over":[122],"patch":[124],"indices.":[125],"capture":[127],"rough":[128],"layout":[130],"an":[132,138],"MRF":[133],"Potts":[134],"model.":[135],"take":[137],"analysis":[139],"by":[140,165],"synthesis":[141],"approach":[142],"examine":[144],"the":[145],"model,":[146],"provide":[148],"quantitative":[149],"results":[151,167],"on":[152,168],"manually":[154],"labeled":[155],"data":[158],"set.":[159,176],"illustrate":[161],"model's":[163],"robustness":[164],"providing":[166],"highly":[170],"degraded":[171],"version":[172],"test":[175]},"counts_by_year":[{"year":2018,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
