{"id":"https://openalex.org/W2130050079","doi":"https://doi.org/10.1109/icdar.2007.4378682","title":"Document Content Inventory and Retrieval","display_name":"Document Content Inventory and Retrieval","publication_year":2007,"publication_date":"2007-09-01","ids":{"openalex":"https://openalex.org/W2130050079","doi":"https://doi.org/10.1109/icdar.2007.4378682","mag":"2130050079"},"language":"en","primary_location":{"id":"doi:10.1109/icdar.2007.4378682","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdar.2007.4378682","pdf_url":null,"source":{"id":"https://openalex.org/S4210215987","display_name":"Proceedings of the International Conference on Document Analysis and Recognition","issn_l":"1520-5363","issn":["1520-5363","2379-2140"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Ninth International Conference on Document Analysis and Recognition (ICDAR 2007)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011850885","display_name":"Henry S. Baird","orcid":null},"institutions":[{"id":"https://openalex.org/I186143895","display_name":"Lehigh University","ror":"https://ror.org/012afjb06","country_code":"US","type":"education","lineage":["https://openalex.org/I186143895"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"H. Baird","raw_affiliation_strings":["Computer Science & Engineering Dept, Lehigh University, Bethlehem, PA, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science & Engineering Dept, Lehigh University, Bethlehem, PA, USA","institution_ids":["https://openalex.org/I186143895"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5047573566","display_name":"M. Moll","orcid":"https://orcid.org/0000-0001-7013-9751"},"institutions":[{"id":"https://openalex.org/I186143895","display_name":"Lehigh University","ror":"https://ror.org/012afjb06","country_code":"US","type":"education","lineage":["https://openalex.org/I186143895"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"M. Moll","raw_affiliation_strings":["Computer Science & Engineering Department, Lehigh University, Bethlehem, PA, USA"],"affiliations":[{"raw_affiliation_string":"Computer Science & Engineering Department, Lehigh University, Bethlehem, PA, USA","institution_ids":["https://openalex.org/I186143895"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5011850885"],"corresponding_institution_ids":["https://openalex.org/I186143895"],"apc_list":null,"apc_paid":null,"fwci":2.6422,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.89829545,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"93","last_page":"97"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10601","display_name":"Handwritten Text Recognition Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7379377484321594},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.6523443460464478},{"id":"https://openalex.org/keywords/handwriting","display_name":"Handwriting","score":0.5640600323677063},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5454209446907043},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5292263031005859},{"id":"https://openalex.org/keywords/fraction","display_name":"Fraction (chemistry)","score":0.5128112435340881},{"id":"https://openalex.org/keywords/content","display_name":"Content (measure theory)","score":0.489122211933136},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.47433653473854065},{"id":"https://openalex.org/keywords/content-based-image-retrieval","display_name":"Content-based image retrieval","score":0.4456016421318054},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4442558288574219},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.4398857355117798},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42588481307029724},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2972605228424072},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.24519938230514526}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7379377484321594},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.6523443460464478},{"id":"https://openalex.org/C2779386606","wikidata":"https://www.wikidata.org/wiki/Q2393642","display_name":"Handwriting","level":2,"score":0.5640600323677063},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5454209446907043},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5292263031005859},{"id":"https://openalex.org/C149629883","wikidata":"https://www.wikidata.org/wiki/Q660926","display_name":"Fraction (chemistry)","level":2,"score":0.5128112435340881},{"id":"https://openalex.org/C2778152352","wikidata":"https://www.wikidata.org/wiki/Q5165061","display_name":"Content (measure theory)","level":2,"score":0.489122211933136},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.47433653473854065},{"id":"https://openalex.org/C2780052074","wikidata":"https://www.wikidata.org/wiki/Q1128648","display_name":"Content-based image retrieval","level":4,"score":0.4456016421318054},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4442558288574219},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.4398857355117798},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42588481307029724},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2972605228424072},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.24519938230514526},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icdar.2007.4378682","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icdar.2007.4378682","pdf_url":null,"source":{"id":"https://openalex.org/S4210215987","display_name":"Proceedings of the International Conference on Document Analysis and Recognition","issn_l":"1520-5363","issn":["1520-5363","2379-2140"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Ninth International Conference on Document Analysis and Recognition (ICDAR 2007)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.4300000071525574,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W99136341","https://openalex.org/W195783868","https://openalex.org/W1727881885","https://openalex.org/W1998347547","https://openalex.org/W2098062186","https://openalex.org/W2106215871","https://openalex.org/W2109044256","https://openalex.org/W2124113661","https://openalex.org/W2128119911","https://openalex.org/W2160484851","https://openalex.org/W6604080519"],"related_works":["https://openalex.org/W2900811989","https://openalex.org/W2044706866","https://openalex.org/W2746816529","https://openalex.org/W2341223103","https://openalex.org/W2024252608","https://openalex.org/W2905186525","https://openalex.org/W2031096531","https://openalex.org/W4367727948","https://openalex.org/W3198880640","https://openalex.org/W3017331082"],"abstract_inverted_index":{"We":[0,127],"give":[1],"an":[2,95],"analysis":[3],"of":[4,17,32,88,92,108,115,120,152,159],"relationships":[5],"between":[6],"expected":[7,150],"retrieval":[8,75,111],"performance":[9],"and":[10,22,30,68,110,137,161,179,185],"classification":[11,61,109,142,183],"recognition":[12],"accuracy":[13,184],"in":[14,43,123],"the":[15,106,118,149,157,167],"context":[16],"document":[18,78,124],"image":[19,125],"content":[20,25,60,121,160],"extraction":[21,26],"inventory.":[23],"By":[24],"we":[27,103,133,146],"mean":[28],"location":[29],"measurement":[31],"regions":[33],"containing":[34],"handwriting,":[35],"machine-":[36],"printed":[37],"text,":[38],"photographs,":[39],"blank":[40],"space,":[41],"etc,":[42],"documents":[44],"represented":[45],"as":[46],"bilevel,":[47],"grey-level,":[48],"or":[49],"color":[50],"images.":[51],"Recent":[52],"experiments":[53],"have":[54,104],"shown":[55],"that":[56,82,129],"even":[57],"modest":[58],"per-pixel":[59,141],"accuracies":[62],"can":[63,147],"support":[64],"usefully":[65],"high":[66],"recall":[67,138,180],"precision":[69,136,178],"rates":[70,163],"(of,":[71],"e.g.,":[72],"80-90%)":[73],"for":[74],"queries":[76],"within":[77],"collections":[79],"seeking":[80],"pages":[81],"contain":[83],"a":[84,89,113],"given":[85],"minimum":[86],"fraction":[87],"certain":[90],"type":[91],"content.":[93],"In":[94],"effort":[96],"to":[97,176],"elucidate":[98],"this":[99],"interesting":[100],"empirical":[101],"result,":[102],"analyzed":[105],"interdependency":[107],"under":[112,130],"variety":[114],"assumptions":[116],"about":[117],"distribution":[119,158],"types":[122],"collections.":[126],"show":[128],"general":[131],"conditions":[132],"cannot":[134],"derive":[135],"measures":[139,143,181],"from":[140,182],"alone,":[144],"but":[145],"estimate":[148],"values":[151],"these":[153],"measures.":[154],"If":[155],"however":[156],"error":[162],"are":[164],"uniform":[165],"across":[166],"entire":[168],"collection,":[169],"our":[170],"results":[171],"suggest,":[172],"it":[173],"is":[174],"possible":[175],"predict":[177],"vice":[186],"versa.":[187]},"counts_by_year":[{"year":2015,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2026-03-25T13:04:00.132906","created_date":"2025-10-10T00:00:00"}
