{"id":"https://openalex.org/W1974924846","doi":"https://doi.org/10.1145/2037342.2037355","title":"Data mining medieval documents by word spotting","display_name":"Data mining medieval documents by word spotting","publication_year":2011,"publication_date":"2011-09-16","ids":{"openalex":"https://openalex.org/W1974924846","doi":"https://doi.org/10.1145/2037342.2037355","mag":"1974924846"},"language":"en","primary_location":{"id":"doi:10.1145/2037342.2037355","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2037342.2037355","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2011 Workshop on Historical Document Imaging and Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://urn.kb.se/resolve?urn=urn:nbn:se:uu:diva-162428","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5068463418","display_name":"Fredrik Wahlberg","orcid":"https://orcid.org/0000-0002-5306-1283"},"institutions":[{"id":"https://openalex.org/I123387679","display_name":"Uppsala University","ror":"https://ror.org/048a87296","country_code":"SE","type":"education","lineage":["https://openalex.org/I123387679"]}],"countries":["SE"],"is_corresponding":true,"raw_author_name":"Fredrik Wahlberg","raw_affiliation_strings":["Uppsala University","Uppsala University ,"],"affiliations":[{"raw_affiliation_string":"Uppsala University","institution_ids":["https://openalex.org/I123387679"]},{"raw_affiliation_string":"Uppsala University ,","institution_ids":["https://openalex.org/I123387679"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059869608","display_name":"Mats Dahll\u00f6f","orcid":"https://orcid.org/0000-0002-4990-7880"},"institutions":[{"id":"https://openalex.org/I123387679","display_name":"Uppsala University","ror":"https://ror.org/048a87296","country_code":"SE","type":"education","lineage":["https://openalex.org/I123387679"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Mats Dahll\u00f6f","raw_affiliation_strings":["Uppsala University","Uppsala University ,"],"affiliations":[{"raw_affiliation_string":"Uppsala University","institution_ids":["https://openalex.org/I123387679"]},{"raw_affiliation_string":"Uppsala University ,","institution_ids":["https://openalex.org/I123387679"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016187942","display_name":"Lasse M\u00e5rtensson","orcid":"https://orcid.org/0000-0001-5072-4961"},"institutions":[{"id":"https://openalex.org/I123387679","display_name":"Uppsala University","ror":"https://ror.org/048a87296","country_code":"SE","type":"education","lineage":["https://openalex.org/I123387679"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Lasse M\u00e5rtensson","raw_affiliation_strings":["Uppsala University","Uppsala University ,"],"affiliations":[{"raw_affiliation_string":"Uppsala University","institution_ids":["https://openalex.org/I123387679"]},{"raw_affiliation_string":"Uppsala University ,","institution_ids":["https://openalex.org/I123387679"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103545657","display_name":"Anders Brun","orcid":null},"institutions":[{"id":"https://openalex.org/I298625061","display_name":"Swedish University of Agricultural Sciences","ror":"https://ror.org/02yy8x990","country_code":"SE","type":"education","lineage":["https://openalex.org/I298625061"]}],"countries":["SE"],"is_corresponding":false,"raw_author_name":"Anders Brun","raw_affiliation_strings":["Swedish University of Agricultural Sciences","Swedish UNiversity of Agricultural Sciences;"],"affiliations":[{"raw_affiliation_string":"Swedish University of Agricultural Sciences","institution_ids":["https://openalex.org/I298625061"]},{"raw_affiliation_string":"Swedish UNiversity of Agricultural Sciences;","institution_ids":["https://openalex.org/I298625061"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5068463418"],"corresponding_institution_ids":["https://openalex.org/I123387679"],"apc_list":null,"apc_paid":null,"fwci":0.8552,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.78437817,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"75","last_page":"82"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9886999726295471,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spotting","display_name":"Spotting","score":0.8907411098480225},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7426961064338684},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.6995170712471008},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5518860220909119},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.425912082195282},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3426026999950409},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.245265930891037}],"concepts":[{"id":"https://openalex.org/C2779506182","wikidata":"https://www.wikidata.org/wiki/Q7580141","display_name":"Spotting","level":2,"score":0.8907411098480225},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7426961064338684},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.6995170712471008},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5518860220909119},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.425912082195282},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3426026999950409},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.245265930891037},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/2037342.2037355","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2037342.2037355","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2011 Workshop on Historical Document Imaging and Processing","raw_type":"proceedings-article"},{"id":"pmh:oai:DiVA.org:uu-162428","is_oa":true,"landing_page_url":"http://urn.kb.se/resolve?urn=urn:nbn:se:uu:diva-162428","pdf_url":null,"source":{"id":"https://openalex.org/S4306401559","display_name":"KTH Publication Database DiVA (KTH Royal Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:DiVA.org:uu-162428","is_oa":true,"landing_page_url":"http://urn.kb.se/resolve?urn=urn:nbn:se:uu:diva-162428","pdf_url":null,"source":{"id":"https://openalex.org/S4306401559","display_name":"KTH Publication Database DiVA (KTH Royal Institute of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7099999785423279}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1500918733","https://openalex.org/W1800355726","https://openalex.org/W1982907973","https://openalex.org/W2019096529","https://openalex.org/W2038576084","https://openalex.org/W2079352267","https://openalex.org/W2097657973","https://openalex.org/W2116604999","https://openalex.org/W2125045217","https://openalex.org/W2133503046","https://openalex.org/W2134097102","https://openalex.org/W2156301828","https://openalex.org/W2564385013","https://openalex.org/W3098821875","https://openalex.org/W4232041434","https://openalex.org/W4238665603","https://openalex.org/W4298103743"],"related_works":["https://openalex.org/W2034439647","https://openalex.org/W4249589822","https://openalex.org/W2103063669","https://openalex.org/W3184921334","https://openalex.org/W4255446307","https://openalex.org/W2033009170","https://openalex.org/W2988098900","https://openalex.org/W4386895402","https://openalex.org/W2028814537","https://openalex.org/W3204019825"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"novel":[3],"results":[4],"for":[5,65],"word":[6,24,36,105,137],"spotting":[7,106],"based":[8],"on":[9,108],"dynamic":[10],"time":[11],"warping":[12],"applied":[13],"to":[14,62],"medieval":[15,110],"manuscripts":[16,111],"in":[17,38,130],"Latin":[18],"and":[19,30,52,133],"Old":[20],"Swedish.":[21],"A":[22],"target":[23],"is":[25,76],"marked":[26],"by":[27,41,124],"a":[28,82,126,131,140],"user,":[29],"the":[31,39,45,73,88,93],"method":[32,48,58,75],"automatically":[33,49],"finds":[34],"similar":[35],"forms":[37],"document":[40],"matching":[42,80],"them":[43],"against":[44],"target.":[46],"The":[47],"identifies":[50],"pages":[51],"lines.":[53],"We":[54,102,116],"show":[55,118],"that":[56,77,87,119],"our":[57,104],"improves":[59],"accuracy":[60],"compared":[61],"earlier":[63],"proposals":[64],"this":[66],"kind":[67],"of":[68,72,91,136,142],"handwriting.":[69],"An":[70],"advantage":[71],"new":[74],"it":[78,120],"performs":[79],"within":[81],"text":[83,94],"line":[84,95],"without":[85],"presupposing":[86],"difficult":[89],"problem":[90],"segmenting":[92],"into":[96],"individual":[97],"words":[98,129],"has":[99],"been":[100],"solved.":[101],"evaluate":[103],"implementation":[107],"two":[109,113],"representing":[112],"script":[114],"types.":[115],"also":[117],"can":[121],"be":[122],"useful":[123],"helping":[125],"user":[127],"find":[128],"manuscript":[132],"present":[134],"graphs":[135],"statistics":[138],"as":[139],"function":[141],"page":[143],"number.":[144]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
