{"id":"https://openalex.org/W2075274120","doi":"https://doi.org/10.1145/1860559.1860608","title":"Document conversion for cultural heritage texts","display_name":"Document conversion for cultural heritage texts","publication_year":2010,"publication_date":"2010-09-21","ids":{"openalex":"https://openalex.org/W2075274120","doi":"https://doi.org/10.1145/1860559.1860608","mag":"2075274120"},"language":"en","primary_location":{"id":"doi:10.1145/1860559.1860608","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1860559.1860608","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 10th ACM symposium on Document engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003608009","display_name":"Michael Piotrowski","orcid":"https://orcid.org/0000-0003-3307-5386"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Michael Piotrowski","raw_affiliation_strings":["Law Sources Foundation of the Swiss Lawyers Society, Zurich, Switzerland"],"affiliations":[{"raw_affiliation_string":"Law Sources Foundation of the Swiss Lawyers Society, Zurich, Switzerland","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5003608009"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.0036,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.77158009,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"223","last_page":"226"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13523","display_name":"Mathematics, Computing, and Information Processing","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13523","display_name":"Mathematics, Computing, and Information Processing","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12377","display_name":"Digital Humanities and Scholarship","score":0.991100013256073,"subfield":{"id":"https://openalex.org/subfields/1208","display_name":"Literature and Literary Theory"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.948199987411499,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7956101894378662},{"id":"https://openalex.org/keywords/digitization","display_name":"Digitization","score":0.7642035484313965},{"id":"https://openalex.org/keywords/typeface","display_name":"Typeface","score":0.6754937171936035},{"id":"https://openalex.org/keywords/cultural-heritage","display_name":"Cultural heritage","score":0.6713245511054993},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.569609522819519},{"id":"https://openalex.org/keywords/german","display_name":"German","score":0.5346775054931641},{"id":"https://openalex.org/keywords/optical-character-recognition","display_name":"Optical character recognition","score":0.5278496742248535},{"id":"https://openalex.org/keywords/unicode","display_name":"Unicode","score":0.4653666019439697},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3970421850681305},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.2560885548591614},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.22649496793746948},{"id":"https://openalex.org/keywords/history","display_name":"History","score":0.18493065237998962},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.1815406084060669},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.12357956171035767}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7956101894378662},{"id":"https://openalex.org/C2779308522","wikidata":"https://www.wikidata.org/wiki/Q843958","display_name":"Digitization","level":2,"score":0.7642035484313965},{"id":"https://openalex.org/C80797182","wikidata":"https://www.wikidata.org/wiki/Q17451","display_name":"Typeface","level":2,"score":0.6754937171936035},{"id":"https://openalex.org/C60671577","wikidata":"https://www.wikidata.org/wiki/Q210272","display_name":"Cultural heritage","level":2,"score":0.6713245511054993},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.569609522819519},{"id":"https://openalex.org/C154775046","wikidata":"https://www.wikidata.org/wiki/Q188","display_name":"German","level":2,"score":0.5346775054931641},{"id":"https://openalex.org/C546480517","wikidata":"https://www.wikidata.org/wiki/Q167555","display_name":"Optical character recognition","level":3,"score":0.5278496742248535},{"id":"https://openalex.org/C500551929","wikidata":"https://www.wikidata.org/wiki/Q8819","display_name":"Unicode","level":2,"score":0.4653666019439697},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3970421850681305},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.2560885548591614},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.22649496793746948},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.18493065237998962},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.1815406084060669},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.12357956171035767},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1860559.1860608","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1860559.1860608","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 10th ACM symposium on Document engineering","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7599999904632568,"id":"https://metadata.un.org/sdg/11","display_name":"Sustainable cities and communities"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320421","display_name":"Hort Innovation","ror":"https://ror.org/02h291k47"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W1987223300","https://openalex.org/W2014872868","https://openalex.org/W2016564401","https://openalex.org/W2041904910","https://openalex.org/W2063420976","https://openalex.org/W2072674683","https://openalex.org/W2115815306","https://openalex.org/W7047636377"],"related_works":["https://openalex.org/W2344247273","https://openalex.org/W2780279436","https://openalex.org/W1512334992","https://openalex.org/W2885938417","https://openalex.org/W4290785358","https://openalex.org/W2387970992","https://openalex.org/W2724898345","https://openalex.org/W907309559","https://openalex.org/W2566805851","https://openalex.org/W4310051385"],"abstract_inverted_index":{"Many":[0],"large-scale":[1],"digitization":[2],"projects":[3],"are":[4,121],"currently":[5],"under":[6],"way":[7],"that":[8,61],"intend":[9],"to":[10,33,82,99],"preserve":[11],"the":[12,27,45,54,72,116,119,133,166,172],"cultural":[13],"heritage":[14],"contained":[15],"in":[16,53,96,123,127,136],"paper":[17],"documents":[18],"(in":[19],"particular":[20],"books)":[21],"and":[22,110,126,144,159],"make":[23],"it":[24],"available":[25],"on":[26],"Web.":[28],"Typically":[29],"OCR":[30,69,130,157],"is":[31,131,135],"used":[32],"produce":[34],"searchable":[35],"electronic":[36],"texts":[37],"from":[38,44,156],"books.":[39],"For":[40,59],"newer":[41],"books,":[42],"approximately":[43],"late":[46],"1980s":[47],"onwards,digital":[48],"text":[49,134,154],"may":[50],"already":[51],"exist":[52],"form":[55],"of":[56,66,74,105,108,118,140,148,168,174],"typesetting":[57,75,94,149],"data.":[58],"applications":[60],"require":[62],"a":[63,90,103,163],"higher":[64],"level":[65],"accuracy":[67],"than":[68],"can":[70,77],"deliver,":[71],"conversion":[73,147],"data":[76,95,150],"thus":[78,160],"be":[79],"an":[80],"alternative":[81],"manual":[83],"keying.":[84],"In":[85],"this":[86],"paper,":[87],"we":[88],"describe":[89],"tool":[91],"for":[92,102,165,171],"converting":[93],"FrameMaker":[97],"format":[98],"XHTML+CSS":[100],"developed":[101],"collection":[104],"source":[106],"editions":[107],"medieval":[109],"early":[111],"modern":[112,128],"documents.":[113],"Even":[114],"though":[115],"books":[117],"Collection":[120],"typeset":[122],"good":[124],"quality":[125],"typefaces,":[129],"unusable,since":[132],"various":[137],"historical":[138,175],"forms":[139],"German,":[141],"French,Italian,":[142],"Rhaeto-Romanic,":[143],"Latin.":[145],"The":[146],"produces":[151],"fully":[152],"reliable":[153],"free":[155],"errors":[158],"also":[161],"provides":[162],"basis":[164],"construction":[167],"language":[169],"resources":[170],"processing":[173],"texts.":[176]},"counts_by_year":[{"year":2012,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
