{"id":"https://openalex.org/W2049727745","doi":"https://doi.org/10.1145/1096601.1096608","title":"Enabling massive scale document transformation for the semantic web","display_name":"Enabling massive scale document transformation for the semantic web","publication_year":2005,"publication_date":"2005-11-02","ids":{"openalex":"https://openalex.org/W2049727745","doi":"https://doi.org/10.1145/1096601.1096608","mag":"2049727745"},"language":"en","primary_location":{"id":"doi:10.1145/1096601.1096608","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1096601.1096608","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2005 ACM symposium on Document engineering","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109392109","display_name":"Mark Whiting","orcid":null},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mark A. Whiting","raw_affiliation_strings":["Pacific Northwest National Laboratory, Richland, Washington","[Pacific Northwest National Laboratory, Richland, Washington]"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, Richland, Washington","institution_ids":["https://openalex.org/I142606810"]},{"raw_affiliation_string":"[Pacific Northwest National Laboratory, Richland, Washington]","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007208627","display_name":"Wendy Cowley","orcid":null},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wendy Cowley","raw_affiliation_strings":["Pacific Northwest National Laboratory, Richland, Washington","[Pacific Northwest National Laboratory, Richland, Washington]"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, Richland, Washington","institution_ids":["https://openalex.org/I142606810"]},{"raw_affiliation_string":"[Pacific Northwest National Laboratory, Richland, Washington]","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108524080","display_name":"Nick Cramer","orcid":null},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nick Cramer","raw_affiliation_strings":["Pacific Northwest National Laboratory, Richland, Washington","[Pacific Northwest National Laboratory, Richland, Washington]"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, Richland, Washington","institution_ids":["https://openalex.org/I142606810"]},{"raw_affiliation_string":"[Pacific Northwest National Laboratory, Richland, Washington]","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043555235","display_name":"Alex Gibson","orcid":null},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alex Gibson","raw_affiliation_strings":["Pacific Northwest National Laboratory, Richland, Washington","[Pacific Northwest National Laboratory, Richland, Washington]"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, Richland, Washington","institution_ids":["https://openalex.org/I142606810"]},{"raw_affiliation_string":"[Pacific Northwest National Laboratory, Richland, Washington]","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009074540","display_name":"Ryan E. Hohimer","orcid":null},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ryan Hohimer","raw_affiliation_strings":["Pacific Northwest National Laboratory, Richland, Washington","[Pacific Northwest National Laboratory, Richland, Washington]"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, Richland, Washington","institution_ids":["https://openalex.org/I142606810"]},{"raw_affiliation_string":"[Pacific Northwest National Laboratory, Richland, Washington]","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088932764","display_name":"Ryan Scott","orcid":null},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ryan Scott","raw_affiliation_strings":["Pacific Northwest National Laboratory, Richland, Washington","[Pacific Northwest National Laboratory, Richland, Washington]"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, Richland, Washington","institution_ids":["https://openalex.org/I142606810"]},{"raw_affiliation_string":"[Pacific Northwest National Laboratory, Richland, Washington]","institution_ids":["https://openalex.org/I142606810"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050345737","display_name":"Stephen Tratz","orcid":null},"institutions":[{"id":"https://openalex.org/I142606810","display_name":"Pacific Northwest National Laboratory","ror":"https://ror.org/05h992307","country_code":"US","type":"facility","lineage":["https://openalex.org/I1325736334","https://openalex.org/I1330989302","https://openalex.org/I142606810","https://openalex.org/I39565521"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Stephen Tratz","raw_affiliation_strings":["Pacific Northwest National Laboratory, Richland, Washington","[Pacific Northwest National Laboratory, Richland, Washington]"],"affiliations":[{"raw_affiliation_string":"Pacific Northwest National Laboratory, Richland, Washington","institution_ids":["https://openalex.org/I142606810"]},{"raw_affiliation_string":"[Pacific Northwest National Laboratory, Richland, Washington]","institution_ids":["https://openalex.org/I142606810"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5109392109"],"corresponding_institution_ids":["https://openalex.org/I142606810"],"apc_list":null,"apc_paid":null,"fwci":2.6325,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.90522126,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"23","last_page":"25"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10215","display_name":"Semantic Web and Ontologies","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8463042974472046},{"id":"https://openalex.org/keywords/parsing","display_name":"Parsing","score":0.7300604581832886},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.6492581367492676},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.6221062541007996},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.5220391750335693},{"id":"https://openalex.org/keywords/semantic-web-stack","display_name":"Semantic Web Stack","score":0.5086480379104614},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.4791697561740875},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.43516790866851807},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.31285592913627625}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8463042974472046},{"id":"https://openalex.org/C186644900","wikidata":"https://www.wikidata.org/wiki/Q194152","display_name":"Parsing","level":2,"score":0.7300604581832886},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.6492581367492676},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.6221062541007996},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.5220391750335693},{"id":"https://openalex.org/C167379230","wikidata":"https://www.wikidata.org/wiki/Q1026884","display_name":"Semantic Web Stack","level":3,"score":0.5086480379104614},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.4791697561740875},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.43516790866851807},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.31285592913627625},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1096601.1096608","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1096601.1096608","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2005 ACM symposium on Document engineering","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.47999998927116394,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":6,"referenced_works":["https://openalex.org/W2072607050","https://openalex.org/W2081580037","https://openalex.org/W2145211186","https://openalex.org/W2157695030","https://openalex.org/W2770613891","https://openalex.org/W4247570771"],"related_works":["https://openalex.org/W6643695","https://openalex.org/W4381248170","https://openalex.org/W2366430559","https://openalex.org/W2349698472","https://openalex.org/W3189621521","https://openalex.org/W2173794830","https://openalex.org/W1585941060","https://openalex.org/W2355823470","https://openalex.org/W1985801232","https://openalex.org/W1710908466"],"abstract_inverted_index":{"The":[0],"Universal":[1],"Parsing":[2],"Agent":[3],"(UPA)":[4],"is":[5,51,59],"a":[6],"document":[7],"analysis":[8],"and":[9,35,46,56],"transformation":[10],"program":[11],"that":[12,50,58],"supports":[13],"massive":[14],"scale":[15],"conversion":[16],"of":[17],"information":[18,38,49],"into":[19],"forms":[20],"suitable":[21],"for":[22],"the":[23,48,54],"semantic":[24],"web.":[25],"UPA":[26],"provides":[27],"reusable":[28],"tools":[29],"to":[30],"analyze":[31],"text":[32,41],"documents;":[33],"identify":[34],"extract":[36],"important":[37],"elements;":[39],"enhance":[40],"with":[42],"semantically":[43],"descriptive":[44],"tags;":[45],"output":[47],"needed":[52],"in":[53],"format":[55],"structure":[57],"needed.":[60]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
