{"id":"https://openalex.org/W1596761147","doi":"https://doi.org/10.1007/3-540-31314-1_50","title":"Evaluating the Performance of Text Mining Systems on Real-world Press Archives","display_name":"Evaluating the Performance of Text Mining Systems on Real-world Press Archives","publication_year":2006,"publication_date":"2006-01-01","ids":{"openalex":"https://openalex.org/W1596761147","doi":"https://doi.org/10.1007/3-540-31314-1_50","mag":"1596761147"},"language":"en","primary_location":{"id":"doi:10.1007/3-540-31314-1_50","is_oa":false,"landing_page_url":"https://doi.org/10.1007/3-540-31314-1_50","pdf_url":null,"source":{"id":"https://openalex.org/S4210194094","display_name":"Studies in classification, data analysis, and knowledge organization","issn_l":"1431-8814","issn":["1431-8814","2198-3321"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Studies in Classification, Data Analysis, and Knowledge Organization","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025445408","display_name":"Gerhard Paa\u00df","orcid":null},"institutions":[{"id":"https://openalex.org/I4210144576","display_name":"Fraunhofer Institute for Intelligent Analysis and Information Systems","ror":"https://ror.org/04nc32781","country_code":"DE","type":"facility","lineage":["https://openalex.org/I4210144576","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Gerhard Paa\u00df","raw_affiliation_strings":["Fraunhofer Institute for Autonomous Intelligent Systems, St. Augustin, Germany"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Fraunhofer Institute for Autonomous Intelligent Systems, St. Augustin, Germany","institution_ids":["https://openalex.org/I4210144576"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007122757","display_name":"Hugo de Vries","orcid":"https://orcid.org/0000-0002-4003-0760"},"institutions":[{"id":"https://openalex.org/I99043593","display_name":"Macquarie University","ror":"https://ror.org/01sf06y89","country_code":"AU","type":"education","lineage":["https://openalex.org/I99043593"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Hugo de Vries","raw_affiliation_strings":["Macquarie University, Sydney, Australia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Macquarie University, Sydney, Australia","institution_ids":["https://openalex.org/I99043593"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.15090161,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"414","last_page":"421"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7492363452911377},{"id":"https://openalex.org/keywords/usability","display_name":"Usability","score":0.6541524529457092},{"id":"https://openalex.org/keywords/argument","display_name":"Argument (complex analysis)","score":0.6275384426116943},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.6053229570388794},{"id":"https://openalex.org/keywords/recall","display_name":"Recall","score":0.5837855339050293},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5814096331596375},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.5754899382591248},{"id":"https://openalex.org/keywords/recall-rate","display_name":"Recall rate","score":0.4447677731513977},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3811763823032379},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3283272981643677},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.28882408142089844},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.08028718829154968}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7492363452911377},{"id":"https://openalex.org/C170130773","wikidata":"https://www.wikidata.org/wiki/Q216378","display_name":"Usability","level":2,"score":0.6541524529457092},{"id":"https://openalex.org/C98184364","wikidata":"https://www.wikidata.org/wiki/Q1780131","display_name":"Argument (complex analysis)","level":2,"score":0.6275384426116943},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.6053229570388794},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.5837855339050293},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5814096331596375},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.5754899382591248},{"id":"https://openalex.org/C2987098735","wikidata":"https://www.wikidata.org/wiki/Q3808900","display_name":"Recall rate","level":2,"score":0.4447677731513977},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3811763823032379},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3283272981643677},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28882408142089844},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.08028718829154968},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1007/3-540-31314-1_50","is_oa":false,"landing_page_url":"https://doi.org/10.1007/3-540-31314-1_50","pdf_url":null,"source":{"id":"https://openalex.org/S4210194094","display_name":"Studies in classification, data analysis, and knowledge organization","issn_l":"1431-8814","issn":["1431-8814","2198-3321"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Studies in Classification, Data Analysis, and Knowledge Organization","raw_type":"book-chapter"},{"id":"pmh:oai:fraunhofer.de:N-38623","is_oa":false,"landing_page_url":"http://publica.fraunhofer.de/documents/N-38623.html","pdf_url":null,"source":{"id":"https://openalex.org/S4306400801","display_name":"Publikationsdatenbank der Fraunhofer-Gesellschaft (Fraunhofer-Gesellschaft)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4923324","host_organization_name":"Fraunhofer-Gesellschaft","host_organization_lineage":["https://openalex.org/I4923324"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Fraunhofer AIS","raw_type":"Conference Paper"},{"id":"pmh:oai:publica.fraunhofer.de:publica/350886","is_oa":false,"landing_page_url":"https://publica.fraunhofer.de/handle/publica/350886","pdf_url":null,"source":{"id":"https://openalex.org/S4306400318","display_name":"Fraunhofer-Publica (Fraunhofer-Gesellschaft)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4923324","host_organization_name":"Fraunhofer-Gesellschaft","host_organization_lineage":["https://openalex.org/I4923324"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"conference paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":3,"referenced_works":["https://openalex.org/W2118020653","https://openalex.org/W2167277498","https://openalex.org/W3123294050"],"related_works":["https://openalex.org/W2358294942","https://openalex.org/W1996359983","https://openalex.org/W2601891598","https://openalex.org/W4367460280","https://openalex.org/W4328049145","https://openalex.org/W2121569490","https://openalex.org/W3214249595","https://openalex.org/W2352065863","https://openalex.org/W4387052059","https://openalex.org/W2011904342"],"abstract_inverted_index":null,"counts_by_year":[{"year":2017,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
