{"id":"https://openalex.org/W2121653205","doi":"https://doi.org/10.1007/s10579-004-1919-1","title":"Pitfalls in Corpus Research","display_name":"Pitfalls in Corpus Research","publication_year":2004,"publication_date":"2004-11-01","ids":{"openalex":"https://openalex.org/W2121653205","doi":"https://doi.org/10.1007/s10579-004-1919-1","mag":"2121653205"},"language":"en","primary_location":{"id":"doi:10.1007/s10579-004-1919-1","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s10579-004-1919-1","pdf_url":null,"source":{"id":"https://openalex.org/S93469583","display_name":"Computers and the Humanities","issn_l":"0010-4817","issn":["0010-4817","1572-8412"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers and the Humanities","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://hdl.handle.net/11858/00-001M-0000-0013-1762-B","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016396474","display_name":"Toni Rietveld","orcid":"https://orcid.org/0000-0003-1867-6706"},"institutions":[{"id":"https://openalex.org/I145872427","display_name":"Radboud University Nijmegen","ror":"https://ror.org/016xsfp80","country_code":"NL","type":"education","lineage":["https://openalex.org/I145872427"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Toni Rietveld","raw_affiliation_strings":["Department of Linguistics, Radboud University Nijmegen, Erasmusplein 1, 6525 HT, Nijmegen, The Netherlands","Department of Linguistics, Radboud University Nijmegen, Nijmegen, The Netherlands"],"affiliations":[{"raw_affiliation_string":"Department of Linguistics, Radboud University Nijmegen, Erasmusplein 1, 6525 HT, Nijmegen, The Netherlands","institution_ids":["https://openalex.org/I145872427"]},{"raw_affiliation_string":"Department of Linguistics, Radboud University Nijmegen, Nijmegen, The Netherlands","institution_ids":["https://openalex.org/I145872427"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070001107","display_name":"Roeland van Hout","orcid":"https://orcid.org/0000-0002-8870-1631"},"institutions":[{"id":"https://openalex.org/I145872427","display_name":"Radboud University Nijmegen","ror":"https://ror.org/016xsfp80","country_code":"NL","type":"education","lineage":["https://openalex.org/I145872427"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Roeland Van hout","raw_affiliation_strings":["Department of Linguistics, Radboud University Nijmegen, Erasmusplein 1, 6525 HT, Nijmegen, The Netherlands","Department of Linguistics, Radboud University Nijmegen, Nijmegen, The Netherlands"],"affiliations":[{"raw_affiliation_string":"Department of Linguistics, Radboud University Nijmegen, Erasmusplein 1, 6525 HT, Nijmegen, The Netherlands","institution_ids":["https://openalex.org/I145872427"]},{"raw_affiliation_string":"Department of Linguistics, Radboud University Nijmegen, Nijmegen, The Netherlands","institution_ids":["https://openalex.org/I145872427"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5091677603","display_name":"Mirjam Ernestus","orcid":"https://orcid.org/0000-0002-1853-0750"},"institutions":[{"id":"https://openalex.org/I4210089003","display_name":"Max Planck Institute for Psycholinguistics","ror":"https://ror.org/00671me87","country_code":"NL","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210089003"]},{"id":"https://openalex.org/I145872427","display_name":"Radboud University Nijmegen","ror":"https://ror.org/016xsfp80","country_code":"NL","type":"education","lineage":["https://openalex.org/I145872427"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Mirjam Ernestus","raw_affiliation_strings":["Department of Linguistics, Radboud University Nijmegen, Erasmusplein 1, 6525 HT, Nijmegen, The Netherlands","Max Planck Institute for Psycholinguistics, The Netherlands","Department of Linguistics, Radboud University Nijmegen, Nijmegen, The Netherlands"],"affiliations":[{"raw_affiliation_string":"Department of Linguistics, Radboud University Nijmegen, Erasmusplein 1, 6525 HT, Nijmegen, The Netherlands","institution_ids":["https://openalex.org/I145872427"]},{"raw_affiliation_string":"Max Planck Institute for Psycholinguistics, The Netherlands","institution_ids":["https://openalex.org/I4210089003"]},{"raw_affiliation_string":"Department of Linguistics, Radboud University Nijmegen, Nijmegen, The Netherlands","institution_ids":["https://openalex.org/I145872427"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5016396474"],"corresponding_institution_ids":["https://openalex.org/I145872427"],"apc_list":null,"apc_paid":null,"fwci":1.4049,"has_fulltext":true,"cited_by_count":17,"citation_normalized_percentile":{"value":0.85710651,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"38","issue":"4","first_page":"343","last_page":"362"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.967199981212616,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9642999768257141,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.7342966794967651},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.6929943561553955},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6267756223678589},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5892402529716492},{"id":"https://openalex.org/keywords/cut-point","display_name":"Cut-point","score":0.5566992163658142},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.523786187171936},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4906562864780426},{"id":"https://openalex.org/keywords/odds","display_name":"Odds","score":0.48470592498779297},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36881256103515625},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.35763853788375854},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.2966506779193878},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.17859649658203125},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.15385061502456665},{"id":"https://openalex.org/keywords/logistic-regression","display_name":"Logistic regression","score":0.10230329632759094}],"concepts":[{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.7342966794967651},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.6929943561553955},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6267756223678589},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5892402529716492},{"id":"https://openalex.org/C2781415353","wikidata":"https://www.wikidata.org/wiki/Q5196602","display_name":"Cut-point","level":2,"score":0.5566992163658142},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.523786187171936},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4906562864780426},{"id":"https://openalex.org/C143095724","wikidata":"https://www.wikidata.org/wiki/Q515895","display_name":"Odds","level":3,"score":0.48470592498779297},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36881256103515625},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.35763853788375854},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.2966506779193878},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.17859649658203125},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.15385061502456665},{"id":"https://openalex.org/C151956035","wikidata":"https://www.wikidata.org/wiki/Q1132755","display_name":"Logistic regression","level":2,"score":0.10230329632759094},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1007/s10579-004-1919-1","is_oa":false,"landing_page_url":"https://doi.org/10.1007/s10579-004-1919-1","pdf_url":null,"source":{"id":"https://openalex.org/S93469583","display_name":"Computers and the Humanities","issn_l":"0010-4817","issn":["0010-4817","1572-8412"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computers and the Humanities","raw_type":"journal-article"},{"id":"pmh:oai:pure.mpg.de:item_57743","is_oa":true,"landing_page_url":"http://hdl.handle.net/11858/00-001M-0000-0013-1762-B","pdf_url":"http://hdl.handle.net/11858/00-001M-0000-0013-1762-B","source":{"id":"https://openalex.org/S4306400654","display_name":"MPG.PuRe (Max Planck Society)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I149899117","host_organization_name":"Max Planck Society","host_organization_lineage":["https://openalex.org/I149899117"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computers and the Humanities","raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:edoc.mpg.de:225796","is_oa":false,"landing_page_url":"http://edoc.mpg.de/225796","pdf_url":null,"source":{"id":"https://openalex.org/S4406922265","display_name":"Max Planck Institute for Plasma Physics","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computers and the Humanities, v.38, 343-362 (2004)","raw_type":"Article"},{"id":"pmh:oai:repository.ubn.ru.nl:2066/61747","is_oa":false,"landing_page_url":"http://hdl.handle.net/2066/61747","pdf_url":null,"source":{"id":"https://openalex.org/S4306401067","display_name":"Radboud Repository (Radboud University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I145872427","host_organization_name":"Radboud University Nijmegen","host_organization_lineage":["https://openalex.org/I145872427"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computers and the Humanities, 38, 4, pp. 343-362","raw_type":"Article / Letter to editor"}],"best_oa_location":{"id":"pmh:oai:pure.mpg.de:item_57743","is_oa":true,"landing_page_url":"http://hdl.handle.net/11858/00-001M-0000-0013-1762-B","pdf_url":"http://hdl.handle.net/11858/00-001M-0000-0013-1762-B","source":{"id":"https://openalex.org/S4306400654","display_name":"MPG.PuRe (Max Planck Society)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I149899117","host_organization_name":"Max Planck Society","host_organization_lineage":["https://openalex.org/I149899117"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computers and the Humanities","raw_type":"info:eu-repo/semantics/article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.5799999833106995}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2121653205.pdf","grobid_xml":"https://content.openalex.org/works/W2121653205.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W567704720","https://openalex.org/W622763911","https://openalex.org/W1501400124","https://openalex.org/W1520252915","https://openalex.org/W1533168323","https://openalex.org/W1536975410","https://openalex.org/W1577099447","https://openalex.org/W1975879668","https://openalex.org/W2016699802","https://openalex.org/W2026622887","https://openalex.org/W2038566047","https://openalex.org/W2044389540","https://openalex.org/W2053154970","https://openalex.org/W2075454710","https://openalex.org/W2076983043","https://openalex.org/W2104626092","https://openalex.org/W2105275276","https://openalex.org/W2115209721","https://openalex.org/W2116780029","https://openalex.org/W2132133133","https://openalex.org/W2133738611","https://openalex.org/W2135157209","https://openalex.org/W2139911629","https://openalex.org/W2153804780","https://openalex.org/W2160837376","https://openalex.org/W2316114989","https://openalex.org/W2472534060","https://openalex.org/W2512537078","https://openalex.org/W2990515966","https://openalex.org/W4211148787","https://openalex.org/W4230581167","https://openalex.org/W4231741839","https://openalex.org/W4235479268","https://openalex.org/W4248694980","https://openalex.org/W4301139280","https://openalex.org/W4360598533","https://openalex.org/W4390911820"],"related_works":["https://openalex.org/W1604849300","https://openalex.org/W4231328776","https://openalex.org/W1604293003","https://openalex.org/W1979850356","https://openalex.org/W3005040438","https://openalex.org/W3132387835","https://openalex.org/W2910024633","https://openalex.org/W1520846789","https://openalex.org/W3124750890","https://openalex.org/W2393365719"],"abstract_inverted_index":null,"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
