{"id":"https://openalex.org/W2100957046","doi":"https://doi.org/10.1007/978-3-642-15760-8_24","title":"Analysis of Czech Web 1T 5-Gram Corpus and Its Comparison with Czech National Corpus Data","display_name":"Analysis of Czech Web 1T 5-Gram Corpus and Its Comparison with Czech National Corpus Data","publication_year":2010,"publication_date":"2010-01-01","ids":{"openalex":"https://openalex.org/W2100957046","doi":"https://doi.org/10.1007/978-3-642-15760-8_24","mag":"2100957046"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-642-15760-8_24","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-642-15760-8_24","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072709539","display_name":"V\u00e1clav Proch\u00e1zka","orcid":"https://orcid.org/0000-0002-8550-2653"},"institutions":[{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":true,"raw_author_name":"V\u00e1clav Proch\u00e1zka","raw_affiliation_strings":["Dept. of Circuit Theory, Czech Technical University, Technick\u00e1 2, 166 27, Prague, Czech Republic"],"affiliations":[{"raw_affiliation_string":"Dept. of Circuit Theory, Czech Technical University, Technick\u00e1 2, 166 27, Prague, Czech Republic","institution_ids":["https://openalex.org/I44504214"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039450310","display_name":"Petr Poll\u00e1k","orcid":"https://orcid.org/0000-0002-1533-4199"},"institutions":[{"id":"https://openalex.org/I44504214","display_name":"Czech Technical University in Prague","ror":"https://ror.org/03kqpb082","country_code":"CZ","type":"education","lineage":["https://openalex.org/I44504214"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Petr Poll\u00e1k","raw_affiliation_strings":["Dept. of Circuit Theory, Czech Technical University, Technick\u00e1 2, 166 27, Prague, Czech Republic"],"affiliations":[{"raw_affiliation_string":"Dept. of Circuit Theory, Czech Technical University, Technick\u00e1 2, 166 27, Prague, Czech Republic","institution_ids":["https://openalex.org/I44504214"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5072709539"],"corresponding_institution_ids":["https://openalex.org/I44504214"],"apc_list":{"value":5000,"currency":"EUR","value_usd":5392},"apc_paid":null,"fwci":0.5664,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.69142988,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"181","last_page":"188"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9904999732971191,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9904999732971191,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.932699978351593,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/czech","display_name":"Czech","score":0.9428850412368774},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8202573657035828},{"id":"https://openalex.org/keywords/trigram","display_name":"Trigram","score":0.72130286693573},{"id":"https://openalex.org/keywords/n-gram","display_name":"n-gram","score":0.667847216129303},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6303691864013672},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.6101195812225342},{"id":"https://openalex.org/keywords/british-national-corpus","display_name":"British National Corpus","score":0.6004892587661743},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5416373014450073},{"id":"https://openalex.org/keywords/perplexity","display_name":"Perplexity","score":0.5374534726142883},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4516271650791168},{"id":"https://openalex.org/keywords/corpus-linguistics","display_name":"Corpus linguistics","score":0.4380950927734375},{"id":"https://openalex.org/keywords/text-corpus","display_name":"Text corpus","score":0.43542835116386414},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.42938029766082764},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.2950872778892517},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.20838463306427002}],"concepts":[{"id":"https://openalex.org/C2777842544","wikidata":"https://www.wikidata.org/wiki/Q9056","display_name":"Czech","level":2,"score":0.9428850412368774},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8202573657035828},{"id":"https://openalex.org/C137546455","wikidata":"https://www.wikidata.org/wiki/Q3213474","display_name":"Trigram","level":2,"score":0.72130286693573},{"id":"https://openalex.org/C117884012","wikidata":"https://www.wikidata.org/wiki/Q94489","display_name":"n-gram","level":3,"score":0.667847216129303},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6303691864013672},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.6101195812225342},{"id":"https://openalex.org/C2776725116","wikidata":"https://www.wikidata.org/wiki/Q236935","display_name":"British National Corpus","level":2,"score":0.6004892587661743},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5416373014450073},{"id":"https://openalex.org/C100279451","wikidata":"https://www.wikidata.org/wiki/Q372193","display_name":"Perplexity","level":3,"score":0.5374534726142883},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4516271650791168},{"id":"https://openalex.org/C532629269","wikidata":"https://www.wikidata.org/wiki/Q865083","display_name":"Corpus linguistics","level":2,"score":0.4380950927734375},{"id":"https://openalex.org/C2474386","wikidata":"https://www.wikidata.org/wiki/Q461183","display_name":"Text corpus","level":2,"score":0.43542835116386414},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.42938029766082764},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2950872778892517},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.20838463306427002},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/978-3-642-15760-8_24","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-642-15760-8_24","pdf_url":null,"source":{"id":"https://openalex.org/S106296714","display_name":"Lecture notes in computer science","issn_l":"0302-9743","issn":["0302-9743","1611-3349"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Lecture Notes in Computer Science","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.75,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":6,"referenced_works":["https://openalex.org/W153320552","https://openalex.org/W943204654","https://openalex.org/W1575895314","https://openalex.org/W1600529453","https://openalex.org/W2402261002","https://openalex.org/W6624852173"],"related_works":["https://openalex.org/W2053242504","https://openalex.org/W1903115690","https://openalex.org/W2397861987","https://openalex.org/W2126623367","https://openalex.org/W1495755158","https://openalex.org/W2041167939","https://openalex.org/W2106459246","https://openalex.org/W2020757772","https://openalex.org/W2105076537","https://openalex.org/W1577263324"],"abstract_inverted_index":null,"counts_by_year":[{"year":2012,"cited_by_count":1}],"updated_date":"2026-01-15T23:16:33.117629","created_date":"2025-10-10T00:00:00"}
