{"id":"https://openalex.org/W2772508672","doi":"https://doi.org/10.26615/978-954-452-049-6_053","title":"Czech Dataset for Semantic Similarity and Relatedness","display_name":"Czech Dataset for Semantic Similarity and Relatedness","publication_year":2017,"publication_date":"2017-11-10","ids":{"openalex":"https://openalex.org/W2772508672","doi":"https://doi.org/10.26615/978-954-452-049-6_053","mag":"2772508672"},"language":"en","primary_location":{"id":"doi:10.26615/978-954-452-049-6_053","is_oa":true,"landing_page_url":"http://doi.org/10.26615/978-954-452-049-6_053","pdf_url":"https://doi.org/10.26615/978-954-452-049-6_053","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"RANLP 2017 - Recent Advances in Natural Language Processing Meet Deep Learning","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.26615/978-954-452-049-6_053","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041676617","display_name":"Miloslav Konop\u00edk","orcid":"https://orcid.org/0000-0001-7397-1658"},"institutions":[{"id":"https://openalex.org/I92715842","display_name":"University of West Bohemia","ror":"https://ror.org/040t43x18","country_code":"CZ","type":"education","lineage":["https://openalex.org/I92715842"]}],"countries":["CZ"],"is_corresponding":true,"raw_author_name":"Miloslav Konop\u00edk","raw_affiliation_strings":["Faculty of Applied Sciences, University of West Bohemia, Technick\u00e1 8, 306 14 Plze\u0148 Czech Republic","NTIS -New Technologies for the Information Society, Department of Computer Science and Engineering,"],"affiliations":[{"raw_affiliation_string":"Faculty of Applied Sciences, University of West Bohemia, Technick\u00e1 8, 306 14 Plze\u0148 Czech Republic","institution_ids":["https://openalex.org/I92715842"]},{"raw_affiliation_string":"NTIS -New Technologies for the Information Society, Department of Computer Science and Engineering,","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064551686","display_name":"Ond\u0159ej Pra\u017e\u00e1k","orcid":"https://orcid.org/0000-0001-5445-7792"},"institutions":[{"id":"https://openalex.org/I92715842","display_name":"University of West Bohemia","ror":"https://ror.org/040t43x18","country_code":"CZ","type":"education","lineage":["https://openalex.org/I92715842"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"Ond\u0159ej Pra\u017e\u00e1k","raw_affiliation_strings":["NTIS -New Technologies for the Information Society, Department of Computer Science and Engineering,","Faculty of Applied Sciences, University of West Bohemia, Technick\u00e1 8, 306 14 Plze\u0148 Czech Republic"],"affiliations":[{"raw_affiliation_string":"NTIS -New Technologies for the Information Society, Department of Computer Science and Engineering,","institution_ids":[]},{"raw_affiliation_string":"Faculty of Applied Sciences, University of West Bohemia, Technick\u00e1 8, 306 14 Plze\u0148 Czech Republic","institution_ids":["https://openalex.org/I92715842"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021227331","display_name":"David Steinberger","orcid":null},"institutions":[{"id":"https://openalex.org/I92715842","display_name":"University of West Bohemia","ror":"https://ror.org/040t43x18","country_code":"CZ","type":"education","lineage":["https://openalex.org/I92715842"]}],"countries":["CZ"],"is_corresponding":false,"raw_author_name":"David Steinberger","raw_affiliation_strings":["Faculty of Applied Sciences, University of West Bohemia, Technick\u00e1 8, 306 14 Plze\u0148 Czech Republic","NTIS -New Technologies for the Information Society, Department of Computer Science and Engineering,"],"affiliations":[{"raw_affiliation_string":"Faculty of Applied Sciences, University of West Bohemia, Technick\u00e1 8, 306 14 Plze\u0148 Czech Republic","institution_ids":["https://openalex.org/I92715842"]},{"raw_affiliation_string":"NTIS -New Technologies for the Information Society, Department of Computer Science and Engineering,","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5041676617"],"corresponding_institution_ids":["https://openalex.org/I92715842"],"apc_list":null,"apc_paid":null,"fwci":0.39,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.71838471,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"401","last_page":"406"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9927999973297119,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.8335559964179993},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7769979238510132},{"id":"https://openalex.org/keywords/czech","display_name":"Czech","score":0.7602005004882812},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.7105541229248047},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6769651174545288},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.6153366565704346},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.6125960350036621},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6049665212631226},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5231127142906189},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4518555700778961},{"id":"https://openalex.org/keywords/explicit-semantic-analysis","display_name":"Explicit semantic analysis","score":0.4278731346130371},{"id":"https://openalex.org/keywords/semantic-computing","display_name":"Semantic computing","score":0.390536904335022},{"id":"https://openalex.org/keywords/semantic-technology","display_name":"Semantic technology","score":0.24820783734321594},{"id":"https://openalex.org/keywords/semantic-web","display_name":"Semantic Web","score":0.2112414836883545},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11453118920326233},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.1051778495311737}],"concepts":[{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.8335559964179993},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7769979238510132},{"id":"https://openalex.org/C2777842544","wikidata":"https://www.wikidata.org/wiki/Q9056","display_name":"Czech","level":2,"score":0.7602005004882812},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.7105541229248047},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6769651174545288},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.6153366565704346},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.6125960350036621},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6049665212631226},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5231127142906189},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4518555700778961},{"id":"https://openalex.org/C173862523","wikidata":"https://www.wikidata.org/wiki/Q5421270","display_name":"Explicit semantic analysis","level":5,"score":0.4278731346130371},{"id":"https://openalex.org/C511149849","wikidata":"https://www.wikidata.org/wiki/Q7449051","display_name":"Semantic computing","level":3,"score":0.390536904335022},{"id":"https://openalex.org/C6881194","wikidata":"https://www.wikidata.org/wiki/Q7449091","display_name":"Semantic technology","level":4,"score":0.24820783734321594},{"id":"https://openalex.org/C2129575","wikidata":"https://www.wikidata.org/wiki/Q54837","display_name":"Semantic Web","level":2,"score":0.2112414836883545},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11453118920326233},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1051778495311737},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.26615/978-954-452-049-6_053","is_oa":true,"landing_page_url":"http://doi.org/10.26615/978-954-452-049-6_053","pdf_url":"https://doi.org/10.26615/978-954-452-049-6_053","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"RANLP 2017 - Recent Advances in Natural Language Processing Meet Deep Learning","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.26615/978-954-452-049-6_053","is_oa":true,"landing_page_url":"http://doi.org/10.26615/978-954-452-049-6_053","pdf_url":"https://doi.org/10.26615/978-954-452-049-6_053","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"RANLP 2017 - Recent Advances in Natural Language Processing Meet Deep Learning","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2772508672.pdf","grobid_xml":"https://content.openalex.org/works/W2772508672.grobid-xml"},"referenced_works_count":20,"referenced_works":["https://openalex.org/W1552847225","https://openalex.org/W1614298861","https://openalex.org/W1880262756","https://openalex.org/W1964209958","https://openalex.org/W1981617416","https://openalex.org/W2026487812","https://openalex.org/W2080100102","https://openalex.org/W2081580037","https://openalex.org/W2102131037","https://openalex.org/W2112184938","https://openalex.org/W2129773034","https://openalex.org/W2143927888","https://openalex.org/W2250354683","https://openalex.org/W2250539671","https://openalex.org/W2251012068","https://openalex.org/W2404753505","https://openalex.org/W2488809669","https://openalex.org/W2595715041","https://openalex.org/W3216404684","https://openalex.org/W4231510805"],"related_works":["https://openalex.org/W2103835134","https://openalex.org/W1965623300","https://openalex.org/W2359259132","https://openalex.org/W3134365128","https://openalex.org/W3016822073","https://openalex.org/W2774861092","https://openalex.org/W2114077504","https://openalex.org/W2807098362","https://openalex.org/W2156467700","https://openalex.org/W2088504393"],"abstract_inverted_index":{"This":[0],"paper":[1],"introduces":[2],"a":[3],"Czech":[4],"dataset":[5,13,33,63],"for":[6,91],"semantic":[7,10,24,27,93],"similarity":[8,25,94],"and":[9,26,46,95],"relatedness.":[11,96],"The":[12,32,62,70],"contains":[14,34,44],"word":[15,36],"pairs":[16,37],"with":[17,88],"hand":[18],"annotated":[19,65],"scores":[20],"that":[21],"indicate":[22],"the":[23,30,58,76],"relatedness":[28],"of":[29,75],"words.":[31],"953":[35],"compiled":[38],"from":[39,50],"9":[40],"different":[41],"sources.":[42],"It":[43],"words":[45,59],"their":[47],"contexts":[48],"taken":[49],"real":[51],"text":[52],"corpora":[53],"including":[54],"extra":[55],"examples":[56],"when":[57],"are":[60],"ambiguous.":[61],"is":[64,79],"by":[66],"5":[67],"independent":[68],"annotators.":[69],"average":[71],"Spearman":[72],"correlation":[73],"coefficient":[74],"annotation":[77],"agreement":[78],"r":[80],"=":[81],"0.81.":[82],"We":[83],"provide":[84],"reference":[85],"evaluation":[86],"experiments":[87],"several":[89],"methods":[90],"computing":[92]},"counts_by_year":[{"year":2019,"cited_by_count":2}],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2017-12-22T00:00:00"}
