{"id":"https://openalex.org/W21004162","doi":"https://doi.org/10.1007/978-3-642-20128-8_6","title":"Measuring the Distance Between Comparable Corpora Between Languages","display_name":"Measuring the Distance Between Comparable Corpora Between Languages","publication_year":2013,"publication_date":"2013-01-01","ids":{"openalex":"https://openalex.org/W21004162","doi":"https://doi.org/10.1007/978-3-642-20128-8_6","mag":"21004162"},"language":"en","primary_location":{"id":"doi:10.1007/978-3-642-20128-8_6","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-642-20128-8_6","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Building and Using Comparable Corpora","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072701587","display_name":"Serge Sharoff","orcid":"https://orcid.org/0000-0002-4877-0210"},"institutions":[{"id":"https://openalex.org/I130828816","display_name":"University of Leeds","ror":"https://ror.org/024mrxd33","country_code":"GB","type":"education","lineage":["https://openalex.org/I130828816"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Serge Sharoff","raw_affiliation_strings":["Centre for Translation Studies, School of Modern Languages, University of Leeds, Woodhouse Lane, Leeds, LS2 9JT, UK","Centre for Translation Studies, School of Modern Languages, University of Leeds, Woodhouse Lane, UK","Centre for Translation Studies, University of Leeds, Leeds, United Kingdom","(University of Leeds"],"affiliations":[{"raw_affiliation_string":"Centre for Translation Studies, School of Modern Languages, University of Leeds, Woodhouse Lane, Leeds, LS2 9JT, UK","institution_ids":["https://openalex.org/I130828816"]},{"raw_affiliation_string":"Centre for Translation Studies, School of Modern Languages, University of Leeds, Woodhouse Lane, UK","institution_ids":["https://openalex.org/I130828816"]},{"raw_affiliation_string":"Centre for Translation Studies, University of Leeds, Leeds, United Kingdom","institution_ids":["https://openalex.org/I130828816"]},{"raw_affiliation_string":"(University of Leeds","institution_ids":["https://openalex.org/I130828816"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5072701587"],"corresponding_institution_ids":["https://openalex.org/I130828816"],"apc_list":null,"apc_paid":null,"fwci":0.3395,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.56240622,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"113","last_page":"130"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7413603067398071},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6648280620574951},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.5642316937446594},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5329222679138184},{"id":"https://openalex.org/keywords/parallel-corpora","display_name":"Parallel corpora","score":0.5319939851760864},{"id":"https://openalex.org/keywords/corpus-linguistics","display_name":"Corpus linguistics","score":0.49103260040283203},{"id":"https://openalex.org/keywords/text-corpus","display_name":"Text corpus","score":0.46340179443359375},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4191456735134125},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.34072357416152954}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7413603067398071},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6648280620574951},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.5642316937446594},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5329222679138184},{"id":"https://openalex.org/C2985367798","wikidata":"https://www.wikidata.org/wiki/Q1346592","display_name":"Parallel corpora","level":3,"score":0.5319939851760864},{"id":"https://openalex.org/C532629269","wikidata":"https://www.wikidata.org/wiki/Q865083","display_name":"Corpus linguistics","level":2,"score":0.49103260040283203},{"id":"https://openalex.org/C2474386","wikidata":"https://www.wikidata.org/wiki/Q461183","display_name":"Text corpus","level":2,"score":0.46340179443359375},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4191456735134125},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.34072357416152954},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/978-3-642-20128-8_6","is_oa":false,"landing_page_url":"https://doi.org/10.1007/978-3-642-20128-8_6","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Building and Using Comparable Corpora","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7900000214576721,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W11511616","https://openalex.org/W14574270","https://openalex.org/W22168010","https://openalex.org/W84079877","https://openalex.org/W229443363","https://openalex.org/W1571785066","https://openalex.org/W1651093245","https://openalex.org/W1880262756","https://openalex.org/W1966343454","https://openalex.org/W2027678432","https://openalex.org/W2087962968","https://openalex.org/W2099857124","https://openalex.org/W2118606687","https://openalex.org/W2144331291","https://openalex.org/W2155870214","https://openalex.org/W2156985047","https://openalex.org/W2159426623","https://openalex.org/W2170571488","https://openalex.org/W2238720809","https://openalex.org/W2550419310","https://openalex.org/W2737323272","https://openalex.org/W3165616014","https://openalex.org/W3197428893"],"related_works":["https://openalex.org/W2375537499","https://openalex.org/W2516977220","https://openalex.org/W3096124370","https://openalex.org/W2794113965","https://openalex.org/W107828926","https://openalex.org/W237928439","https://openalex.org/W2490960622","https://openalex.org/W1891547760","https://openalex.org/W4390840160","https://openalex.org/W2241529223"],"abstract_inverted_index":null,"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2026-01-15T23:16:33.117629","created_date":"2025-10-10T00:00:00"}
