{"id":"https://openalex.org/W6948911023","doi":"https://doi.org/10.5281/zenodo.10652309","title":"Early Irish Analogy Dataset for Word Embedding Evaluation","display_name":"Early Irish Analogy Dataset for Word Embedding Evaluation","publication_year":2021,"publication_date":"2021-03-08","ids":{"openalex":"https://openalex.org/W6948911023","doi":"https://doi.org/10.5281/zenodo.10652309"},"language":"en","primary_location":{"id":"doi:10.5281/zenodo.10652309","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.10652309","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"type":"dataset","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.5281/zenodo.10652309","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Dereza, Oksana","orcid":"https://orcid.org/0000-0003-2896-6037"},"institutions":[{"id":"https://openalex.org/I188760350","display_name":"Ollscoil na Gaillimhe \u2013 University of Galway","ror":"https://ror.org/03bea9k73","country_code":"IE","type":"education","lineage":["https://openalex.org/I188760350"]}],"countries":["IE"],"is_corresponding":true,"raw_author_name":"Dereza, Oksana","raw_affiliation_strings":["Ollscoil na Gaillimhe \u2013 University of Galway","Insight SFI Research Centre for Data Analytics"],"raw_orcid":"https://orcid.org/0000-0003-2896-6037","affiliations":[{"raw_affiliation_string":"Ollscoil na Gaillimhe \u2013 University of Galway","institution_ids":["https://openalex.org/I188760350"]},{"raw_affiliation_string":"Insight SFI Research Centre for Data Analytics","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Fransen, Theodorus","orcid":"https://orcid.org/0000-0001-5639-8626"},"institutions":[{"id":"https://openalex.org/I188760350","display_name":"Ollscoil na Gaillimhe \u2013 University of Galway","ror":"https://ror.org/03bea9k73","country_code":"IE","type":"education","lineage":["https://openalex.org/I188760350"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Fransen, Theodorus","raw_affiliation_strings":["Ollscoil na Gaillimhe \u2013 University of Galway","Insight SFI Research Centre for Data Analytics"],"raw_orcid":"https://orcid.org/0000-0001-5639-8626","affiliations":[{"raw_affiliation_string":"Ollscoil na Gaillimhe \u2013 University of Galway","institution_ids":["https://openalex.org/I188760350"]},{"raw_affiliation_string":"Insight SFI Research Centre for Data Analytics","institution_ids":[]}]},{"author_position":"last","author":{"id":null,"display_name":"McCrae, John Philip","orcid":"https://orcid.org/0000-0002-7227-1331"},"institutions":[{"id":"https://openalex.org/I188760350","display_name":"Ollscoil na Gaillimhe \u2013 University of Galway","ror":"https://ror.org/03bea9k73","country_code":"IE","type":"education","lineage":["https://openalex.org/I188760350"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"McCrae, John Philip","raw_affiliation_strings":["Ollscoil na Gaillimhe \u2013 University of Galway","Insight SFI Research Centre for Data Analytics"],"raw_orcid":"https://orcid.org/0000-0002-7227-1331","affiliations":[{"raw_affiliation_string":"Ollscoil na Gaillimhe \u2013 University of Galway","institution_ids":["https://openalex.org/I188760350"]},{"raw_affiliation_string":"Insight SFI Research Centre for Data Analytics","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I188760350"],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":null,"topics":[],"keywords":[{"id":"https://openalex.org/keywords/analogy","display_name":"Analogy","score":0.913100004196167},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.6955000162124634},{"id":"https://openalex.org/keywords/synonym","display_name":"Synonym (taxonomy)","score":0.6158000230789185},{"id":"https://openalex.org/keywords/spelling","display_name":"Spelling","score":0.536300003528595},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.5069000124931335},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.39309999346733093}],"concepts":[{"id":"https://openalex.org/C521332185","wikidata":"https://www.wikidata.org/wiki/Q185816","display_name":"Analogy","level":2,"score":0.913100004196167},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.6955000162124634},{"id":"https://openalex.org/C173483453","wikidata":"https://www.wikidata.org/wiki/Q1040689","display_name":"Synonym (taxonomy)","level":3,"score":0.6158000230789185},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5809999704360962},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5394999980926514},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5389000177383423},{"id":"https://openalex.org/C2777801307","wikidata":"https://www.wikidata.org/wiki/Q2088390","display_name":"Spelling","level":2,"score":0.536300003528595},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.5069000124931335},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.39309999346733093},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.3804999887943268},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.36570000648498535},{"id":"https://openalex.org/C547195049","wikidata":"https://www.wikidata.org/wiki/Q1725664","display_name":"Terminology","level":2,"score":0.3578999936580658},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3303999900817871},{"id":"https://openalex.org/C2780623531","wikidata":"https://www.wikidata.org/wiki/Q9142","display_name":"Irish","level":2,"score":0.30570000410079956},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.2953999936580658},{"id":"https://openalex.org/C159403335","wikidata":"https://www.wikidata.org/wiki/Q207857","display_name":"Inflection","level":2,"score":0.25929999351501465}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5281/zenodo.10652309","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.10652309","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"dataset"}],"best_oa_location":{"id":"doi:10.5281/zenodo.10652309","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.10652309","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"dataset"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"An":[0],"embedding":[1],"evaluation":[2],"dataset":[3,173],"for":[4,23,133],"Early":[5,64],"Irish":[6,65],"described":[7],"in":[8,50,141,177,184],"the":[9,14,17,45,69,92,136,144,157,164,178,185],"paper":[10],"\"Do":[11],"not":[12],"Trust":[13],"Experts:":[15],"How":[16],"Lack":[18],"of":[19,48,57,97,135,156],"Standard":[20],"Complicates":[21],"NLP":[22],"Historical":[24],"Irish\".":[25],"Traditionally,":[26],"analogy":[27,82],"datasets":[28],"are":[29,89,154],"based":[30],"on":[31],"pairwise":[32],"semantic":[33],"proportion,":[34],"and":[35,75,85,121,146,151,166,181],"therefore":[36],"every":[37],"question":[38],"has":[39],"a":[40,54,58,94],"single":[41],"correct":[42,59,78],"answer.":[43],"Given":[44],"high":[46],"level":[47],"variation":[49,87,120,124],"historical":[51,95],"languages,":[52],"such":[53],"strict":[55],"definition":[56],"answer":[60],"seems":[61],"unjustified.":[62],"Therefore,":[63],"Analogy":[66,71],"Dataset":[67],"follows":[68],"Bigger":[70],"Test":[72],"Set":[73],"(BATS)":[74],"provides":[76],"several":[77],"answers":[79],"to":[80,110,117,138],"each":[81,134],"question.":[83],"Morphological":[84],"spelling":[86,119],"data":[88,115],"extracted":[90],"from":[91,126],"eDIL,":[93],"dictionary":[96],"medieval":[98],"Irish.":[99],"Unlike":[100],"BATS,":[101],"no":[102],"distinction":[103],"is":[104],"made":[105],"between":[106],"inflection":[107],"types":[108],"due":[109],"eDIL's":[111],"structure.":[112],"The":[113,149,172],"raw":[114],"amounted":[116],"2,370":[118],"9,690":[122],"morphological":[123],"questions,":[125],"which":[127,189],"150":[128],"examples":[129],"were":[130],"randomly":[131],"selected":[132],"subsets":[137,153],"be":[139],"comparable":[140],"size":[142],"with":[143],"synonym":[145,150,179],"antonym":[147,152,186],"subsets.":[148],"translations":[155],"correspondent":[158],"BATS":[159],"parts":[160],"obtained":[161],"by":[162,168],"reverse-searching":[163],"eDIL":[165],"proofread":[167],"four":[169],"expert":[170],"evaluators.":[171],"includes":[174],"98":[175],"entries":[176,183],"subset":[180],"109":[182],"subset,":[187],"upon":[188],"three":[190],"or":[191],"more":[192],"experts":[193],"agreed.":[194]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
