{"id":"https://openalex.org/W2950989492","doi":"https://doi.org/10.18653/v1/p18-2088","title":"A Rank-Based Similarity Metric for Word Embeddings","display_name":"A Rank-Based Similarity Metric for Word Embeddings","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2950989492","doi":"https://doi.org/10.18653/v1/p18-2088","mag":"2950989492"},"language":"en","primary_location":{"id":"doi:10.18653/v1/p18-2088","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p18-2088","pdf_url":"https://www.aclweb.org/anthology/P18-2088.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/P18-2088.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5059288410","display_name":"Enrico Santus","orcid":"https://orcid.org/0000-0002-7327-2731"},"institutions":[{"id":"https://openalex.org/I63966007","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44","country_code":"US","type":"education","lineage":["https://openalex.org/I63966007"]},{"id":"https://openalex.org/I168639165","display_name":"Singapore Institute of Technology","ror":"https://ror.org/01v2c2791","country_code":"SG","type":"education","lineage":["https://openalex.org/I168639165"]}],"countries":["SG","US"],"is_corresponding":true,"raw_author_name":"Enrico Santus","raw_affiliation_strings":["Computer Science and Artificial Intelligence Lab, MIT","Singapore Institute of Technology [Singapore]","Massachusetts Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Computer Science and Artificial Intelligence Lab, MIT","institution_ids":[]},{"raw_affiliation_string":"Singapore Institute of Technology [Singapore]","institution_ids":["https://openalex.org/I168639165"]},{"raw_affiliation_string":"Massachusetts Institute of Technology","institution_ids":["https://openalex.org/I63966007"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100715276","display_name":"Hongmin Wang","orcid":"https://orcid.org/0000-0002-3597-3086"},"institutions":[{"id":"https://openalex.org/I154570441","display_name":"University of California, Santa Barbara","ror":"https://ror.org/02t274463","country_code":"US","type":"education","lineage":["https://openalex.org/I154570441"]},{"id":"https://openalex.org/I168639165","display_name":"Singapore Institute of Technology","ror":"https://ror.org/01v2c2791","country_code":"SG","type":"education","lineage":["https://openalex.org/I168639165"]}],"countries":["SG","US"],"is_corresponding":false,"raw_author_name":"Hongmin Wang","raw_affiliation_strings":["Department of Computer Science, University of California Santa Barbara","University of California [Santa Barbara]","Singapore Institute of Technology [Singapore]"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, University of California Santa Barbara","institution_ids":["https://openalex.org/I154570441"]},{"raw_affiliation_string":"University of California [Santa Barbara]","institution_ids":["https://openalex.org/I154570441"]},{"raw_affiliation_string":"Singapore Institute of Technology [Singapore]","institution_ids":["https://openalex.org/I168639165"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079921667","display_name":"Emmanuele Chersoni","orcid":"https://orcid.org/0000-0001-8742-0451"},"institutions":[{"id":"https://openalex.org/I4210166510","display_name":"Laboratoire Parole et Langage","ror":"https://ror.org/05whq8x35","country_code":"FR","type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I21491767","https://openalex.org/I4210150854","https://openalex.org/I4210166510"]},{"id":"https://openalex.org/I21491767","display_name":"Aix-Marseille Universit\u00e9","ror":"https://ror.org/035xkbk20","country_code":"FR","type":"education","lineage":["https://openalex.org/I21491767"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Emmanuele Chersoni","raw_affiliation_strings":["Aix-Marseille University","Aix Marseille Universit\u00e9","Laboratoire Parole et Langage"],"affiliations":[{"raw_affiliation_string":"Aix-Marseille University","institution_ids":["https://openalex.org/I21491767"]},{"raw_affiliation_string":"Aix Marseille Universit\u00e9","institution_ids":["https://openalex.org/I21491767"]},{"raw_affiliation_string":"Laboratoire Parole et Langage","institution_ids":["https://openalex.org/I4210166510"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100333738","display_name":"Yue Zhang","orcid":"https://orcid.org/0000-0002-6327-5023"},"institutions":[{"id":"https://openalex.org/I152815399","display_name":"Singapore University of Technology and Design","ror":"https://ror.org/05j6fvn87","country_code":"SG","type":"education","lineage":["https://openalex.org/I152815399"]},{"id":"https://openalex.org/I168639165","display_name":"Singapore Institute of Technology","ror":"https://ror.org/01v2c2791","country_code":"SG","type":"education","lineage":["https://openalex.org/I168639165"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Yue Zhang","raw_affiliation_strings":["ISTD, Singapore University of Technology and Design","Singapore Institute of Technology [Singapore]"],"affiliations":[{"raw_affiliation_string":"ISTD, Singapore University of Technology and Design","institution_ids":["https://openalex.org/I152815399"]},{"raw_affiliation_string":"Singapore Institute of Technology [Singapore]","institution_ids":["https://openalex.org/I168639165"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5059288410"],"corresponding_institution_ids":["https://openalex.org/I168639165","https://openalex.org/I63966007"],"apc_list":null,"apc_paid":null,"fwci":1.5202,"has_fulltext":true,"cited_by_count":15,"citation_normalized_percentile":{"value":0.87535544,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"552","last_page":"557"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.7698690891265869},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.7267709374427795},{"id":"https://openalex.org/keywords/cosine-similarity","display_name":"Cosine similarity","score":0.7127366065979004},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6952537894248962},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.6878436207771301},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6445000171661377},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6347962617874146},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5781235098838806},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.5510226488113403},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.4939783215522766},{"id":"https://openalex.org/keywords/outlier","display_name":"Outlier","score":0.47084447741508484},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.44038841128349304},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42250627279281616},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3047615587711334},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.1383594274520874}],"concepts":[{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.7698690891265869},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.7267709374427795},{"id":"https://openalex.org/C2780762811","wikidata":"https://www.wikidata.org/wiki/Q1784941","display_name":"Cosine similarity","level":3,"score":0.7127366065979004},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6952537894248962},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.6878436207771301},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6445000171661377},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6347962617874146},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5781235098838806},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.5510226488113403},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.4939783215522766},{"id":"https://openalex.org/C79337645","wikidata":"https://www.wikidata.org/wiki/Q779824","display_name":"Outlier","level":2,"score":0.47084447741508484},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.44038841128349304},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42250627279281616},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3047615587711334},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.1383594274520874},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/p18-2088","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p18-2088","pdf_url":"https://www.aclweb.org/anthology/P18-2088.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/p18-2088","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/p18-2088","pdf_url":"https://www.aclweb.org/anthology/P18-2088.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320309369","display_name":"Massachusetts Institute of Technology","ror":"https://ror.org/042nb2s44"},{"id":"https://openalex.org/F4320324110","display_name":"Singapore University of Technology and Design","ror":"https://ror.org/05j6fvn87"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2950989492.pdf","grobid_xml":"https://content.openalex.org/works/W2950989492.grobid-xml"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W1614298861","https://openalex.org/W1615991656","https://openalex.org/W1662133657","https://openalex.org/W1854884267","https://openalex.org/W2053921957","https://openalex.org/W2112184938","https://openalex.org/W2170682101","https://openalex.org/W2250539671","https://openalex.org/W2251283399","https://openalex.org/W2251291469","https://openalex.org/W2251803266","https://openalex.org/W2296653400","https://openalex.org/W2328759100","https://openalex.org/W2502814102","https://openalex.org/W2512498397","https://openalex.org/W2518587255","https://openalex.org/W2738438234","https://openalex.org/W2785265351","https://openalex.org/W2949254265","https://openalex.org/W2950577311","https://openalex.org/W2962852556","https://openalex.org/W4293506519","https://openalex.org/W4294170691"],"related_works":["https://openalex.org/W3006513224","https://openalex.org/W2046456988","https://openalex.org/W2357409937","https://openalex.org/W2510582230","https://openalex.org/W2978674666","https://openalex.org/W2074430941","https://openalex.org/W2113096305","https://openalex.org/W1977636359","https://openalex.org/W2772305933","https://openalex.org/W2135511601"],"abstract_inverted_index":{"Word":[0],"Embeddings":[1],"(WE)":[2],"have":[3],"recently":[4],"imposed":[5],"themselves":[6],"as":[7,37],"a":[8,49],"standard":[9],"for":[10,28,52],"representing":[11],"word":[12,19],"meaning":[13],"in":[14,60,66],"NLP.":[15],"Semantic":[16],"similarity":[17,40,61],"between":[18],"pairs":[20],"has":[21],"become":[22],"the":[23,38,67],"most":[24],"common":[25],"evaluation":[26],"benchmark":[27],"these":[29],"representations,":[30],"with":[31,48],"vector":[32,58],"cosine":[33,59],"being":[34],"typically":[35],"used":[36],"only":[39],"metric.":[41],"In":[42],"this":[43],"paper,":[44],"we":[45],"report":[46],"experiments":[47],"rank-based":[50,78],"metric":[51],"WE,":[53],"which":[54],"performs":[55],"comparably":[56],"to":[57],"estimation":[62],"and":[63,69],"outperforms":[64],"it":[65],"recently-introduced":[68],"challenging":[70],"task":[71],"of":[72],"outlier":[73],"detection,":[74],"thus":[75],"suggesting":[76],"that":[77],"measures":[79],"can":[80],"improve":[81],"clustering":[82],"quality.":[83],"1":[84]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2019,"cited_by_count":6}],"updated_date":"2026-03-06T13:50:29.536080","created_date":"2025-10-10T00:00:00"}
