{"id":"https://openalex.org/W1971276189","doi":"https://doi.org/10.1162/089120105775299122","title":"Co-occurrence Retrieval: A Flexible Framework for Lexical Distributional Similarity","display_name":"Co-occurrence Retrieval: A Flexible Framework for Lexical Distributional Similarity","publication_year":2005,"publication_date":"2005-12-01","ids":{"openalex":"https://openalex.org/W1971276189","doi":"https://doi.org/10.1162/089120105775299122","mag":"1971276189"},"language":"en","primary_location":{"id":"doi:10.1162/089120105775299122","is_oa":true,"landing_page_url":"https://doi.org/10.1162/089120105775299122","pdf_url":"http://www.mitpressjournals.org/doi/pdf/10.1162/089120105775299122","source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"http://www.mitpressjournals.org/doi/pdf/10.1162/089120105775299122","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016270907","display_name":"Julie Weeds","orcid":"https://orcid.org/0000-0002-3831-4019"},"institutions":[{"id":"https://openalex.org/I162608824","display_name":"University of Sussex","ror":"https://ror.org/00ayhx656","country_code":"GB","type":"education","lineage":["https://openalex.org/I162608824"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Julie Weeds","raw_affiliation_strings":["University of Sussex","University of Sussex ,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Sussex","institution_ids":["https://openalex.org/I162608824"]},{"raw_affiliation_string":"University of Sussex ,","institution_ids":["https://openalex.org/I162608824"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023718997","display_name":"David Weir","orcid":"https://orcid.org/0000-0001-6986-0517"},"institutions":[{"id":"https://openalex.org/I162608824","display_name":"University of Sussex","ror":"https://ror.org/00ayhx656","country_code":"GB","type":"education","lineage":["https://openalex.org/I162608824"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"David Weir","raw_affiliation_strings":["University of Sussex, Department of Informatics, University of Sussex, Falmer, Brighton, BN1 9QH, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Sussex, Department of Informatics, University of Sussex, Falmer, Brighton, BN1 9QH, UK","institution_ids":["https://openalex.org/I162608824"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5016270907"],"corresponding_institution_ids":["https://openalex.org/I162608824"],"apc_list":null,"apc_paid":null,"fwci":18.3773,"has_fulltext":true,"cited_by_count":161,"citation_normalized_percentile":{"value":0.9924,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"31","issue":"4","first_page":"439","last_page":"475"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.7835718393325806},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6928824782371521},{"id":"https://openalex.org/keywords/semantic-similarity","display_name":"Semantic similarity","score":0.6126924157142639},{"id":"https://openalex.org/keywords/analogy","display_name":"Analogy","score":0.5521185398101807},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.5463510155677795},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.5277873873710632},{"id":"https://openalex.org/keywords/salient","display_name":"Salient","score":0.48287418484687805},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.45899680256843567},{"id":"https://openalex.org/keywords/parameterized-complexity","display_name":"Parameterized complexity","score":0.44891342520713806},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4460344612598419},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.43433690071105957},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4308733642101288},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.34306055307388306},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3420202136039734},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.23651331663131714},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.19773852825164795},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.13295534253120422}],"concepts":[{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.7835718393325806},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6928824782371521},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.6126924157142639},{"id":"https://openalex.org/C521332185","wikidata":"https://www.wikidata.org/wiki/Q185816","display_name":"Analogy","level":2,"score":0.5521185398101807},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.5463510155677795},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.5277873873710632},{"id":"https://openalex.org/C2780719617","wikidata":"https://www.wikidata.org/wiki/Q1030752","display_name":"Salient","level":2,"score":0.48287418484687805},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.45899680256843567},{"id":"https://openalex.org/C165464430","wikidata":"https://www.wikidata.org/wiki/Q1570441","display_name":"Parameterized complexity","level":2,"score":0.44891342520713806},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4460344612598419},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.43433690071105957},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4308733642101288},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34306055307388306},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3420202136039734},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.23651331663131714},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.19773852825164795},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.13295534253120422},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1162/089120105775299122","is_oa":true,"landing_page_url":"https://doi.org/10.1162/089120105775299122","pdf_url":"http://www.mitpressjournals.org/doi/pdf/10.1162/089120105775299122","source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.125.1189","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.125.1189","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://acl.ldc.upenn.edu/j/j05/j05-4002.pdf","raw_type":"text"},{"id":"pmh:oai:doaj.org/article:8f1acf5b56c542e7b414e7e29a54376f","is_oa":false,"landing_page_url":"https://doaj.org/article/8f1acf5b56c542e7b414e7e29a54376f","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Computational Linguistics, Vol 31, Iss 4 (2021)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1162/089120105775299122","is_oa":true,"landing_page_url":"https://doi.org/10.1162/089120105775299122","pdf_url":"http://www.mitpressjournals.org/doi/pdf/10.1162/089120105775299122","source":{"id":"https://openalex.org/S155526855","display_name":"Computational Linguistics","issn_l":"0891-2017","issn":["0891-2017","1530-9312"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320244","host_organization_name":"Association for Computational Linguistics","host_organization_lineage":["https://openalex.org/P4310320244"],"host_organization_lineage_names":["Association for Computational Linguistics"],"type":"journal"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Computational Linguistics","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6899999976158142,"display_name":"Quality Education"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W1971276189.pdf","grobid_xml":"https://content.openalex.org/works/W1971276189.grobid-xml"},"referenced_works_count":59,"referenced_works":["https://openalex.org/W125820043","https://openalex.org/W135528467","https://openalex.org/W187228978","https://openalex.org/W332950216","https://openalex.org/W1502523810","https://openalex.org/W1515576489","https://openalex.org/W1516391399","https://openalex.org/W1528321674","https://openalex.org/W1534872089","https://openalex.org/W1554237613","https://openalex.org/W1556966784","https://openalex.org/W1569415500","https://openalex.org/W1572948005","https://openalex.org/W1574901103","https://openalex.org/W1576928919","https://openalex.org/W1593045043","https://openalex.org/W1593239840","https://openalex.org/W1647729745","https://openalex.org/W1677141046","https://openalex.org/W1754931551","https://openalex.org/W1859173823","https://openalex.org/W1956559956","https://openalex.org/W1965555277","https://openalex.org/W1966907789","https://openalex.org/W1979459060","https://openalex.org/W1997841190","https://openalex.org/W2003698958","https://openalex.org/W2006345298","https://openalex.org/W2026338580","https://openalex.org/W2029858480","https://openalex.org/W2035717317","https://openalex.org/W2038721957","https://openalex.org/W2096071381","https://openalex.org/W2099111195","https://openalex.org/W2100377551","https://openalex.org/W2100935296","https://openalex.org/W2101941521","https://openalex.org/W2118996379","https://openalex.org/W2119276288","https://openalex.org/W2119610041","https://openalex.org/W2120084270","https://openalex.org/W2121147707","https://openalex.org/W2121227244","https://openalex.org/W2123084125","https://openalex.org/W2123489126","https://openalex.org/W2127314673","https://openalex.org/W2130337399","https://openalex.org/W2136930489","https://openalex.org/W2149671658","https://openalex.org/W2166776180","https://openalex.org/W2167844361","https://openalex.org/W2397321090","https://openalex.org/W2545480737","https://openalex.org/W2949201587","https://openalex.org/W2979401726","https://openalex.org/W2999729612","https://openalex.org/W3037413987","https://openalex.org/W3128981953","https://openalex.org/W4241850027"],"related_works":["https://openalex.org/W2392206215","https://openalex.org/W2365201483","https://openalex.org/W2355561779","https://openalex.org/W2352407775","https://openalex.org/W2186567693","https://openalex.org/W108701362","https://openalex.org/W2469799552","https://openalex.org/W2768582344","https://openalex.org/W2615704157","https://openalex.org/W2808275385"],"abstract_inverted_index":{"Techniques":[0],"that":[1,289],"exploit":[2],"knowledge":[3],"of":[4,15,35,38,43,46,69,75,79,82,87,114,123,152,156,190,221],"distributional":[5,52,83,89,105,157,184,222,281,320],"similarity":[6,53,90,106,158,192,282],"between":[7],"words":[8,118],"have":[9,91],"been":[10,92],"proposed":[11,93],"in":[12,21,143,218,232,240,312,318],"many":[13,85],"areas":[14],"Natural":[16],"Language":[17],"Processing.":[18],"For":[19],"example,":[20],"language":[22],"modeling,":[23],"the":[24,33,41,66,73,80,112,138,165,171,188,219,230,233,270,273],"sparse":[25],"data":[26],"problem":[27,113],"can":[28,132],"be":[29,57,133,148,200,287,297],"alleviated":[30],"by":[31,135,268],"estimating":[32],"probabilities":[34,42],"unseen":[36],"co-occurrences":[37,45,212],"events":[39],"from":[40,202],"seen":[44],"similar":[47,117],"events.":[48],"In":[49,96,168],"other":[50,279],"applications,":[51],"is":[54,107,119,174,187,225,257,294,306],"taken":[55],"to":[56,60,65,177,199,228,235,259,296,299,308],"an":[58,206,309],"approximation":[59],"semantic":[61],"similarity.":[62,185,321],"However,":[63],"due":[64,307],"wide":[67],"range":[68],"potential":[70],"applications":[71],"and":[72,130,254,315],"lack":[74],"a":[76,99,150],"strict":[77],"definition":[78],"concept":[81],"similarity,":[84],"methods":[86],"calculating":[88,104],"or":[94,195],"adopted.":[95],"this":[97,110,169],"work,":[98],"flexible,":[100],"parameterized":[101],"framework":[102,173,275],"for":[103,127,249],"proposed.":[108],"Within":[109],"framework,":[111],"finding":[115],"distributionally":[116],"cast":[120],"as":[121,205],"one":[122],"co-occurrence":[124,242],"retrieval":[125],"(CR)":[126],"which":[128,236],"precision":[129],"recall":[131],"measured":[134,142],"analogy":[136],"with":[137,161],"way":[139],"they":[140],"are":[141,159,196,210,247],"document":[144],"retrieval.":[145],"As":[146],"will":[147,285],"shown,":[149],"number":[151],"popular":[153],"existing":[154,280],"measures":[155],"simulated":[160],"parameter":[162],"settings":[163],"within":[164,272],"CR":[166,172,274],"framework.":[167],"article,":[170],"then":[175],"used":[176,248],"systematically":[178],"investigate":[179],"three":[180],"fundamental":[181],"questions":[182],"concerning":[183],"First,":[186],"relationship":[189],"lexical":[191,313,319],"necessarily":[193],"symmetric,":[194],"there":[197],"advantages":[198],"gained":[201],"considering":[203],"it":[204,226,284],"asymmetric":[207],"relationship?":[208],"Second,":[209],"some":[211],"inherently":[213],"more":[214],"salient":[215],"than":[216,277],"others":[217],"calculation":[220],"similarity?":[223],"Third,":[224],"necessary":[227],"consider":[229],"difference":[231],"extent":[234],"each":[237,241],"word":[238],"occurs":[239],"type?":[243],"Two":[244],"application-based":[245],"tasks":[246,267],"evaluation:":[250],"automatic":[251],"thesaurus":[252],"generation":[253],"pseudo-disambiguation.":[255],"It":[256],"possible":[258],"achieve":[260],"significantly":[261],"better":[262,301],"results":[263],"on":[264,302],"both":[265,303],"these":[266],"varying":[269],"parameters":[271],"rather":[276],"using":[278],"measures;":[283],"also":[286,317],"shown":[288],"any":[290],"single":[291],"unparameterized":[292],"measure":[293],"unlikely":[295],"able":[298],"do":[300],"tasks.":[304],"This":[305],"inherent":[310],"asymmetry":[311],"substitutability":[314],"therefore":[316]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":7},{"year":2015,"cited_by_count":9},{"year":2014,"cited_by_count":24},{"year":2013,"cited_by_count":9},{"year":2012,"cited_by_count":11}],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
