{"id":"https://openalex.org/W2985193030","doi":"https://doi.org/10.18653/v1/d19-5540","title":"No, you\u2019re not alone: A better way to find people with similar experiences on Reddit","display_name":"No, you\u2019re not alone: A better way to find people with similar experiences on Reddit","publication_year":2019,"publication_date":"2019-01-01","ids":{"openalex":"https://openalex.org/W2985193030","doi":"https://doi.org/10.18653/v1/d19-5540","mag":"2985193030"},"language":"en","primary_location":{"id":"doi:10.18653/v1/d19-5540","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/d19-5540","pdf_url":"https://www.aclweb.org/anthology/D19-5540.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 5th Workshop on Noisy User-generated Text (W-NUT 2019)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.aclweb.org/anthology/D19-5540.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101475389","display_name":"Zhilin Wang","orcid":"https://orcid.org/0000-0002-0188-0332"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Zhilin Wang","raw_affiliation_strings":["University of Cambridge, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Cambridge, United Kingdom","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007900374","display_name":"Elena Rastorgueva","orcid":null},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Elena Rastorgueva","raw_affiliation_strings":["University of Cambridge, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Cambridge, United Kingdom","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051401703","display_name":"Weizhe Lin","orcid":"https://orcid.org/0000-0002-0754-4524"},"institutions":[{"id":"https://openalex.org/I241749","display_name":"University of Cambridge","ror":"https://ror.org/013meh722","country_code":"GB","type":"education","lineage":["https://openalex.org/I241749"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Weizhe Lin","raw_affiliation_strings":["University of Cambridge, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Cambridge, United Kingdom","institution_ids":["https://openalex.org/I241749"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057091775","display_name":"Xiaodong Wu","orcid":"https://orcid.org/0000-0003-3545-9930"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiaodong Wu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5007900374"],"corresponding_institution_ids":["https://openalex.org/I241749"],"apc_list":null,"apc_paid":null,"fwci":0.14,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.58208418,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"307","last_page":"315"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12488","display_name":"Mental Health via Writing","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.8426401615142822},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7483876347541809},{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.726813554763794},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.7044514417648315},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.46536707878112793},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.4501023292541504},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.4476177990436554},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.44132405519485474},{"id":"https://openalex.org/keywords/correlation-clustering","display_name":"Correlation clustering","score":0.43976590037345886},{"id":"https://openalex.org/keywords/word2vec","display_name":"Word2vec","score":0.42611658573150635},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41296520829200745},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.32726651430130005}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.8426401615142822},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7483876347541809},{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.726813554763794},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.7044514417648315},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.46536707878112793},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.4501023292541504},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.4476177990436554},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.44132405519485474},{"id":"https://openalex.org/C94641424","wikidata":"https://www.wikidata.org/wiki/Q5172845","display_name":"Correlation clustering","level":3,"score":0.43976590037345886},{"id":"https://openalex.org/C2776461190","wikidata":"https://www.wikidata.org/wiki/Q22673982","display_name":"Word2vec","level":3,"score":0.42611658573150635},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41296520829200745},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32726651430130005},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.18653/v1/d19-5540","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/d19-5540","pdf_url":"https://www.aclweb.org/anthology/D19-5540.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 5th Workshop on Noisy User-generated Text (W-NUT 2019)","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.18653/v1/d19-5540","is_oa":true,"landing_page_url":"https://doi.org/10.18653/v1/d19-5540","pdf_url":"https://www.aclweb.org/anthology/D19-5540.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 5th Workshop on Noisy User-generated Text (W-NUT 2019)","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2985193030.pdf","grobid_xml":"https://content.openalex.org/works/W2985193030.grobid-xml"},"referenced_works_count":21,"referenced_works":["https://openalex.org/W1555398107","https://openalex.org/W1566289585","https://openalex.org/W1880262756","https://openalex.org/W1973871257","https://openalex.org/W2058815839","https://openalex.org/W2059059273","https://openalex.org/W2095881835","https://openalex.org/W2153579005","https://openalex.org/W2160467647","https://openalex.org/W2162833336","https://openalex.org/W2461267643","https://openalex.org/W2752172973","https://openalex.org/W2757194839","https://openalex.org/W2807032982","https://openalex.org/W2896457183","https://openalex.org/W2963341956","https://openalex.org/W2963403868","https://openalex.org/W4231510805","https://openalex.org/W4252386822","https://openalex.org/W4294170691","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W2888805565","https://openalex.org/W4312773271","https://openalex.org/W4315588616","https://openalex.org/W2769501189","https://openalex.org/W2962686197","https://openalex.org/W2207653751","https://openalex.org/W4293863151","https://openalex.org/W3159709618","https://openalex.org/W2611137333","https://openalex.org/W3005513013"],"abstract_inverted_index":{"We":[0,57],"present":[1],"a":[2,42,65,80],"probabilistic":[3,61,87],"clustering":[4,38,62,70,88,123],"algorithm":[5,96],"that":[6,14,59],"can":[7,63],"help":[8],"Reddit":[9],"users":[10],"to":[11,18,48,52,126],"find":[12],"posts":[13,40,105],"discuss":[15],"experiences":[16],"similar":[17],"their":[19],"own.":[20],"This":[21,108],"model":[22,31,118],"is":[23,79,106],"built":[24],"upon":[25],"the":[26,34,53,90,99,110,113,127],"BERT":[27,114,133],"Next":[28,115],"Sentence":[29,116],"Prediction":[30,117],"and":[32,89],"reduces":[33],"time":[35],"complexity":[36],"for":[37,121],"all":[39],"in":[41,97],"corpus":[43],"from":[44],"O(n":[45,93],"2":[46,94],")":[47,95],"O(n)":[49],"with":[50],"respect":[51],"number":[54],"of":[55,83,104,112,131],"posts.":[56],"demonstrate":[58],"such":[60],"yield":[64],"performance":[66],"better":[67],"than":[68],"baseline":[69],"methods":[71],"based":[72],"on":[73],"Latent":[74],"Dirichlet":[75],"Allocation":[76],"Furthermore,":[77],"there":[78],"high":[81,128],"degree":[82],"coherence":[84],"between":[85,101],"our":[86],"exhaustive":[91],"comparison":[92],"which":[98],"similarity":[100],"every":[102],"pair":[103],"found.":[107],"makes":[109],"use":[111],"more":[119],"practical":[120],"unsupervised":[122],"tasks":[124],"due":[125],"runtime":[129],"overhead":[130],"each":[132],"computation.":[134]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
