{"id":"https://openalex.org/W4387619785","doi":"https://doi.org/10.15439/2023f6275","title":"Text embeddings and clustering for characterizing online communities on Reddit","display_name":"Text embeddings and clustering for characterizing online communities on Reddit","publication_year":2023,"publication_date":"2023-09-26","ids":{"openalex":"https://openalex.org/W4387619785","doi":"https://doi.org/10.15439/2023f6275"},"language":"en","primary_location":{"id":"doi:10.15439/2023f6275","is_oa":true,"landing_page_url":"http://dx.doi.org/10.15439/2023f6275","pdf_url":"https://annals-csis.org/Volume_35/drp/pdf/6275.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://annals-csis.org/Volume_35/drp/pdf/6275.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014127378","display_name":"Jan Sawicki","orcid":"https://orcid.org/0000-0002-5945-1047"},"institutions":[{"id":"https://openalex.org/I108403487","display_name":"Warsaw University of Technology","ror":"https://ror.org/00y0xnp53","country_code":"PL","type":"education","lineage":["https://openalex.org/I108403487"]}],"countries":["PL"],"is_corresponding":true,"raw_author_name":"Jan Sawicki","raw_affiliation_strings":["Warsaw University of Technology"],"affiliations":[{"raw_affiliation_string":"Warsaw University of Technology","institution_ids":["https://openalex.org/I108403487"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5014127378"],"corresponding_institution_ids":["https://openalex.org/I108403487"],"apc_list":null,"apc_paid":null,"fwci":0.6232,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.67613636,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"35","issue":null,"first_page":"1131","last_page":"1136"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.963100016117096,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.963100016117096,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12592","display_name":"Opinion Dynamics and Social Influence","score":0.9417999982833862,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9247000217437744,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6599072217941284},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6414660215377808},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3648350238800049},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.34501519799232483},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32963213324546814}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6599072217941284},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6414660215377808},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3648350238800049},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.34501519799232483},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32963213324546814}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.15439/2023f6275","is_oa":true,"landing_page_url":"http://dx.doi.org/10.15439/2023f6275","pdf_url":"https://annals-csis.org/Volume_35/drp/pdf/6275.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},{"id":"pmh:oai:doaj.org/article:9c8cfa57b62f4051b0727e92c859ec22","is_oa":true,"landing_page_url":"https://doaj.org/article/9c8cfa57b62f4051b0727e92c859ec22","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Annals of computer science and information systems, Vol 35, Pp 1131-1136 (2023)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.15439/2023f6275","is_oa":true,"landing_page_url":"http://dx.doi.org/10.15439/2023f6275","pdf_url":"https://annals-csis.org/Volume_35/drp/pdf/6275.pdf","source":{"id":"https://openalex.org/S4220651875","display_name":"Annals of Computer Science and Information Systems","issn_l":"2300-5963","issn":["2300-5963"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":"https://openalex.org/P4310317484","host_organization_name":"Polskie Towarzystwo Informatyczne","host_organization_lineage":["https://openalex.org/P4310317484"],"host_organization_lineage_names":["Polskie Towarzystwo Informatyczne"],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Annals of Computer Science and Information Systems","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387619785.pdf","grobid_xml":"https://content.openalex.org/works/W4387619785.grobid-xml"},"referenced_works_count":33,"referenced_works":["https://openalex.org/W1515908375","https://openalex.org/W1597284285","https://openalex.org/W2103115813","https://openalex.org/W2128724692","https://openalex.org/W2131744502","https://openalex.org/W2250539671","https://openalex.org/W2741058728","https://openalex.org/W2777164715","https://openalex.org/W2802772536","https://openalex.org/W2896457183","https://openalex.org/W2938824800","https://openalex.org/W2978017171","https://openalex.org/W3002330681","https://openalex.org/W3011718307","https://openalex.org/W3019913914","https://openalex.org/W3039304003","https://openalex.org/W3048804154","https://openalex.org/W3090527213","https://openalex.org/W3104667152","https://openalex.org/W3113238662","https://openalex.org/W3139580003","https://openalex.org/W3167344319","https://openalex.org/W3175424618","https://openalex.org/W3206629020","https://openalex.org/W4200261147","https://openalex.org/W4224433779","https://openalex.org/W4286900933","https://openalex.org/W4317671147","https://openalex.org/W4380302077","https://openalex.org/W6691431627","https://openalex.org/W6773395774","https://openalex.org/W6774952039","https://openalex.org/W6780099825"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2382290278","https://openalex.org/W2350741829","https://openalex.org/W2130043461","https://openalex.org/W2530322880","https://openalex.org/W1596801655"],"abstract_inverted_index":{"This":[0],"work":[1],"analyses":[2],"Reddit,":[3],"the":[4,10],"largest":[5],"public,":[6],"topiccentered":[7],"social":[8],"forum.In":[9],"experiments,":[11],"contextualized":[12],"text":[13],"embeddings,":[14],"obtained":[15,35],"using":[16,24],"DistilBERT,":[17],"represented":[18],"subreddit":[19],"content.Next,":[20],"clustering":[21,33],"was":[22],"performed,":[23],"an":[25],"unsupervised":[26],"K-means":[27],"algorithm":[28],"and":[29,45],"evaluated":[30],"with":[31],"multiple":[32],"metrics.The":[34],"clusters":[36],"were":[37],"analyzed.Moreover,":[38],"changes":[39],"of":[40],"cluster":[41],"structure,":[42],"between":[43],"2019":[44],"2022":[46],"have":[47],"been":[48],"examined.":[49]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-03-10T14:07:55.174380","created_date":"2025-10-10T00:00:00"}
