{"id":"https://openalex.org/W4292478702","doi":"https://doi.org/10.3389/frai.2022.948313","title":"Experiments with LDA and Top2Vec for embedded topic discovery on social media data\u2014A case study of cystic fibrosis","display_name":"Experiments with LDA and Top2Vec for embedded topic discovery on social media data\u2014A case study of cystic fibrosis","publication_year":2022,"publication_date":"2022-08-18","ids":{"openalex":"https://openalex.org/W4292478702","doi":"https://doi.org/10.3389/frai.2022.948313","pmid":"https://pubmed.ncbi.nlm.nih.gov/36062265"},"language":"en","primary_location":{"id":"doi:10.3389/frai.2022.948313","is_oa":true,"landing_page_url":"https://doi.org/10.3389/frai.2022.948313","pdf_url":"https://www.frontiersin.org/articles/10.3389/frai.2022.948313/pdf","source":{"id":"https://openalex.org/S4210197006","display_name":"Frontiers in Artificial Intelligence","issn_l":"2624-8212","issn":["2624-8212"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320527","host_organization_name":"Frontiers Media","host_organization_lineage":["https://openalex.org/P4310320527"],"host_organization_lineage_names":["Frontiers Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.frontiersin.org/articles/10.3389/frai.2022.948313/pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036922268","display_name":"Bradley Karas","orcid":"https://orcid.org/0000-0002-4063-1080"},"institutions":[{"id":"https://openalex.org/I1299303238","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238"]},{"id":"https://openalex.org/I4210148682","display_name":"National Center for Advancing Translational Sciences","ror":"https://ror.org/04pw6fb54","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210148682"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bradley Karas","raw_affiliation_strings":["Division of Rare Diseases Research Innovation, National Center for Advancing Translational Sciences (NCATS), National Institutes of Health (NIH), Bethesda, MD, United States"],"affiliations":[{"raw_affiliation_string":"Division of Rare Diseases Research Innovation, National Center for Advancing Translational Sciences (NCATS), National Institutes of Health (NIH), Bethesda, MD, United States","institution_ids":["https://openalex.org/I4210148682","https://openalex.org/I1299303238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028656333","display_name":"Sue Qu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210148682","display_name":"National Center for Advancing Translational Sciences","ror":"https://ror.org/04pw6fb54","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210148682"]},{"id":"https://openalex.org/I1299303238","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sue Qu","raw_affiliation_strings":["Division of Rare Diseases Research Innovation, National Center for Advancing Translational Sciences (NCATS), National Institutes of Health (NIH), Bethesda, MD, United States"],"affiliations":[{"raw_affiliation_string":"Division of Rare Diseases Research Innovation, National Center for Advancing Translational Sciences (NCATS), National Institutes of Health (NIH), Bethesda, MD, United States","institution_ids":["https://openalex.org/I4210148682","https://openalex.org/I1299303238"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004924663","display_name":"Yanji Xu","orcid":"https://orcid.org/0000-0001-8033-3793"},"institutions":[{"id":"https://openalex.org/I1299303238","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238"]},{"id":"https://openalex.org/I4210148682","display_name":"National Center for Advancing Translational Sciences","ror":"https://ror.org/04pw6fb54","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210148682"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yanji Xu","raw_affiliation_strings":["Division of Rare Diseases Research Innovation, National Center for Advancing Translational Sciences (NCATS), National Institutes of Health (NIH), Bethesda, MD, United States"],"affiliations":[{"raw_affiliation_string":"Division of Rare Diseases Research Innovation, National Center for Advancing Translational Sciences (NCATS), National Institutes of Health (NIH), Bethesda, MD, United States","institution_ids":["https://openalex.org/I4210148682","https://openalex.org/I1299303238"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073074181","display_name":"Qian Zhu","orcid":"https://orcid.org/0000-0002-4858-6333"},"institutions":[{"id":"https://openalex.org/I1299303238","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238"]},{"id":"https://openalex.org/I4210148682","display_name":"National Center for Advancing Translational Sciences","ror":"https://ror.org/04pw6fb54","country_code":"US","type":"government","lineage":["https://openalex.org/I1299022934","https://openalex.org/I1299303238","https://openalex.org/I4210148682"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Qian Zhu","raw_affiliation_strings":["Division of Pre-Clinical Innovation, National Center for Advancing Translational Sciences, (NCATS), National Institutes of Health (NIH), Rockville, MD, United States"],"affiliations":[{"raw_affiliation_string":"Division of Pre-Clinical Innovation, National Center for Advancing Translational Sciences, (NCATS), National Institutes of Health (NIH), Rockville, MD, United States","institution_ids":["https://openalex.org/I4210148682","https://openalex.org/I1299303238"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5004924663","https://openalex.org/A5073074181"],"corresponding_institution_ids":["https://openalex.org/I1299303238","https://openalex.org/I4210148682"],"apc_list":{"value":1150,"currency":"USD","value_usd":1150},"apc_paid":{"value":1150,"currency":"USD","value_usd":1150},"fwci":2.776,"has_fulltext":true,"cited_by_count":20,"citation_normalized_percentile":{"value":0.91634046,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"5","issue":null,"first_page":"948313","last_page":"948313"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9925000071525574,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.9908999800682068,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9302999973297119,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.8545604944229126},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.7991747260093689},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.7127661108970642},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6239270567893982},{"id":"https://openalex.org/keywords/readability","display_name":"Readability","score":0.606006920337677},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4846563935279846},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.4755632281303406},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3465002775192261},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.20003372430801392},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14352747797966003}],"concepts":[{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.8545604944229126},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.7991747260093689},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.7127661108970642},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6239270567893982},{"id":"https://openalex.org/C2778143727","wikidata":"https://www.wikidata.org/wiki/Q1820650","display_name":"Readability","level":2,"score":0.606006920337677},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4846563935279846},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4755632281303406},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3465002775192261},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.20003372430801392},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14352747797966003},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.3389/frai.2022.948313","is_oa":true,"landing_page_url":"https://doi.org/10.3389/frai.2022.948313","pdf_url":"https://www.frontiersin.org/articles/10.3389/frai.2022.948313/pdf","source":{"id":"https://openalex.org/S4210197006","display_name":"Frontiers in Artificial Intelligence","issn_l":"2624-8212","issn":["2624-8212"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320527","host_organization_name":"Frontiers Media","host_organization_lineage":["https://openalex.org/P4310320527"],"host_organization_lineage_names":["Frontiers Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence","raw_type":"journal-article"},{"id":"pmid:36062265","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/36062265","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in artificial intelligence","raw_type":null},{"id":"pmh:oai:doaj.org/article:5186662befaf49bcae31550370db8330","is_oa":true,"landing_page_url":"https://doaj.org/article/5186662befaf49bcae31550370db8330","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Frontiers in Artificial Intelligence, Vol 5 (2022)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:9433987","is_oa":true,"landing_page_url":"https://www.ncbi.nlm.nih.gov/pmc/articles/9433987","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Front Artif Intell","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3389/frai.2022.948313","is_oa":true,"landing_page_url":"https://doi.org/10.3389/frai.2022.948313","pdf_url":"https://www.frontiersin.org/articles/10.3389/frai.2022.948313/pdf","source":{"id":"https://openalex.org/S4210197006","display_name":"Frontiers in Artificial Intelligence","issn_l":"2624-8212","issn":["2624-8212"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320527","host_organization_name":"Frontiers Media","host_organization_lineage":["https://openalex.org/P4310320527"],"host_organization_lineage_names":["Frontiers Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.5199999809265137}],"awards":[{"id":"https://openalex.org/G2789588635","display_name":null,"funder_award_id":"NCATS","funder_id":"https://openalex.org/F4320332161","funder_display_name":"National Institutes of Health"}],"funders":[{"id":"https://openalex.org/F4320332161","display_name":"National Institutes of Health","ror":"https://ror.org/01cwqze88"},{"id":"https://openalex.org/F4320337472","display_name":"National Center for Advancing Translational Sciences","ror":"https://ror.org/04pw6fb54"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4292478702.pdf","grobid_xml":"https://content.openalex.org/works/W4292478702.grobid-xml"},"referenced_works_count":37,"referenced_works":["https://openalex.org/W1984251878","https://openalex.org/W2038043464","https://openalex.org/W2106411961","https://openalex.org/W2527330444","https://openalex.org/W2596585349","https://openalex.org/W2607056881","https://openalex.org/W2790855988","https://openalex.org/W2794557536","https://openalex.org/W2803437449","https://openalex.org/W2910136931","https://openalex.org/W2968058920","https://openalex.org/W2970641574","https://openalex.org/W2985790538","https://openalex.org/W2995074753","https://openalex.org/W3038033387","https://openalex.org/W3045065095","https://openalex.org/W3081636963","https://openalex.org/W3100806282","https://openalex.org/W3101884113","https://openalex.org/W3125519889","https://openalex.org/W3194604497","https://openalex.org/W4205267746","https://openalex.org/W4206368408","https://openalex.org/W4220807282","https://openalex.org/W4229011615","https://openalex.org/W4231510805","https://openalex.org/W4287687124","https://openalex.org/W4385245566","https://openalex.org/W6606906144","https://openalex.org/W6636510571","https://openalex.org/W6639619044","https://openalex.org/W6677088747","https://openalex.org/W6684489972","https://openalex.org/W6751854905","https://openalex.org/W6773395774","https://openalex.org/W6803783077","https://openalex.org/W6805401517"],"related_works":["https://openalex.org/W2888805565","https://openalex.org/W4312773271","https://openalex.org/W4315588616","https://openalex.org/W2769501189","https://openalex.org/W2962686197","https://openalex.org/W2207653751","https://openalex.org/W4293863151","https://openalex.org/W3159709618","https://openalex.org/W2611137333","https://openalex.org/W2122605835"],"abstract_inverted_index":{"Social":[0],"media":[1,170,183],"has":[2],"become":[3],"an":[4,95],"important":[5],"resource":[6],"for":[7,44,76,172,176],"discussing,":[8],"sharing,":[9],"and":[10,19,62,110,127,159],"seeking":[11],"information":[12],"pertinent":[13],"to":[14,52,89,150,161],"rare":[15,174],"diseases":[16,175],"by":[17,104],"patients":[18,56],"their":[20],"families,":[21],"given":[22],"the":[23,27,65,78,91,99,113,121,137,143],"low":[24],"prevalence":[25],"in":[26],"extraordinarily":[28],"sparse":[29],"populations.":[30],"In":[31],"our":[32,87,147],"previous":[33,92],"study,":[34],"we":[35,49,59,85,135],"identified":[36],"prevalent":[37],"topics":[38,152],"from":[39,153],"Reddit":[40],"via":[41],"topic":[42,69,81,102],"modeling":[43],"cystic":[45],"fibrosis":[46],"(CF).":[47],"While":[48],"were":[50],"able":[51],"derive/access":[53],"concerns/needs/questions":[54],"of":[55,68,80,97,101,112,132,156,168],"with":[57,64,94,106,116,124,140,165,181],"CF,":[58],"observed":[60],"challenges":[61],"issues":[63],"traditional":[66],"techniques":[67],"modeling,":[70,103],"e.g.,":[71],"Latent":[72],"Dirichlet":[73],"Allocation":[74],"(LDA),":[75],"fulfilling":[77],"task":[79],"extraction.":[82],"Thus,":[83],"here":[84],"present":[86],"experiments":[88],"extend":[90],"study":[93],"aim":[96],"improving":[98],"performance":[100],"experimenting":[105],"LDA":[107],"model":[108,115,139,145,149],"optimization":[109],"examination":[111],"Top2Vec":[114,138],"different":[117],"embedding":[118,144],"models.":[119],"With":[120],"demonstrated":[122],"results":[123],"higher":[125,129],"coherence":[126],"qualitatively":[128],"human":[130],"readability":[131],"derived":[133],"topics,":[134],"implemented":[136],"doc2vec":[141],"as":[142,146],"final":[148],"extract":[151],"a":[154],"subreddit":[155],"CF":[157],"(\"r/CysticFibrosis\")":[158],"proposed":[160],"expand":[162],"its":[163],"use":[164],"other":[166,173],"types":[167],"social":[169,182],"data":[171],"better":[177],"assessing":[178],"patients'":[179],"needs":[180],"data.":[184]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
