{"id":"https://openalex.org/W3201405160","doi":"https://doi.org/10.1109/access.2021.3112620","title":"Analyzing LDA and NMF Topic Models for Urdu Tweets via Automatic Labeling","display_name":"Analyzing LDA and NMF Topic Models for Urdu Tweets via Automatic Labeling","publication_year":2021,"publication_date":"2021-01-01","ids":{"openalex":"https://openalex.org/W3201405160","doi":"https://doi.org/10.1109/access.2021.3112620","mag":"3201405160"},"language":"en","primary_location":{"id":"doi:10.1109/access.2021.3112620","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3112620","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09536731.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09536731.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003090396","display_name":"Zoya","orcid":null},"institutions":[{"id":"https://openalex.org/I929597975","display_name":"National University of Sciences and Technology","ror":"https://ror.org/03w2j5y17","country_code":"PK","type":"education","lineage":["https://openalex.org/I929597975"]}],"countries":["PK"],"is_corresponding":true,"raw_author_name":"Zoya","raw_affiliation_strings":["School of Electrical Engineering and Computer Science, National University of Sciences and Technology (NUST), Islamabad, Pakistan"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, National University of Sciences and Technology (NUST), Islamabad, Pakistan","institution_ids":["https://openalex.org/I929597975"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024120099","display_name":"Seemab Latif","orcid":"https://orcid.org/0000-0002-5801-1568"},"institutions":[{"id":"https://openalex.org/I929597975","display_name":"National University of Sciences and Technology","ror":"https://ror.org/03w2j5y17","country_code":"PK","type":"education","lineage":["https://openalex.org/I929597975"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Seemab Latif","raw_affiliation_strings":["School of Electrical Engineering and Computer Science, National University of Sciences and Technology (NUST), Islamabad, Pakistan"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, National University of Sciences and Technology (NUST), Islamabad, Pakistan","institution_ids":["https://openalex.org/I929597975"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003304863","display_name":"Faisal Shafait","orcid":"https://orcid.org/0000-0002-0922-0566"},"institutions":[{"id":"https://openalex.org/I929597975","display_name":"National University of Sciences and Technology","ror":"https://ror.org/03w2j5y17","country_code":"PK","type":"education","lineage":["https://openalex.org/I929597975"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Faisal Shafait","raw_affiliation_strings":["School of Electrical Engineering and Computer Science, National University of Sciences and Technology (NUST), Islamabad, Pakistan","School of Electrical Engineering and Computer Science, National University of Sciences and Technology (NUST), Islamabad, Pakistan and Deep Learning Laboratory, National Center of Artificial Intelligence, Islamabad, Pakistan"],"affiliations":[{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, National University of Sciences and Technology (NUST), Islamabad, Pakistan","institution_ids":["https://openalex.org/I929597975"]},{"raw_affiliation_string":"School of Electrical Engineering and Computer Science, National University of Sciences and Technology (NUST), Islamabad, Pakistan and Deep Learning Laboratory, National Center of Artificial Intelligence, Islamabad, Pakistan","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076524479","display_name":"Rabia Latif","orcid":"https://orcid.org/0000-0001-5304-5948"},"institutions":[{"id":"https://openalex.org/I142024983","display_name":"Prince Sultan University","ror":"https://ror.org/053mqrf26","country_code":"SA","type":"education","lineage":["https://openalex.org/I142024983"]}],"countries":["SA"],"is_corresponding":false,"raw_author_name":"Rabia Latif","raw_affiliation_strings":["College of Computer and Information Science, Prince Sultan University, Riyadh, Saudi Arabia"],"affiliations":[{"raw_affiliation_string":"College of Computer and Information Science, Prince Sultan University, Riyadh, Saudi Arabia","institution_ids":["https://openalex.org/I142024983"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5003090396"],"corresponding_institution_ids":["https://openalex.org/I929597975"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":3.8073,"has_fulltext":true,"cited_by_count":42,"citation_normalized_percentile":{"value":0.94443962,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"9","issue":null,"first_page":"127531","last_page":"127547"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.8554243445396423},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8537122011184692},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.7781757116317749},{"id":"https://openalex.org/keywords/probabilistic-latent-semantic-analysis","display_name":"Probabilistic latent semantic analysis","score":0.7237789630889893},{"id":"https://openalex.org/keywords/non-negative-matrix-factorization","display_name":"Non-negative matrix factorization","score":0.6096451282501221},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.6029158234596252},{"id":"https://openalex.org/keywords/latent-semantic-analysis","display_name":"Latent semantic analysis","score":0.5488501191139221},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5112416744232178},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5028418898582458},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.4823433756828308},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.46732771396636963},{"id":"https://openalex.org/keywords/matrix-decomposition","display_name":"Matrix decomposition","score":0.3964790999889374},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3867315649986267},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.11530640721321106}],"concepts":[{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.8554243445396423},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8537122011184692},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.7781757116317749},{"id":"https://openalex.org/C112933361","wikidata":"https://www.wikidata.org/wiki/Q2845258","display_name":"Probabilistic latent semantic analysis","level":2,"score":0.7237789630889893},{"id":"https://openalex.org/C152671427","wikidata":"https://www.wikidata.org/wiki/Q10843505","display_name":"Non-negative matrix factorization","level":4,"score":0.6096451282501221},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.6029158234596252},{"id":"https://openalex.org/C170133592","wikidata":"https://www.wikidata.org/wiki/Q1806883","display_name":"Latent semantic analysis","level":2,"score":0.5488501191139221},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5112416744232178},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5028418898582458},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.4823433756828308},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.46732771396636963},{"id":"https://openalex.org/C42355184","wikidata":"https://www.wikidata.org/wiki/Q1361088","display_name":"Matrix decomposition","level":3,"score":0.3964790999889374},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3867315649986267},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.11530640721321106},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2021.3112620","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3112620","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09536731.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:1639d54853914e2c9b0e08403a5c80bc","is_oa":true,"landing_page_url":"https://doaj.org/article/1639d54853914e2c9b0e08403a5c80bc","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 9, Pp 127531-127547 (2021)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2021.3112620","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2021.3112620","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/09536731.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[{"score":0.47999998927116394,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3201405160.pdf","grobid_xml":"https://content.openalex.org/works/W3201405160.grobid-xml"},"referenced_works_count":71,"referenced_works":["https://openalex.org/W1714665356","https://openalex.org/W1880262756","https://openalex.org/W1902027874","https://openalex.org/W2004192095","https://openalex.org/W2038043464","https://openalex.org/W2043147077","https://openalex.org/W2061922307","https://openalex.org/W2064772995","https://openalex.org/W2097089247","https://openalex.org/W2107743791","https://openalex.org/W2128507180","https://openalex.org/W2129604374","https://openalex.org/W2130339025","https://openalex.org/W2132052677","https://openalex.org/W2147152072","https://openalex.org/W2147946282","https://openalex.org/W2151703435","https://openalex.org/W2158266063","https://openalex.org/W2164777277","https://openalex.org/W2168332560","https://openalex.org/W2178725228","https://openalex.org/W2222893162","https://openalex.org/W2293163851","https://openalex.org/W2328995640","https://openalex.org/W2352369035","https://openalex.org/W2409439155","https://openalex.org/W2507349564","https://openalex.org/W2509601217","https://openalex.org/W2516537890","https://openalex.org/W2522581443","https://openalex.org/W2560103719","https://openalex.org/W2573319818","https://openalex.org/W2574441945","https://openalex.org/W2605183993","https://openalex.org/W2702896255","https://openalex.org/W2737946880","https://openalex.org/W2740139069","https://openalex.org/W2745617509","https://openalex.org/W2763261656","https://openalex.org/W2788615138","https://openalex.org/W2790504398","https://openalex.org/W2790792830","https://openalex.org/W2803437449","https://openalex.org/W2807662642","https://openalex.org/W2856395111","https://openalex.org/W2903016493","https://openalex.org/W2963959132","https://openalex.org/W2969961168","https://openalex.org/W2970397832","https://openalex.org/W3010643076","https://openalex.org/W3023281526","https://openalex.org/W3028873360","https://openalex.org/W3081332416","https://openalex.org/W3138387439","https://openalex.org/W4233135949","https://openalex.org/W4385682194","https://openalex.org/W6639619044","https://openalex.org/W6679076926","https://openalex.org/W6679108089","https://openalex.org/W6679482899","https://openalex.org/W6682044806","https://openalex.org/W6684485952","https://openalex.org/W6689050917","https://openalex.org/W6731664008","https://openalex.org/W6736756693","https://openalex.org/W6742546227","https://openalex.org/W6748613083","https://openalex.org/W6751854905","https://openalex.org/W6753202691","https://openalex.org/W6777012294","https://openalex.org/W6792223450"],"related_works":["https://openalex.org/W1551384396","https://openalex.org/W2251863249","https://openalex.org/W4291700620","https://openalex.org/W2132052677","https://openalex.org/W2921491680","https://openalex.org/W3159709618","https://openalex.org/W2110027950","https://openalex.org/W3046324450","https://openalex.org/W2995939990","https://openalex.org/W4214866631"],"abstract_inverted_index":{"Various":[0],"topic":[1,105,137,182],"modeling":[2,138],"methods":[3],"provide":[4],"a":[5,58,175],"means":[6],"of":[7,44,78,111,116,136,180,193,200,238],"understanding":[8],"and":[9,19,41,51,76,120,122,153,204,220,229,252],"analyzing":[10],"content":[11],"available":[12],"on":[13,125,158,211,222,260,276],"social":[14,81],"media":[15,82],"platforms":[16],"like":[17,139],"Twitter":[18,168],"Facebook":[20],"in":[21,183],"an":[22],"unsupervised":[23],"manner.":[24],"However,":[25],"despite":[26],"several":[27],"existing":[28,90],"conventional":[29,104],"techniques,":[30],"they":[31],"have":[32,189,233],"had":[33],"limited":[34,114],"success":[35],"when":[36],"applied":[37],"directly":[38],"for":[39,86,95],"filtering":[40],"quick":[42],"comprehension":[43],"short-text":[45],"contents":[46],"due":[47,108],"to":[48,61,98,109,177,208],"text":[49,97,192,279],"sparseness":[50],"noise.":[52],"Thus,":[53],"it":[54],"always":[55],"has":[56],"been":[57],"challenging":[59],"problem":[60],"discover":[62],"reliable":[63],"latent":[64],"topics":[65,101],"from":[66],"online":[67],"discussion":[68],"texts":[69],"that":[70,266],"prevailed":[71],"with":[72,103,133,272,284],"low":[73],"words":[74],"co-occurrence":[75],"availability":[77,115],"large":[79,126],"size":[80,127,247],"benchmark":[83,112],"datasets":[84],"even":[85,102],"resource-rich":[87],"languages.":[88],"The":[89],"literature":[91],"lacks":[92],"such":[93],"work":[94,130],"Urdu":[96,161,277],"unveil":[99],"niche":[100],"models":[106],"mainly":[107],"lack":[110],"datasets,":[113],"pre-processing":[117],"tools/":[118],"algorithms,":[119],"time":[121],"compute":[123],"limitations":[124],"datasets.":[128],"This":[129],"presents":[131],"experiments":[132],"multiple":[134,206],"approaches":[135,240],"Latent":[140,145,149],"Semantic":[141,146],"Analysis":[142,147],"(LSA),":[143],"Probabilistic":[144],"(PLSA),":[148],"Dirichlet":[150],"Allocation":[151],"(LDA),":[152],"Non-negative":[154],"Matrix":[155],"Factorization":[156],"(NMF)":[157],"0.8":[159],"million":[160],"tweets.":[162],"These":[163],"tweets":[164,246,278],"are":[165,218],"collected":[166,202],"through":[167,241],"API":[169],"by":[170],"giving":[171,255],"various":[172],"hashtags":[173,253],"as":[174],"query":[176],"avoid":[178],"dominance":[179],"single":[181],"the":[184,191,194,197,201,223,236,270],"dataset.":[185],"In":[186],"addition,":[187],"we":[188],"pre-processed":[190],"tweets,":[195],"prepared":[196],"three":[198],"variants":[199,225],"dataset,":[203],"extracted":[205],"features":[207],"represent":[209],"documents":[210],"different":[212],"n-grams.":[213],"Furthermore,":[214],"all":[215],"these":[216,239],"techniques":[217,271],"compared":[219],"evaluated":[221],"dataset":[224],"using":[226],"both":[227],"qualitative":[228],"quantitative":[230],"measures.":[231],"We":[232],"also":[234],"demonstrated":[235],"results":[237,264],"visualization":[242],"methods,":[243],"graphs":[244],"depicting":[245],"per":[248],"topic,":[249],"word":[250],"clouds,":[251],"analysis":[254],"insights":[256],"about":[257],"algorithms":[258],"performances":[259],"finalized":[261],"topics.":[262],"Observed":[263],"reveal":[265],"NMF":[267],"outperformed":[268],"aa":[269],"TF-IDF":[273],"feature":[274],"vectors":[275],"while":[280],"LDA":[281],"performed":[282],"best":[283],"merging":[285],"shorttext":[286],"strategy":[287],"into":[288],"long":[289],"pseudo":[290],"documents.":[291]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":12},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":12},{"year":2022,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
