{"id":"https://openalex.org/W4411207935","doi":"https://doi.org/10.1109/isdfs65363.2025.11012074","title":"dataLDA: Analyzing Data Quality in Big Data Using Traditional Approaches vs. Latent Dirichlet Allocation - Systematic Review","display_name":"dataLDA: Analyzing Data Quality in Big Data Using Traditional Approaches vs. Latent Dirichlet Allocation - Systematic Review","publication_year":2025,"publication_date":"2025-04-24","ids":{"openalex":"https://openalex.org/W4411207935","doi":"https://doi.org/10.1109/isdfs65363.2025.11012074"},"language":"en","primary_location":{"id":"doi:10.1109/isdfs65363.2025.11012074","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isdfs65363.2025.11012074","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 13th International Symposium on Digital Forensics and Security (ISDFS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5093367359","display_name":"Sayed Abu Sayeed","orcid":"https://orcid.org/0009-0003-8524-4046"},"institutions":[{"id":"https://openalex.org/I63772739","display_name":"Florida Atlantic University","ror":"https://ror.org/05p8w6387","country_code":"US","type":"education","lineage":["https://openalex.org/I63772739"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Sayed Abu Sayeed","raw_affiliation_strings":["College of Business, Florida Atlantic University,Boca Raton,FL,USA"],"affiliations":[{"raw_affiliation_string":"College of Business, Florida Atlantic University,Boca Raton,FL,USA","institution_ids":["https://openalex.org/I63772739"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040347462","display_name":"Naresh Kshetri","orcid":"https://orcid.org/0000-0002-3282-7331"},"institutions":[{"id":"https://openalex.org/I155173764","display_name":"Rochester Institute of Technology","ror":"https://ror.org/00v4yb702","country_code":"US","type":"education","lineage":["https://openalex.org/I155173764"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Naresh Kshetri","raw_affiliation_strings":["Rochester Institute of Technology,Department of Cybersecurity,Rochester,NY,USA"],"affiliations":[{"raw_affiliation_string":"Rochester Institute of Technology,Department of Cybersecurity,Rochester,NY,USA","institution_ids":["https://openalex.org/I155173764"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101925336","display_name":"Mir Mehedi Rahman","orcid":"https://orcid.org/0009-0002-7837-8639"},"institutions":[{"id":"https://openalex.org/I93131583","display_name":"Emporia State University","ror":"https://ror.org/04e6r1478","country_code":"US","type":"education","lineage":["https://openalex.org/I93131583"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mir Mehedi Rahman","raw_affiliation_strings":["School of Business &#x0026; Technology, Emporia State University,Emporia,KS,USA"],"affiliations":[{"raw_affiliation_string":"School of Business &#x0026; Technology, Emporia State University,Emporia,KS,USA","institution_ids":["https://openalex.org/I93131583"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004504233","display_name":"S.M. Khorshed Alam","orcid":null},"institutions":[{"id":"https://openalex.org/I83809506","display_name":"University of South Alabama","ror":"https://ror.org/01s7b5y08","country_code":"US","type":"education","lineage":["https://openalex.org/I83809506"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Samiul Alam","raw_affiliation_strings":["School of Computing, University of South Alabama,Mobile,AL,USA"],"affiliations":[{"raw_affiliation_string":"School of Computing, University of South Alabama,Mobile,AL,USA","institution_ids":["https://openalex.org/I83809506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111660059","display_name":"Abdur Rahman","orcid":null},"institutions":[{"id":"https://openalex.org/I93131583","display_name":"Emporia State University","ror":"https://ror.org/04e6r1478","country_code":"US","type":"education","lineage":["https://openalex.org/I93131583"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Abdur Rahman","raw_affiliation_strings":["School of Business &#x0026; Technology, Emporia State University,Emporia,KS,USA"],"affiliations":[{"raw_affiliation_string":"School of Business &#x0026; Technology, Emporia State University,Emporia,KS,USA","institution_ids":["https://openalex.org/I93131583"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5093367359"],"corresponding_institution_ids":["https://openalex.org/I63772739"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21205207,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9228000044822693,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9228000044822693,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.954620361328125},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6605588793754578},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.517799973487854},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4649343192577362},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.45462656021118164},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.45370572805404663},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.4440726637840271},{"id":"https://openalex.org/keywords/dirichlet-distribution","display_name":"Dirichlet distribution","score":0.4107888340950012},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35163694620132446},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2040894627571106},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.09821337461471558}],"concepts":[{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.954620361328125},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6605588793754578},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.517799973487854},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4649343192577362},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.45462656021118164},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.45370572805404663},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.4440726637840271},{"id":"https://openalex.org/C169214877","wikidata":"https://www.wikidata.org/wiki/Q981016","display_name":"Dirichlet distribution","level":3,"score":0.4107888340950012},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35163694620132446},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2040894627571106},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.09821337461471558},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C182310444","wikidata":"https://www.wikidata.org/wiki/Q1332643","display_name":"Boundary value problem","level":2,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/isdfs65363.2025.11012074","is_oa":false,"landing_page_url":"https://doi.org/10.1109/isdfs65363.2025.11012074","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 13th International Symposium on Digital Forensics and Security (ISDFS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2888805565","https://openalex.org/W4312773271","https://openalex.org/W4315588616","https://openalex.org/W2769501189","https://openalex.org/W2962686197","https://openalex.org/W2207653751","https://openalex.org/W4293863151","https://openalex.org/W2497860580","https://openalex.org/W2891616219","https://openalex.org/W3204672119"],"abstract_inverted_index":{"Big":[0],"data":[1,12,27,45,68,81,101,116,163],"quality":[2,46,82,102,117,164],"is":[3,19,92],"all":[4],"about":[5],"ensuring":[6],"that":[7,87],"the":[8,48,58,64,112],"huge":[9],"amounts":[10],"of":[11,50,66],"are":[13,43],"accurate,":[14],"reliable,":[15],"and":[16,37,61,104,125,133,149,169],"useful.":[17],"It":[18],"important":[20],"because":[21],"decisions":[22],"made":[23],"based":[24],"on":[25,115],"this":[26],"can":[28,156],"affect":[29],"many":[30],"things,":[31],"like":[32],"business":[33],"strategies,":[34,166],"customer":[35],"experiences,":[36],"even":[38],"public":[39],"policies.":[40],"Many":[41],"researchers":[42],"studying":[44],"in":[47,75,97,118,141],"context":[49],"big":[51,67,98],"data.":[52],"This":[53,70],"study":[54],"aims":[55],"to":[56,79,160],"analyze":[57],"research":[59,129],"trends":[60,107,132],"patterns":[62],"within":[63],"domain":[65],"quality.":[69],"method":[71],"reveals":[72],"hidden":[73],"themes":[74],"large":[76],"datasets,":[77],"helping":[78],"understand":[80],"better.":[83],"The":[84,128],"findings":[85],"show":[86],"Latent":[88],"Dirichlet":[89],"Allocation":[90],"(LDA)":[91],"effective":[93,134,162],"for":[94],"topic":[95],"modeling":[96],"data,":[99],"highlighting":[100],"challenges":[103],"opportunities.":[105],"Key":[106],"identified":[108,130],"through":[109],"LDA":[110,140],"include":[111],"increasing":[113],"focus":[114],"supply":[119],"chain":[120],"management,":[121],"health":[122],"care":[123],"applications,":[124],"environmental":[126],"science.":[127],"key":[131],"assessment":[135],"methods.":[136],"For":[137],"researchers,":[138],"using":[139],"a":[142],"systematic":[143],"review":[144],"helps":[145],"summarize":[146],"existing":[147],"studies":[148],"find":[150],"gaps,":[151],"guiding":[152],"future":[153],"research.":[154],"Practitioners":[155],"leverage":[157],"these":[158],"insights":[159],"implement":[161],"management":[165],"improving":[167],"efficiency":[168],"decision-making":[170],"across":[171],"various":[172],"industries.":[173]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
