{"id":"https://openalex.org/W3091085709","doi":"https://doi.org/10.1145/3406242","title":"Probabilistic Modeling for Frequency Vectors Using a Flexible Shifted-Scaled Dirichlet Distribution Prior","display_name":"Probabilistic Modeling for Frequency Vectors Using a Flexible Shifted-Scaled Dirichlet Distribution Prior","publication_year":2020,"publication_date":"2020-09-28","ids":{"openalex":"https://openalex.org/W3091085709","doi":"https://doi.org/10.1145/3406242","mag":"3091085709"},"language":"en","primary_location":{"id":"doi:10.1145/3406242","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3406242","pdf_url":null,"source":{"id":"https://openalex.org/S41523882","display_name":"ACM Transactions on Knowledge Discovery from Data","issn_l":"1556-4681","issn":["1556-4681","1556-472X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Knowledge Discovery from Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060719711","display_name":"Nuha Zamzami","orcid":"https://orcid.org/0000-0001-9328-9218"},"institutions":[{"id":"https://openalex.org/I4210099699","display_name":"University of Jeddah","ror":"https://ror.org/015ya8798","country_code":"SA","type":"education","lineage":["https://openalex.org/I4210099699"]}],"countries":["SA"],"is_corresponding":true,"raw_author_name":"Nuha Zamzami","raw_affiliation_strings":["Concordia Institute for Information Systems Engineering and Department of Computer Science and Artificial Intelligence, University of Jeddah, Jeddah, Saudi Arabia"],"raw_orcid":"https://orcid.org/0000-0001-9328-9218","affiliations":[{"raw_affiliation_string":"Concordia Institute for Information Systems Engineering and Department of Computer Science and Artificial Intelligence, University of Jeddah, Jeddah, Saudi Arabia","institution_ids":["https://openalex.org/I4210099699"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090600716","display_name":"Nizar Bouguila","orcid":"https://orcid.org/0000-0001-7224-7940"},"institutions":[{"id":"https://openalex.org/I161856759","display_name":"Concordia University","ror":"https://ror.org/01qxhf360","country_code":"US","type":"education","lineage":["https://openalex.org/I161856759"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nizar Bouguila","raw_affiliation_strings":["Concordia Institute for Information Systems Engineering"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Concordia Institute for Information Systems Engineering","institution_ids":["https://openalex.org/I161856759"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5060719711"],"corresponding_institution_ids":["https://openalex.org/I4210099699"],"apc_list":null,"apc_paid":null,"fwci":0.8154,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.79488313,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"14","issue":"6","first_page":"1","last_page":"35"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11980","display_name":"Human Mobility and Location-Based Analysis","score":0.9320999979972839,"subfield":{"id":"https://openalex.org/subfields/3313","display_name":"Transportation"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11819","display_name":"Data-Driven Disease Surveillance","score":0.9194999933242798,"subfield":{"id":"https://openalex.org/subfields/2713","display_name":"Epidemiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dirichlet-distribution","display_name":"Dirichlet distribution","score":0.7112869620323181},{"id":"https://openalex.org/keywords/multinomial-distribution","display_name":"Multinomial distribution","score":0.6793006658554077},{"id":"https://openalex.org/keywords/overdispersion","display_name":"Overdispersion","score":0.6547871828079224},{"id":"https://openalex.org/keywords/categorical-distribution","display_name":"Categorical distribution","score":0.5143757462501526},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4950491487979889},{"id":"https://openalex.org/keywords/count-data","display_name":"Count data","score":0.48484838008880615},{"id":"https://openalex.org/keywords/exponential-family","display_name":"Exponential family","score":0.4684956669807434},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4402257800102234},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.4384923577308655},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.4299231767654419},{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.4127178490161896},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.38652893900871277},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3782516121864319},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34753215312957764},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.297174870967865},{"id":"https://openalex.org/keywords/poisson-distribution","display_name":"Poisson distribution","score":0.28812313079833984},{"id":"https://openalex.org/keywords/bayesian-inference","display_name":"Bayesian inference","score":0.23752981424331665},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.14696693420410156},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.14324212074279785},{"id":"https://openalex.org/keywords/bayesian-hierarchical-modeling","display_name":"Bayesian hierarchical modeling","score":0.10647597908973694}],"concepts":[{"id":"https://openalex.org/C169214877","wikidata":"https://www.wikidata.org/wiki/Q981016","display_name":"Dirichlet distribution","level":3,"score":0.7112869620323181},{"id":"https://openalex.org/C192065140","wikidata":"https://www.wikidata.org/wiki/Q1147928","display_name":"Multinomial distribution","level":2,"score":0.6793006658554077},{"id":"https://openalex.org/C117236510","wikidata":"https://www.wikidata.org/wiki/Q7113620","display_name":"Overdispersion","level":4,"score":0.6547871828079224},{"id":"https://openalex.org/C67926830","wikidata":"https://www.wikidata.org/wiki/Q5051810","display_name":"Categorical distribution","level":5,"score":0.5143757462501526},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4950491487979889},{"id":"https://openalex.org/C33643355","wikidata":"https://www.wikidata.org/wiki/Q5176731","display_name":"Count data","level":3,"score":0.48484838008880615},{"id":"https://openalex.org/C55974624","wikidata":"https://www.wikidata.org/wiki/Q1188504","display_name":"Exponential family","level":2,"score":0.4684956669807434},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4402257800102234},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.4384923577308655},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.4299231767654419},{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.4127178490161896},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.38652893900871277},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3782516121864319},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34753215312957764},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.297174870967865},{"id":"https://openalex.org/C100906024","wikidata":"https://www.wikidata.org/wiki/Q205692","display_name":"Poisson distribution","level":2,"score":0.28812313079833984},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.23752981424331665},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.14696693420410156},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.14324212074279785},{"id":"https://openalex.org/C191413810","wikidata":"https://www.wikidata.org/wiki/Q17100952","display_name":"Bayesian hierarchical modeling","level":4,"score":0.10647597908973694},{"id":"https://openalex.org/C182310444","wikidata":"https://www.wikidata.org/wiki/Q1332643","display_name":"Boundary value problem","level":2,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3406242","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3406242","pdf_url":null,"source":{"id":"https://openalex.org/S41523882","display_name":"ACM Transactions on Knowledge Discovery from Data","issn_l":"1556-4681","issn":["1556-4681","1556-472X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Knowledge Discovery from Data","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.8299999833106995}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":78,"referenced_works":["https://openalex.org/W10916678","https://openalex.org/W170307911","https://openalex.org/W584423923","https://openalex.org/W1482815597","https://openalex.org/W1534506107","https://openalex.org/W1548390947","https://openalex.org/W1574979081","https://openalex.org/W1575363794","https://openalex.org/W1603978410","https://openalex.org/W1953794278","https://openalex.org/W1966829807","https://openalex.org/W1995875735","https://openalex.org/W2006170882","https://openalex.org/W2009156926","https://openalex.org/W2010396133","https://openalex.org/W2015245929","https://openalex.org/W2025653016","https://openalex.org/W2048239613","https://openalex.org/W2048695473","https://openalex.org/W2055337076","https://openalex.org/W2077041217","https://openalex.org/W2078693345","https://openalex.org/W2096765209","https://openalex.org/W2097241944","https://openalex.org/W2104978738","https://openalex.org/W2105101328","https://openalex.org/W2110383222","https://openalex.org/W2113110240","https://openalex.org/W2122361470","https://openalex.org/W2126579184","https://openalex.org/W2135631383","https://openalex.org/W2138092272","https://openalex.org/W2140617711","https://openalex.org/W2143869282","https://openalex.org/W2144244105","https://openalex.org/W2144245426","https://openalex.org/W2146950091","https://openalex.org/W2149197198","https://openalex.org/W2151103935","https://openalex.org/W2153668970","https://openalex.org/W2154468968","https://openalex.org/W2164489414","https://openalex.org/W2259092848","https://openalex.org/W2331518786","https://openalex.org/W2334026559","https://openalex.org/W2492608700","https://openalex.org/W2494311810","https://openalex.org/W2610376375","https://openalex.org/W2613977835","https://openalex.org/W2687551887","https://openalex.org/W2741065173","https://openalex.org/W2756489700","https://openalex.org/W2779931100","https://openalex.org/W2781738159","https://openalex.org/W2807567715","https://openalex.org/W2891273344","https://openalex.org/W2901065680","https://openalex.org/W2904879525","https://openalex.org/W2908844536","https://openalex.org/W2920815048","https://openalex.org/W2921547035","https://openalex.org/W2947566949","https://openalex.org/W2963391384","https://openalex.org/W2963481894","https://openalex.org/W2965887888","https://openalex.org/W2989118260","https://openalex.org/W3003413895","https://openalex.org/W3006840371","https://openalex.org/W3103061166","https://openalex.org/W4231374395","https://openalex.org/W4232080660","https://openalex.org/W4238346259","https://openalex.org/W4239521804","https://openalex.org/W4250453066","https://openalex.org/W4250619709","https://openalex.org/W4322382706","https://openalex.org/W6674201379","https://openalex.org/W6682443497"],"related_works":["https://openalex.org/W3210067883","https://openalex.org/W1998473291","https://openalex.org/W4246387142","https://openalex.org/W2059633033","https://openalex.org/W2726816385","https://openalex.org/W2107302669","https://openalex.org/W4234453013","https://openalex.org/W2141209004","https://openalex.org/W2950696647","https://openalex.org/W4298475239"],"abstract_inverted_index":{"Burstiness":[0],"and":[1,34,72,108,136,175,213,253,274],"overdispersion":[2],"phenomena":[3,53],"of":[4,19,83,147,178,196,200,226,231,250],"count":[5,179],"vectors":[6,29,282],"pose":[7],"significant":[8],"challenges":[9],"in":[10,30,128,132,246,256,297],"modeling":[11,54],"such":[12,241],"data":[13,35],"accurately.":[14],"While":[15],"the":[16,20,43,47,63,84,88,95,99,111,114,121,145,149,161,167,173,190,197,224,227,232,262,287,289,294],"dependency":[17],"assumption":[18],"multinomial":[21,44,50],"distribution":[22,45,60],"causes":[23],"its":[24,70,154,185],"failure":[25],"to":[26,46,78,94,103,143,183,286],"model":[27,100,113],"frequency":[28,281],"several":[31],"machine":[32],"learning":[33,215],"mining":[36],"applications,":[37],"researchers":[38],"found":[39],"that":[40,120,261],"by":[41,152,188],"extending":[42],"Dirichlet":[48,59,85,117],"Compound":[49],"(DCM),":[51],"both":[52],"can":[55],"be":[56],"addressed.":[57],"However,":[58],"is":[61,164,208,220],"not":[62],"best":[64],"choice,":[65],"as":[66,91,193,242],"a":[67,80,92,101,125,194,216,267],"prior,":[68],"given":[69,172],"negative-correlation":[71],"equal-confidence":[73],"requirements.":[74],"Thus,":[75],"we":[76,109,141,181,203],"propose":[77,142,182],"use":[79],"flexible":[81],"generalization":[82],"distribution,":[86,201],"namely,":[87],"shifted-scaled":[89],"Dirichlet,":[90],"prior":[93],"multinomial,":[96],"which":[97,202],"grants":[98],"capability":[102],"better":[104],"fit":[105],"real":[106],"data,":[107],"call":[110,204],"new":[112],"Multinomial":[115],"Shifted-Scaled":[116],"(MSSD).":[118],"Given":[119],"likelihood":[122,134],"function":[123,155,163],"plays":[124],"key":[126],"role":[127],"statistical":[129],"inference,":[130],"e.g.,":[131],"maximum":[133],"estimation":[135,225],"Fisher":[137],"information":[138],"matrix":[139],"investigation,":[140],"improve":[144,184],"efficiency":[146,187],"computing":[148],"MSSD":[150,192],"log-likelihood":[151,162],"approximating":[153,189],"based":[156,209],"on":[157,210],"Bernoulli":[158],"polynomials":[159],"where":[160],"computed":[165],"using":[166],"proposed":[168,233,263],"mesh":[169],"algorithm.":[170],"Moreover,":[171],"sparsity":[174],"high-dimensionality":[176],"nature":[177],"vectors,":[180],"computation":[186],"novel":[191],"member":[195],"exponential":[198],"family":[199],"EMSSD.":[205],"The":[206,229],"clustering":[207,264],"mixture":[211],"models,":[212],"for":[214,280],"model,":[217],"selection":[218],"approach":[219,234],"seamlessly":[221],"integrated":[222],"with":[223],"parameters.":[228],"merits":[230],"are":[235],"validated":[236],"via":[237],"challenging":[238],"real-world":[239],"applications":[240],"hate":[243],"speech":[244],"detection":[245,255],"Twitter,":[247],"real-time":[248],"recognition":[249],"criminal":[251],"action,":[252],"anomaly":[254],"crowded":[257],"scenes.":[258],"Results":[259],"reveal":[260],"frameworks":[265],"offer":[266],"good":[268],"compromise":[269],"between":[270],"other":[271,276],"state-of-the-art":[272],"techniques":[273],"outperform":[275],"approaches":[277],"previously":[278],"used":[279],"modeling.":[283],"Besides,":[284],"comparing":[285],"MSSD,":[288],"approximation":[290],"EMSSD":[291],"has":[292],"reduced":[293],"computational":[295],"complexity":[296],"high-dimensional":[298],"feature":[299],"spaces.":[300]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
