{"id":"https://openalex.org/W2897613601","doi":"https://doi.org/10.1109/ijcnn.2018.8489670","title":"Regularized Maximum-Likelihood Estimation of Mixture-of-Experts for Regression and Clustering","display_name":"Regularized Maximum-Likelihood Estimation of Mixture-of-Experts for Regression and Clustering","publication_year":2018,"publication_date":"2018-07-01","ids":{"openalex":"https://openalex.org/W2897613601","doi":"https://doi.org/10.1109/ijcnn.2018.8489670","mag":"2897613601"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn.2018.8489670","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2018.8489670","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020695688","display_name":"Fa\u00efcel Chamroukhi","orcid":"https://orcid.org/0000-0002-5894-3103"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I98702875","display_name":"Universit\u00e9 de Caen Normandie","ror":"https://ror.org/051kpcy16","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210105918","https://openalex.org/I98702875"]},{"id":"https://openalex.org/I4210105918","display_name":"Normandie Universit\u00e9","ror":"https://ror.org/01k40cz91","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210105918"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Faicel Chamroukhi","raw_affiliation_strings":["Normandie Univ, UNICAEN, CNRS, LMNO, Caen, France"],"affiliations":[{"raw_affiliation_string":"Normandie Univ, UNICAEN, CNRS, LMNO, Caen, France","institution_ids":["https://openalex.org/I98702875","https://openalex.org/I4210105918","https://openalex.org/I1294671590"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5010674359","display_name":"Bao Huynh","orcid":"https://orcid.org/0000-0002-1882-6877"},"institutions":[{"id":"https://openalex.org/I4210105918","display_name":"Normandie Universit\u00e9","ror":"https://ror.org/01k40cz91","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210105918"]},{"id":"https://openalex.org/I98702875","display_name":"Universit\u00e9 de Caen Normandie","ror":"https://ror.org/051kpcy16","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210105918","https://openalex.org/I98702875"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1294671590"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Bao Tuyen Huynh","raw_affiliation_strings":["Normandie Univ, UNICAEN, CNRS, LMNO, Caen, France"],"affiliations":[{"raw_affiliation_string":"Normandie Univ, UNICAEN, CNRS, LMNO, Caen, France","institution_ids":["https://openalex.org/I98702875","https://openalex.org/I4210105918","https://openalex.org/I1294671590"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5020695688"],"corresponding_institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I4210105918","https://openalex.org/I98702875"],"apc_list":null,"apc_paid":null,"fwci":0.3258,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.68122819,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10136","display_name":"Statistical Methods and Inference","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10243","display_name":"Statistical Methods and Bayesian Inference","score":0.9879000186920166,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7048649191856384},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6463800072669983},{"id":"https://openalex.org/keywords/regularization","display_name":"Regularization (linguistics)","score":0.5256170630455017},{"id":"https://openalex.org/keywords/feature-selection","display_name":"Feature selection","score":0.45754262804985046},{"id":"https://openalex.org/keywords/regression-analysis","display_name":"Regression analysis","score":0.448175311088562},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44709864258766174},{"id":"https://openalex.org/keywords/regression","display_name":"Regression","score":0.43977272510528564},{"id":"https://openalex.org/keywords/coordinate-descent","display_name":"Coordinate descent","score":0.4250290095806122},{"id":"https://openalex.org/keywords/model-selection","display_name":"Model selection","score":0.42343753576278687},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.4148474633693695},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3622870147228241},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3490695357322693},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32414454221725464},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2667893171310425},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.12795960903167725}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7048649191856384},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6463800072669983},{"id":"https://openalex.org/C2776135515","wikidata":"https://www.wikidata.org/wiki/Q17143721","display_name":"Regularization (linguistics)","level":2,"score":0.5256170630455017},{"id":"https://openalex.org/C148483581","wikidata":"https://www.wikidata.org/wiki/Q446488","display_name":"Feature selection","level":2,"score":0.45754262804985046},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.448175311088562},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44709864258766174},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.43977272510528564},{"id":"https://openalex.org/C157553263","wikidata":"https://www.wikidata.org/wiki/Q5168004","display_name":"Coordinate descent","level":2,"score":0.4250290095806122},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.42343753576278687},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.4148474633693695},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3622870147228241},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3490695357322693},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32414454221725464},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2667893171310425},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.12795960903167725},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn.2018.8489670","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2018.8489670","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W1523409240","https://openalex.org/W1523985187","https://openalex.org/W1540764732","https://openalex.org/W1839582124","https://openalex.org/W2032936552","https://openalex.org/W2046738186","https://openalex.org/W2049633694","https://openalex.org/W2068238590","https://openalex.org/W2074682976","https://openalex.org/W2085831769","https://openalex.org/W2112335378","https://openalex.org/W2138142480","https://openalex.org/W2150884987","https://openalex.org/W2155628440","https://openalex.org/W2163696743","https://openalex.org/W2286729967","https://openalex.org/W2324376776","https://openalex.org/W2460444101","https://openalex.org/W2552939581","https://openalex.org/W2730546798","https://openalex.org/W2734898258","https://openalex.org/W3101651037","https://openalex.org/W3101767848","https://openalex.org/W3102884061","https://openalex.org/W4248081355","https://openalex.org/W6631333301","https://openalex.org/W6741030580"],"related_works":["https://openalex.org/W2117229703","https://openalex.org/W3120756218","https://openalex.org/W2139276415","https://openalex.org/W2187599770","https://openalex.org/W2022712430","https://openalex.org/W3152506997","https://openalex.org/W4295727671","https://openalex.org/W2953178323","https://openalex.org/W1980034243","https://openalex.org/W2283037149"],"abstract_inverted_index":{"Mixture":[0],"of":[1,50,73,77,88,96,132,150,184,189,201],"experts":[2],"(MoE)":[3],"models":[4],"are":[5],"successful":[6],"neural-network":[7],"architectures":[8],"for":[9,79,107,140],"modeling":[10,95,144],"heterogeneous":[11,97,108,202],"data":[12,110],"in":[13,27,42,62,93,187,195,199],"many":[14],"machine":[15],"learning":[16,25],"problems":[17],"including":[18,99],"regression,":[19],"clustering":[20,200],"and":[21,56,59,81,111,164,172,198],"classification.":[22],"The":[23,86,153],"model":[24],"is":[26,40,91],"general":[28],"performed":[29],"by":[30],"maximum":[31,67],"likelihood":[32,68],"estimation":[33,69,116],"(MLE).":[34],"For":[35],"high-dimensional":[36,55,64,119],"data,":[37,98],"a":[38,63,74,113,123],"regularization":[39],"needed":[41],"order":[43],"to":[44,54,157],"avoid":[45],"possible":[46],"degeneracies":[47],"or":[48],"infeasibility":[49],"the":[51,71,94,105,133,142,151,181,185,191],"MLE":[52,139],"related":[53],"possibly":[57,118],"redundant":[58],"correlated":[60],"features":[61,78],"scenario.":[65],"Regularized":[66],"allows":[70,156],"selection":[72,90],"relevant":[75],"subset":[76],"prediction":[80],"thus":[82,174],"encourages":[83],"sparse":[84,160,193],"solutions.":[85],"problem":[87],"variable":[89],"challenging":[92],"with":[100,117],"MoE":[101,106],"models.":[102],"We":[103],"consider":[104],"regression":[109,203],"propose":[112],"regularized":[114,138],"maximum-likelihood":[115],"features,":[120],"based":[121],"on":[122],"dedicated":[124],"EM":[125],"algorithm":[126,155,186],"which":[127],"integrates":[128],"coordinate":[129,166],"ascent":[130,167],"updates":[131,168],"parameters.":[134],"Unlike":[135],"state-of-the":[136],"art":[137],"MoE,":[141],"proposed":[143,154],"does":[145],"not":[146],"require":[147],"an":[148],"approximate":[149],"regularization.":[152],"automatically":[158],"obtaining":[159],"solutions":[161],"without":[162],"thresholding,":[163],"includes":[165],"avoiding":[169],"matrix":[170],"inversion,":[171],"can":[173],"be":[175],"scalable.":[176],"An":[177],"experimental":[178],"study":[179],"shows":[180],"good":[182],"performance":[183],"terms":[188],"recovering":[190],"actual":[192],"solutions,":[194],"parameter":[196],"estimation,":[197],"data.":[204]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
