{"id":"https://openalex.org/W7128644212","doi":"https://doi.org/10.48550/arxiv.2602.09386","title":"SMES: Towards Scalable Multi-Task Recommendation via Expert Sparsity","display_name":"SMES: Towards Scalable Multi-Task Recommendation via Expert Sparsity","publication_year":2026,"publication_date":"2026-02-10","ids":{"openalex":"https://openalex.org/W7128644212","doi":"https://doi.org/10.48550/arxiv.2602.09386"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2602.09386","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.09386","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2602.09386","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125680273","display_name":"Yukun Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Yukun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125668023","display_name":"Si Dong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dong, Si","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125625044","display_name":"Xu Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Xu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125646369","display_name":"Bo Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Bo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125635152","display_name":"Qinglin Jia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jia, Qinglin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100408109","display_name":"Bo Wang","orcid":"https://orcid.org/0000-0002-5596-1795"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Shengzhe","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123554145","display_name":"Jinlong Jiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiao, Jinlong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125655014","display_name":"Runhan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Runhan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125624808","display_name":"Jiaqing Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Jiaqing","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074529126","display_name":"Chaoyi Ma","orcid":"https://orcid.org/0000-0002-3572-0046"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Chaoyi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125671739","display_name":"Ruiming Tang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tang, Ruiming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125646962","display_name":"Guorui Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Guorui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125662535","display_name":"Han Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Han","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125661873","display_name":"Kun Gai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gai, Kun","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":14,"corresponding_author_ids":["https://openalex.org/A5125680273"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.5692999958992004,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.5692999958992004,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.06759999692440033,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.03840000182390213,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7915999889373779},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.7506999969482422},{"id":"https://openalex.org/keywords/skew","display_name":"Skew","score":0.7204999923706055},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.7064999938011169},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.5230000019073486},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.4803999960422516},{"id":"https://openalex.org/keywords/expert-system","display_name":"Expert system","score":0.47999998927116394}],"concepts":[{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7915999889373779},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7562999725341797},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.7506999969482422},{"id":"https://openalex.org/C43711488","wikidata":"https://www.wikidata.org/wiki/Q7534783","display_name":"Skew","level":2,"score":0.7204999923706055},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.7064999938011169},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5322999954223633},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.5230000019073486},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48410001397132874},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.4803999960422516},{"id":"https://openalex.org/C58328972","wikidata":"https://www.wikidata.org/wiki/Q184609","display_name":"Expert system","level":2,"score":0.47999998927116394},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.46880000829696655},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4620000123977661},{"id":"https://openalex.org/C105002631","wikidata":"https://www.wikidata.org/wiki/Q4833645","display_name":"Subject-matter expert","level":3,"score":0.37400001287460327},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33009999990463257},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.31119999289512634},{"id":"https://openalex.org/C102600418","wikidata":"https://www.wikidata.org/wiki/Q6517507","display_name":"Legal expert system","level":3,"score":0.3025999963283539},{"id":"https://openalex.org/C72161134","wikidata":"https://www.wikidata.org/wiki/Q5421219","display_name":"Expert elicitation","level":2,"score":0.2831000089645386},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.26660001277923584}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2602.09386","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.09386","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2602.09386","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.09386","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Industry, innovation and infrastructure","id":"https://metadata.un.org/sdg/9","score":0.5429438352584839}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Industrial":[0],"recommender":[1],"systems":[2],"typically":[3],"rely":[4],"on":[5],"multi-task":[6,69,94],"learning":[7],"to":[8,93],"estimate":[9],"diverse":[10],"user":[11,206],"feedback":[12],"signals":[13],"and":[14,40,58,83,103,141,201],"aggregate":[15],"them":[16],"for":[17,45,67],"ranking.":[18],"Recent":[19],"advances":[20],"in":[21,28,178,205],"model":[22,33],"scaling":[23,57,81],"have":[24],"shown":[25],"promising":[26],"gains":[27],"recommendation.":[29,70],"However,":[30],"naively":[31],"increasing":[32],"capacity":[34,61],"imposes":[35],"prohibitive":[36],"online":[37,191],"inference":[38],"costs":[39],"often":[41],"yields":[42],"diminishing":[43],"returns":[44],"sparse":[46,90,121],"tasks":[47,140],"with":[48,124,196],"skewed":[49],"label":[50],"distributions.":[51],"This":[52],"mismatch":[53],"between":[54],"uniform":[55],"parameter":[56,76],"heterogeneous":[59],"task":[60],"demands":[62],"poses":[63],"a":[64,79,119,133,158,202],"fundamental":[65],"challenge":[66],"scalable":[68,120],"In":[71,154],"this":[72],"work,":[73],"we":[74,116],"investigate":[75],"sparsification":[77],"as":[78],"principled":[80],"paradigm":[82],"identify":[84],"two":[85],"critical":[86],"obstacles":[87],"when":[88],"applying":[89],"Mixture-of-Experts":[91],"(MoE)":[92],"recommendation:":[95],"exploded":[96],"expert":[97,104,126,130,135,148,169],"activation":[98,131],"that":[99,163],"undermines":[100],"instance-level":[101],"sparsity":[102],"load":[105],"skew":[106],"caused":[107],"by":[108,166],"independent":[109],"task-wise":[110],"routing.":[111,127],"To":[112],"address":[113],"these":[114],"challenges,":[115],"propose":[117],"SMES,":[118],"MoE":[122],"framework":[123],"progressive":[125],"SMES":[128,156,174],"decomposes":[129],"into":[132],"task-shared":[134],"subset":[136],"jointly":[137],"selected":[138],"across":[139,171],"task-adaptive":[142],"private":[143],"experts,":[144],"explicitly":[145],"bounding":[146],"per-instance":[147],"execution":[149],"while":[150],"preserving":[151],"task-specific":[152],"capacity.":[153],"addition,":[155],"introduces":[157],"global":[159],"multi-gate":[160],"load-balancing":[161],"regularizer":[162],"stabilizes":[164],"training":[165],"regulating":[167],"aggregated":[168],"utilization":[170],"all":[172],"tasks.":[173],"has":[175],"been":[176],"deployed":[177],"Kuaishou":[179],"large-scale":[180],"short-video":[181],"services,":[182],"supporting":[183],"over":[184],"400":[185],"million":[186],"daily":[187],"active":[188],"users.":[189],"Extensive":[190],"experiments":[192],"demonstrate":[193],"stable":[194],"improvements,":[195],"GAUC":[197],"gain":[198],"of":[199],"0.29%":[200],"0.31%":[203],"uplift":[204],"watch":[207],"time.":[208]},"counts_by_year":[],"updated_date":"2026-02-12T06:17:30.163165","created_date":"2026-02-12T00:00:00"}
