{"id":"https://openalex.org/W4414034992","doi":"https://doi.org/10.1145/3705328.3748143","title":"Scaling Generative Recommendations with Context Parallelism on Hierarchical Sequential Transducers","display_name":"Scaling Generative Recommendations with Context Parallelism on Hierarchical Sequential Transducers","publication_year":2025,"publication_date":"2025-09-06","ids":{"openalex":"https://openalex.org/W4414034992","doi":"https://doi.org/10.1145/3705328.3748143"},"language":"en","primary_location":{"id":"doi:10.1145/3705328.3748143","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3705328.3748143","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3705328.3748143","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Nineteenth ACM Conference on Recommender Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3705328.3748143","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111730964","display_name":"Yan Dong","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yue Dong","raw_affiliation_strings":["Meta Platforms, Menlo Park, USA"],"raw_orcid":"https://orcid.org/0009-0007-8781-2384","affiliations":[{"raw_affiliation_string":"Meta Platforms, Menlo Park, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003924813","display_name":"Han Li","orcid":"https://orcid.org/0009-0009-4818-2759"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Han Li","raw_affiliation_strings":["Meta Platforms, Menlo Park, USA"],"raw_orcid":"https://orcid.org/0009-0009-4818-2759","affiliations":[{"raw_affiliation_string":"Meta Platforms, Menlo Park, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Shen Li","orcid":"https://orcid.org/0009-0005-8484-0166"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shen Li","raw_affiliation_strings":["Meta Platforms, Menlo Park, USA"],"raw_orcid":"https://orcid.org/0009-0005-8484-0166","affiliations":[{"raw_affiliation_string":"Meta Platforms, Menlo Park, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Nikhil Patel","orcid":"https://orcid.org/0000-0003-0369-5058"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nikhil Patel","raw_affiliation_strings":["Meta Platforms, Menlo Park, USA"],"raw_orcid":"https://orcid.org/0000-0003-0369-5058","affiliations":[{"raw_affiliation_string":"Meta Platforms, Menlo Park, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100381490","display_name":"Xing Liu","orcid":"https://orcid.org/0009-0005-0172-8698"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xing Liu","raw_affiliation_strings":["Meta Platforms, Menlo Park, USA"],"raw_orcid":"https://orcid.org/0009-0005-0172-8698","affiliations":[{"raw_affiliation_string":"Meta Platforms, Menlo Park, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032372272","display_name":"Xiaodong Wang","orcid":"https://orcid.org/0000-0001-5436-9952"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaodong Wang","raw_affiliation_strings":["Meta Platforms, Menlo Park, USA"],"raw_orcid":"https://orcid.org/0000-0001-5436-9952","affiliations":[{"raw_affiliation_string":"Meta Platforms, Menlo Park, USA","institution_ids":["https://openalex.org/I4210114444"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040614886","display_name":"Chuanhao Zhuge","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chuanhao Zhuge","raw_affiliation_strings":["Meta Platforms, Menlo Park, USA"],"raw_orcid":"https://orcid.org/0009-0009-3325-991X","affiliations":[{"raw_affiliation_string":"Meta Platforms, Menlo Park, USA","institution_ids":["https://openalex.org/I4210114444"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5111730964"],"corresponding_institution_ids":["https://openalex.org/I4210114444"],"apc_list":null,"apc_paid":null,"fwci":2.9051,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.92738692,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1058","last_page":"1061"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.965499997138977,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11478","display_name":"Caching and Content Delivery","score":0.9614999890327454,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/parallelism","display_name":"Parallelism (grammar)","score":0.8288289308547974},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7461010217666626},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.6952981948852539},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.61885666847229},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.6101964712142944},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.41521212458610535},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22213372588157654},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10499736666679382}],"concepts":[{"id":"https://openalex.org/C2781172179","wikidata":"https://www.wikidata.org/wiki/Q853109","display_name":"Parallelism (grammar)","level":2,"score":0.8288289308547974},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7461010217666626},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.6952981948852539},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.61885666847229},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.6101964712142944},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.41521212458610535},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22213372588157654},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10499736666679382},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3705328.3748143","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3705328.3748143","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3705328.3748143","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Nineteenth ACM Conference on Recommender Systems","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3705328.3748143","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3705328.3748143","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3705328.3748143","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Nineteenth ACM Conference on Recommender Systems","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4414034992.pdf","grobid_xml":"https://content.openalex.org/works/W4414034992.grobid-xml"},"referenced_works_count":2,"referenced_works":["https://openalex.org/W2984100107","https://openalex.org/W4296591817"],"related_works":["https://openalex.org/W2380075625","https://openalex.org/W2045183646","https://openalex.org/W2162409446","https://openalex.org/W2109463584","https://openalex.org/W141820298","https://openalex.org/W2504075107","https://openalex.org/W2049584446","https://openalex.org/W2079781215","https://openalex.org/W1595672120","https://openalex.org/W4230999561"],"abstract_inverted_index":{"Large-scale":[0],"recommendation":[1,45],"systems":[2],"are":[3],"pivotal":[4],"to":[5,24,63,80,121],"process":[6],"an":[7,36],"immense":[8],"volume":[9],"of":[10,18],"daily":[11],"user":[12,65,123,159],"interactions,":[13],"requiring":[14],"the":[15,52,99],"effective":[16],"modeling":[17,40],"high":[19,41],"cardinality":[20],"and":[21,58],"heterogeneous":[22],"features":[23],"ensure":[25],"accurate":[26],"predictions.In":[27],"prior":[28],"work,":[29,132],"we":[30,133],"introduced":[31],"Hierarchical":[32],"Sequential":[33],"Transducers":[34],"(HSTU),":[35],"attention-based":[37],"architecture":[38],"for":[39,141,147],"cardinality,":[42],"non-stationary":[43],"streaming":[44],"data,":[46],"providing":[47],"good":[48],"scaling":[49,72,148,167],"law":[50],"in":[51,157],"generative":[53],"recommender":[54],"framework":[55],"(GR).Recent":[56],"studies":[57],"experiments":[59],"demonstrate":[60],"that":[61,95],"attending":[62],"longer":[64],"history":[66],"sequences":[67],"yields":[68],"significant":[69],"metric":[70],"improvements.However,":[71],"sequence":[73,150,161],"length":[74],"is":[75,90],"activation-heavy,":[76],"necessitating":[77],"parallelism":[78,88,136],"solutions":[79],"effectively":[81,105],"shard":[82],"activation":[83],"memory.In":[84],"transformer-based":[85],"LLMs,":[86],"context":[87,135],"(CP)":[89],"a":[91,154,165],"commonly":[92],"used":[93],"technique":[94],"distributes":[96],"computation":[97],"along":[98],"sequence-length":[100],"dimension":[101],"across":[102],"multiple":[103],"GPUs,":[104],"reducing":[106],"memory":[107],"usage":[108],"from":[109],"attention":[110],"activations.In":[111],"contrast,":[112],"production":[113],"ranking":[114],"models":[115],"typically":[116],"utilize":[117],"jagged":[118,138],"input":[119],"tensors":[120],"represent":[122],"interaction":[124,160],"features,":[125],"introducing":[126],"unique":[127],"CP":[128],"implementation":[129],"challenges.In":[130],"this":[131],"introduce":[134],"with":[137,171],"tensor":[139],"support":[140],"HSTU":[142],"attention,":[143],"establishing":[144],"foundational":[145],"capabilities":[146],"up":[149],"dimensions.Our":[151],"approach":[152],"enables":[153],"5.3":[155],"increase":[156],"supported":[158],"length,":[162],"while":[163],"achieving":[164],"1.55":[166],"factor":[168],"when":[169],"combined":[170],"Distributed":[172],"Data":[173],"Parallelism":[174],"(DDP).":[175]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
