{"id":"https://openalex.org/W4415538063","doi":"https://doi.org/10.1145/3746027.3755317","title":"HGC-Avatar: Hierarchical Gaussian Compression for Streamable Dynamic 3D Avatars","display_name":"HGC-Avatar: Hierarchical Gaussian Compression for Streamable Dynamic 3D Avatars","publication_year":2025,"publication_date":"2025-10-25","ids":{"openalex":"https://openalex.org/W4415538063","doi":"https://doi.org/10.1145/3746027.3755317"},"language":null,"primary_location":{"id":"doi:10.1145/3746027.3755317","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3755317","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2510.16463","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Haocheng Tang","orcid":"https://orcid.org/0009-0002-5253-6547"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haocheng Tang","raw_affiliation_strings":["State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0002-5253-6547","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041324197","display_name":"Ruoke Yan","orcid":"https://orcid.org/0000-0003-4570-5402"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruoke Yan","raw_affiliation_strings":["State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-4570-5402","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xinhui Yin","orcid":"https://orcid.org/0009-0004-7148-162X"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinhui Yin","raw_affiliation_strings":["State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0004-7148-162X","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100360264","display_name":"Qi Zhang","orcid":"https://orcid.org/0000-0002-1189-8755"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Zhang","raw_affiliation_strings":["State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-1189-8755","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055937409","display_name":"Xinfeng Zhang","orcid":"https://orcid.org/0000-0002-7517-3868"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinfeng Zhang","raw_affiliation_strings":["School of Computer Science and Technology, University of the Chinese Academy of Sciences, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-7517-3868","affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of the Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039832462","display_name":"Siwei Ma","orcid":"https://orcid.org/0000-0002-2731-5403"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siwei Ma","raw_affiliation_strings":["State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-2731-5403","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101523804","display_name":"Wen Gao","orcid":"https://orcid.org/0000-0001-8894-1806"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wen Gao","raw_affiliation_strings":["State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-8894-1806","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Multimedia Information Processing, School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040292663","display_name":"Chuanmin Jia","orcid":"https://orcid.org/0000-0002-7418-6245"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chuanmin Jia","raw_affiliation_strings":["WICT, State Key Laboratory of Multimedia Information Processing, Peking University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-7418-6245","affiliations":[{"raw_affiliation_string":"WICT, State Key Laboratory of Multimedia Information Processing, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.49429015,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"8125","last_page":"8134"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10481","display_name":"Computer Graphics and Visualization Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1704","display_name":"Computer Graphics and Computer-Aided Design"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.691100001335144},{"id":"https://openalex.org/keywords/avatar","display_name":"Avatar","score":0.6100000143051147},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.5095999836921692},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.4147999882698059},{"id":"https://openalex.org/keywords/retargeting","display_name":"Retargeting","score":0.3928000032901764},{"id":"https://openalex.org/keywords/virtual-reality","display_name":"Virtual reality","score":0.374099999666214},{"id":"https://openalex.org/keywords/virtual-actor","display_name":"Virtual actor","score":0.3370000123977661},{"id":"https://openalex.org/keywords/motion-capture","display_name":"Motion capture","score":0.33079999685287476}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8360999822616577},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.691100001335144},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6233999729156494},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6155999898910522},{"id":"https://openalex.org/C2777365542","wikidata":"https://www.wikidata.org/wiki/Q83090","display_name":"Avatar","level":2,"score":0.6100000143051147},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.5095999836921692},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.4147999882698059},{"id":"https://openalex.org/C2780575108","wikidata":"https://www.wikidata.org/wiki/Q7316652","display_name":"Retargeting","level":2,"score":0.3928000032901764},{"id":"https://openalex.org/C194969405","wikidata":"https://www.wikidata.org/wiki/Q170519","display_name":"Virtual reality","level":2,"score":0.374099999666214},{"id":"https://openalex.org/C150303390","wikidata":"https://www.wikidata.org/wiki/Q1983852","display_name":"Virtual actor","level":3,"score":0.3370000123977661},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.33079999685287476},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.32510000467300415},{"id":"https://openalex.org/C195704467","wikidata":"https://www.wikidata.org/wiki/Q327968","display_name":"Facial expression","level":2,"score":0.32260000705718994},{"id":"https://openalex.org/C160086991","wikidata":"https://www.wikidata.org/wiki/Q5939193","display_name":"Human visual system model","level":3,"score":0.321399986743927},{"id":"https://openalex.org/C116921373","wikidata":"https://www.wikidata.org/wiki/Q2816483","display_name":"Real-time rendering","level":3,"score":0.32100000977516174},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.31779998540878296},{"id":"https://openalex.org/C83248878","wikidata":"https://www.wikidata.org/wiki/Q344000","display_name":"Active appearance model","level":3,"score":0.3122999966144562},{"id":"https://openalex.org/C44185422","wikidata":"https://www.wikidata.org/wiki/Q6002064","display_name":"Image-based modeling and rendering","level":3,"score":0.3093999922275543},{"id":"https://openalex.org/C138591656","wikidata":"https://www.wikidata.org/wiki/Q5157538","display_name":"Computer facial animation","level":4,"score":0.2896000146865845},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.28060001134872437},{"id":"https://openalex.org/C36816356","wikidata":"https://www.wikidata.org/wiki/Q16911860","display_name":"3D rendering","level":3,"score":0.2799000144004822},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.2757999897003174},{"id":"https://openalex.org/C144986985","wikidata":"https://www.wikidata.org/wiki/Q871236","display_name":"Hierarchical database model","level":2,"score":0.2614000141620636},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.2533999979496002}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3746027.3755317","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3755317","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2510.16463","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.16463","pdf_url":"https://arxiv.org/pdf/2510.16463","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2510.16463","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.16463","pdf_url":"https://arxiv.org/pdf/2510.16463","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1987648924","https://openalex.org/W2027461913","https://openalex.org/W2962785568","https://openalex.org/W3153220274","https://openalex.org/W3176327543","https://openalex.org/W3202804820","https://openalex.org/W4200150166","https://openalex.org/W4312891300","https://openalex.org/W4367622621","https://openalex.org/W4376311815","https://openalex.org/W4385318467","https://openalex.org/W4385527434","https://openalex.org/W4386075797","https://openalex.org/W4386160522","https://openalex.org/W4392024621","https://openalex.org/W4402704624","https://openalex.org/W4402716022","https://openalex.org/W4402716359","https://openalex.org/W4402716405","https://openalex.org/W4402716437","https://openalex.org/W4402727211","https://openalex.org/W4402733569","https://openalex.org/W4403780676","https://openalex.org/W4404525293","https://openalex.org/W4404525447","https://openalex.org/W4404624588"],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,19,23,46,61,187],"3D":[3,14,63,179],"Gaussian":[4,72,89],"Splatting":[5],"(3DGS)":[6],"have":[7],"enabled":[8],"fast,":[9],"photorealistic":[10],"rendering":[11,81,131],"of":[12,42,82],"dynamic":[13,83],"scenes,":[15],"showing":[16],"strong":[17],"potential":[18],"immersive":[20],"communication.":[21],"However,":[22],"digital":[24],"human":[25,43],"encoding":[26],"and":[27,50,79,104,119,129,162,191],"transmission,":[28],"the":[29,40,54,88,110],"compression":[30,192],"methods":[31,186],"based":[32],"on":[33],"general":[34],"3DGS":[35],"representations":[36],"are":[37,144],"limited":[38],"by":[39],"lack":[41],"priors,":[44],"resulting":[45],"suboptimal":[47],"bitrate":[48],"efficiency":[49],"reconstruction":[51],"quality":[52,190],"at":[53],"decoder":[55],"side,":[56],"which":[57,95,108],"hinders":[58],"their":[59],"application":[60],"streamable":[62,175],"avatar":[64,180],"systems.":[65],"We":[66],"propose":[67],"HGC-Avatar,":[68],"a":[69,92,101,105,152,174],"novel":[70],"Hierarchical":[71],"Compression":[73],"framework":[74],"designed":[75],"for":[76,177],"efficient":[77],"transmission":[78],"high-quality":[80],"avatars.":[84],"Our":[85],"method":[86],"disentangles":[87],"representation":[90],"into":[91],"structural":[93],"layer,":[94,107],"maps":[96],"poses":[97],"to":[98,113,159],"Gaussians":[99],"via":[100],"StyleUNet-based":[102],"generator,":[103],"motion":[106],"leverages":[109],"SMPL-X":[111],"model":[112],"represent":[114],"temporal":[115],"pose":[116,134],"variations":[117],"compactly":[118],"semantically.":[120],"This":[121],"hierarchical":[122],"design":[123],"supports":[124],"layer-wise":[125],"compression,":[126],"progressive":[127],"decoding,":[128],"controllable":[130],"from":[132],"diverse":[133],"inputs":[135],"such":[136],"as":[137],"video":[138],"sequences":[139],"or":[140],"text.":[141],"Since":[142],"people":[143],"most":[145],"concerned":[146],"with":[147],"facial":[148,153],"realism,":[149],"we":[150],"incorporate":[151],"attention":[154],"mechanism":[155],"during":[156],"StyleUNet":[157],"training":[158],"preserve":[160],"identity":[161],"expression":[163],"details":[164],"under":[165],"low-bitrate":[166],"constraints.":[167],"Experimental":[168],"results":[169],"demonstrate":[170],"that":[171],"HGC-Avatar":[172],"provides":[173],"solution":[176],"rapid":[178],"rendering,":[181],"while":[182],"significantly":[183],"outperforming":[184],"prior":[185],"both":[188],"visual":[189],"efficiency.":[193]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-25T00:00:00"}
