{"id":"https://openalex.org/W4414198827","doi":"https://doi.org/10.1109/dac63849.2025.11132792","title":"Local-GS: An Order-Independent Gaussian Splatting Training Accelerator Exploiting Splat Locality","display_name":"Local-GS: An Order-Independent Gaussian Splatting Training Accelerator Exploiting Splat Locality","publication_year":2025,"publication_date":"2025-06-22","ids":{"openalex":"https://openalex.org/W4414198827","doi":"https://doi.org/10.1109/dac63849.2025.11132792"},"language":"en","primary_location":{"id":"doi:10.1109/dac63849.2025.11132792","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dac63849.2025.11132792","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 62nd ACM/IEEE Design Automation Conference (DAC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102002226","display_name":"Yiyang Sun","orcid":"https://orcid.org/0009-0003-8453-3436"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yiyang Sun","raw_affiliation_strings":["Peking University,School of Integrated Circuits,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Integrated Circuits,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114554075","display_name":"Qinzhe Zhi","orcid":"https://orcid.org/0009-0001-4866-7213"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qinzhe Zhi","raw_affiliation_strings":["Peking University,School of Integrated Circuits,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Integrated Circuits,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114069394","display_name":"Yiqi Jing","orcid":"https://orcid.org/0009-0004-7690-5356"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yiqi Jing","raw_affiliation_strings":["Peking University,School of Integrated Circuits,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Integrated Circuits,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003039083","display_name":"Le Ye","orcid":"https://orcid.org/0000-0003-0599-7762"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Le Ye","raw_affiliation_strings":["Peking University,School of Integrated Circuits,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Integrated Circuits,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050500375","display_name":"Ru Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ru Huang","raw_affiliation_strings":["Peking University,School of Integrated Circuits,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Integrated Circuits,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088551028","display_name":"Tianyu Jia","orcid":"https://orcid.org/0000-0002-4570-4613"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianyu Jia","raw_affiliation_strings":["Peking University,School of Integrated Circuits,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Peking University,School of Integrated Circuits,Beijing,China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5102002226"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.10822495,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11044","display_name":"Particle Detector Development and Performance","score":0.817799985408783,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11044","display_name":"Particle Detector Development and Performance","score":0.817799985408783,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11216","display_name":"Radiation Detection and Scintillator Technologies","score":0.7957000136375427,"subfield":{"id":"https://openalex.org/subfields/3108","display_name":"Radiation"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.7922000288963318,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.6912999749183655},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.5788999795913696},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.43939998745918274},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.41100001335144043},{"id":"https://openalex.org/keywords/speedup","display_name":"Speedup","score":0.3939000070095062},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.3531000018119812},{"id":"https://openalex.org/keywords/thread","display_name":"Thread (computing)","score":0.35199999809265137},{"id":"https://openalex.org/keywords/3d-rendering","display_name":"3D rendering","score":0.304500013589859}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8654000163078308},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.6912999749183655},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.5788999795913696},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.5266000032424927},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.43939998745918274},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.41100001335144043},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.3939000070095062},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3677000105381012},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.3531000018119812},{"id":"https://openalex.org/C138101251","wikidata":"https://www.wikidata.org/wiki/Q213092","display_name":"Thread (computing)","level":2,"score":0.35199999809265137},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.33880001306533813},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.32989999651908875},{"id":"https://openalex.org/C36816356","wikidata":"https://www.wikidata.org/wiki/Q16911860","display_name":"3D rendering","level":3,"score":0.304500013589859},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.30399999022483826},{"id":"https://openalex.org/C2778090530","wikidata":"https://www.wikidata.org/wiki/Q2523931","display_name":"Viewport","level":2,"score":0.29350000619888306},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.2786000072956085},{"id":"https://openalex.org/C116921373","wikidata":"https://www.wikidata.org/wiki/Q2816483","display_name":"Real-time rendering","level":3,"score":0.2784000039100647},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.2712000012397766},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.26980000734329224},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C18766215","wikidata":"https://www.wikidata.org/wiki/Q7708532","display_name":"Texture memory","level":5,"score":0.25920000672340393},{"id":"https://openalex.org/C544400634","wikidata":"https://www.wikidata.org/wiki/Q188695","display_name":"DirectX","level":2,"score":0.2590999901294708}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dac63849.2025.11132792","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dac63849.2025.11132792","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 62nd ACM/IEEE Design Automation Conference (DAC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W2346205343","https://openalex.org/W2471962767","https://openalex.org/W2901982540","https://openalex.org/W2963627347","https://openalex.org/W2979447669","https://openalex.org/W3215769467","https://openalex.org/W4200150166","https://openalex.org/W4385318467","https://openalex.org/W4386231251","https://openalex.org/W4386755312","https://openalex.org/W4395106423","https://openalex.org/W4402754225","https://openalex.org/W4404954627","https://openalex.org/W4409334625"],"related_works":[],"abstract_inverted_index":{"3D":[0,10,69,138],"Gaussian":[1,16,70,101],"Splatting":[2,17,71],"has":[3,18],"emerged":[4],"as":[5],"the":[6,43,55,79],"SOTA":[7],"approach":[8],"for":[9],"representation":[11],"and":[12,22,54,58,104,122,132,152],"view":[13],"synthesis.":[14],"While":[15],"demonstrated":[19],"impressive":[20],"capability":[21],"rendering":[23,76,121],"quality":[24],"on":[25,31,100],"desktop":[26],"GPUs,":[27],"achieving":[28],"on-demand":[29],"training":[30,44,72,150],"resource-constrained":[32],"edge":[33,142],"devices":[34],"is":[35,127,133],"still":[36],"challenging.":[37],"In":[38],"this":[39],"work,":[40],"we":[41,65],"identified":[42],"bottleneck":[45],"from":[46],"a":[47,68,89],"few":[48],"perspectives":[49],"including":[50],"algorithm":[51],"splat":[52,102],"locality":[53,103],"limited":[56],"memory":[57],"hardware":[59,106],"under-utilization.":[60],"To":[61],"address":[62],"these":[63],"problems,":[64],"present":[66],"Local-GS,":[67],"accelerator":[73],"with":[74],"order-independent":[75],"to":[77,95,116,141],"break":[78],"depth-wise":[80],"data":[81],"dependency":[82],"between":[83],"overlapping":[84],"Gaussians.":[85],"We":[86],"further":[87],"incorporate":[88],"parallel":[90,120],"pixel":[91],"intersection":[92],"test":[93],"unit":[94],"schedule":[96],"thread":[97],"workload":[98],"based":[99],"improve":[105],"utilization.":[107],"A":[108],"set":[109],"of":[110,155],"unified":[111],"training-rendering":[112],"cores":[113],"are":[114],"designed":[115],"achieve":[117,147],"efficient":[118],"splat-level":[119],"gradient":[123],"propagation.":[124],"Our":[125],"Local-GS":[126,146],"implemented":[128],"in":[129],"7":[130],"nm":[131],"evaluated":[134],"by":[135],"several":[136],"real-world":[137],"scenes.":[139],"Compared":[140],"Jetson":[143],"NX":[144],"GPU,":[145],"26.9-53":[148],"$\\times$":[149],"speedup":[151],"three":[153],"orders":[154],"magnitude":[156],"efficiency":[157],"boost.":[158]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
