{"id":"https://openalex.org/W7155187000","doi":"https://doi.org/10.48550/arxiv.2604.19337","title":"POLAR-PIC: A Holistic Framework for Matrixized PIC with Co-Designed Compute, Layout, and Communication","display_name":"POLAR-PIC: A Holistic Framework for Matrixized PIC with Co-Designed Compute, Layout, and Communication","publication_year":2026,"publication_date":"2026-04-21","ids":{"openalex":"https://openalex.org/W7155187000","doi":"https://doi.org/10.48550/arxiv.2604.19337"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.19337","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19337","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.19337","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134312763","display_name":"Yizhuo Rao","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Rao, Yizhuo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134300910","display_name":"Xingjian Cui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cui, Xingjian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123015569","display_name":"Shangzhi Pang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pang, Shangzhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134354828","display_name":"Jiabin Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xie, Jiabin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134277422","display_name":"Guangnan Feng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Feng, Guangnan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079342260","display_name":"Jinhui Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Jinhui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100658079","display_name":"Ziyan Zhang","orcid":"https://orcid.org/0000-0002-2983-9729"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Ziyan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076579589","display_name":"Languang Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Languang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134314083","display_name":"Zhenyu Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zhenyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134347602","display_name":"Zhiguang Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Zhiguang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5101633465","display_name":"Yutong Lu","orcid":"https://orcid.org/0000-0001-5315-3375"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Yutong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5134312763"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10384","display_name":"Laser-Plasma Interactions and Diagnostics","score":0.5658000111579895,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10384","display_name":"Laser-Plasma Interactions and Diagnostics","score":0.5658000111579895,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10346","display_name":"Magnetic confinement fusion research","score":0.27489998936653137,"subfield":{"id":"https://openalex.org/subfields/3106","display_name":"Nuclear and High Energy Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10781","display_name":"Plasma Diagnostics and Applications","score":0.020999999716877937,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/asynchronous-communication","display_name":"Asynchronous communication","score":0.6904000043869019},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6626999974250793},{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.5462999939918518},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4514000117778778},{"id":"https://openalex.org/keywords/locality","display_name":"Locality","score":0.43050000071525574},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.4284000098705292},{"id":"https://openalex.org/keywords/interpolation","display_name":"Interpolation (computer graphics)","score":0.34549999237060547},{"id":"https://openalex.org/keywords/efficient-energy-use","display_name":"Efficient energy use","score":0.3172000050544739}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7325000166893005},{"id":"https://openalex.org/C151319957","wikidata":"https://www.wikidata.org/wiki/Q752739","display_name":"Asynchronous communication","level":2,"score":0.6904000043869019},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6626999974250793},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.6114000082015991},{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.5462999939918518},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.4934999942779541},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4514000117778778},{"id":"https://openalex.org/C2779808786","wikidata":"https://www.wikidata.org/wiki/Q6664603","display_name":"Locality","level":2,"score":0.43050000071525574},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.4284000098705292},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.38659998774528503},{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.34549999237060547},{"id":"https://openalex.org/C2742236","wikidata":"https://www.wikidata.org/wiki/Q924713","display_name":"Efficient energy use","level":2,"score":0.3172000050544739},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3111000061035156},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.3077000081539154},{"id":"https://openalex.org/C2778692605","wikidata":"https://www.wikidata.org/wiki/Q4041866","display_name":"Joins","level":2,"score":0.3057999908924103},{"id":"https://openalex.org/C63000827","wikidata":"https://www.wikidata.org/wiki/Q3080428","display_name":"Software portability","level":2,"score":0.3034999966621399},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.30140000581741333},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.29600000381469727},{"id":"https://openalex.org/C74080474","wikidata":"https://www.wikidata.org/wiki/Q7305975","display_name":"Redistribution (election)","level":3,"score":0.2809999883174896},{"id":"https://openalex.org/C130795937","wikidata":"https://www.wikidata.org/wiki/Q2561570","display_name":"Remote direct memory access","level":2,"score":0.2743000090122223},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.2524000108242035},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.2515000104904175}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.19337","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19337","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.19337","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19337","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Particle-in-Cell":[0],"(PIC)":[1],"simulations":[2,73],"are":[3,158],"fundamental":[4],"to":[5,15,91,102,126,139],"plasma":[6,130],"physics":[7],"but":[8],"often":[9],"suffer":[10],"from":[11],"limited":[12],"scalability":[13,198],"due":[14],"particle-grid":[16,25],"interaction":[17,26],"bottlenecks":[18],"and":[19,47,95,131,156,160,163],"particle":[20,41,89,98],"redistribution":[21,50,104],"costs.":[22],"Specifically,":[23],"the":[24,34,40,48,109,120,140,151,164,184,197,218],"computations":[27],"have":[28],"not":[29],"taken":[30],"full":[31],"advantage":[32],"of":[33,112,179,220],"emerging":[35],"Matrix":[36],"Processing":[37],"Units":[38],"(MPUs),":[39],"motion":[42],"introduces":[43],"irregular":[44],"memory":[45,93],"accesses,":[46],"bulk-synchronous":[49],"further":[51],"destroys":[52],"long-term":[53],"data":[54],"locality":[55],"thereby":[56],"limiting":[57],"parallel":[58],"efficiency.":[59],"To":[60],"address":[61],"these":[62],"inefficiencies,":[63],"we":[64],"present":[65],"POLAR-PIC,":[66],"a":[67,86,169],"co-designed":[68],"framework":[69],"for":[70,223],"large-scale":[71],"PIC":[72],"that":[74,117,150,201],"(i)":[75],"reformulates":[76],"Field":[77],"Interpolation":[78,155],"into":[79],"an":[80,113],"MPU-friendly":[81],"outer-product":[82],"form,":[83],"(ii)":[84],"maintains":[85,203],"physically":[87],"ordered":[88],"layout":[90],"preserve":[92],"contiguity,":[94],"(iii)":[96],"overlaps":[97],"communication":[99,166],"with":[100],"Deposition":[101,157],"hide":[103],"overhead.":[105],"The":[106],"evaluation":[107,199],"on":[108,145,183,192,208],"pilot":[110],"system":[111],"Exascale":[114],"supercomputer":[115],"demonstrates":[116,200],"POLAR-PIC":[118,176,202],"accelerates":[119],"entire":[121],"particle-processing":[122],"phase":[123],"by":[124,154],"up":[125],"10.9x":[127],"in":[128,133],"uniform":[129],"4.4x":[132],"real-world":[134],"laser-ion":[135],"acceleration":[136],"scenarios":[137],"compared":[138],"native":[141],"WarpX":[142,189],"reference":[143],"pipeline":[144],"LX2.":[146],"Ablation":[147],"studies":[148],"reveal":[149],"speedups":[152],"achieved":[153],"8.0x":[159],"13.2x,":[161],"respectively,":[162],"asynchronous":[165],"design":[167],"sustains":[168],"99.1%":[170],"overlap":[171],"ratio.":[172],"In":[173],"cross-platform":[174],"comparisons,":[175],"achieves":[177],"13.2%":[178],"theoretical":[180],"peak":[181],"efficiency":[182,207],"CPU-based":[185],"LS":[186],"system,":[187],"while":[188],"reaches":[190],"9.6%":[191],"NVIDIA":[193],"A800":[194],"GPUs.":[195],"Notably,":[196],"67.5%":[204],"weak":[205],"scaling":[206],"over":[209],"2":[210],"million":[211],"cores":[212],"under":[213],"high-migration":[214],"dynamic":[215],"workloads,":[216],"highlighting":[217],"importance":[219],"holistic":[221],"co-design":[222],"future":[224],"matrix-centric":[225],"HPC":[226],"systems.":[227]},"counts_by_year":[],"updated_date":"2026-04-23T06:20:18.424754","created_date":"2026-04-23T00:00:00"}
