{"id":"https://openalex.org/W7146965903","doi":"https://doi.org/10.1109/cnml68938.2026.11452489","title":"GPU-Accelerated Homomorphic Encryption with Optimized Performance","display_name":"GPU-Accelerated Homomorphic Encryption with Optimized Performance","publication_year":2026,"publication_date":"2026-01-30","ids":{"openalex":"https://openalex.org/W7146965903","doi":"https://doi.org/10.1109/cnml68938.2026.11452489"},"language":null,"primary_location":{"id":"doi:10.1109/cnml68938.2026.11452489","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cnml68938.2026.11452489","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 International Conference on Communication Networks and Machine Learning (CNML)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132597000","display_name":"Jing Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I5343935","display_name":"Guilin University of Electronic Technology","ror":"https://ror.org/05arjae42","country_code":"CN","type":"education","lineage":["https://openalex.org/I5343935"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jing Wang","raw_affiliation_strings":["Guilin University of Electronic Technology,Computer Science and Information Security,Guilin,China"],"affiliations":[{"raw_affiliation_string":"Guilin University of Electronic Technology,Computer Science and Information Security,Guilin,China","institution_ids":["https://openalex.org/I5343935"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021665931","display_name":"Zecheng Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I5343935","display_name":"Guilin University of Electronic Technology","ror":"https://ror.org/05arjae42","country_code":"CN","type":"education","lineage":["https://openalex.org/I5343935"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zecheng Lu","raw_affiliation_strings":["Guilin University of Electronic Technology,Computer Science and Information Security,Guilin,China"],"affiliations":[{"raw_affiliation_string":"Guilin University of Electronic Technology,Computer Science and Information Security,Guilin,China","institution_ids":["https://openalex.org/I5343935"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5132597000"],"corresponding_institution_ids":["https://openalex.org/I5343935"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.9301534,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"411","last_page":"414"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10237","display_name":"Cryptography and Data Security","score":0.8848999738693237,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10237","display_name":"Cryptography and Data Security","score":0.8848999738693237,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11693","display_name":"Cryptography and Residue Arithmetic","score":0.07769999653100967,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10951","display_name":"Cryptographic Implementations and Security","score":0.007199999876320362,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/homomorphic-encryption","display_name":"Homomorphic encryption","score":0.7110999822616577},{"id":"https://openalex.org/keywords/correctness","display_name":"Correctness","score":0.6309000253677368},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.5995000004768372},{"id":"https://openalex.org/keywords/encryption","display_name":"Encryption","score":0.5885999798774719},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.44940000772476196},{"id":"https://openalex.org/keywords/cryptography","display_name":"Cryptography","score":0.44290000200271606},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.42899999022483826},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.3799999952316284}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8518999814987183},{"id":"https://openalex.org/C158338273","wikidata":"https://www.wikidata.org/wiki/Q2154943","display_name":"Homomorphic encryption","level":3,"score":0.7110999822616577},{"id":"https://openalex.org/C55439883","wikidata":"https://www.wikidata.org/wiki/Q360812","display_name":"Correctness","level":2,"score":0.6309000253677368},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.5995000004768372},{"id":"https://openalex.org/C148730421","wikidata":"https://www.wikidata.org/wiki/Q141090","display_name":"Encryption","level":2,"score":0.5885999798774719},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5134000182151794},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.44940000772476196},{"id":"https://openalex.org/C178489894","wikidata":"https://www.wikidata.org/wiki/Q8789","display_name":"Cryptography","level":2,"score":0.44290000200271606},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.42899999022483826},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.39169999957084656},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.3799999952316284},{"id":"https://openalex.org/C2780595030","wikidata":"https://www.wikidata.org/wiki/Q3860309","display_name":"Multiplication (music)","level":2,"score":0.3691999912261963},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.36800000071525574},{"id":"https://openalex.org/C311688","wikidata":"https://www.wikidata.org/wiki/Q2393193","display_name":"Time complexity","level":2,"score":0.34459999203681946},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.32199999690055847},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.3041999936103821},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.30070000886917114},{"id":"https://openalex.org/C90119067","wikidata":"https://www.wikidata.org/wiki/Q43260","display_name":"Polynomial","level":2,"score":0.29420000314712524},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.29159998893737793},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.27549999952316284},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.27309998869895935},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.272599995136261},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.25119999051094055}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cnml68938.2026.11452489","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cnml68938.2026.11452489","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 International Conference on Communication Networks and Machine Learning (CNML)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W3048071914","https://openalex.org/W3048936228","https://openalex.org/W3108669911","https://openalex.org/W4312722125","https://openalex.org/W4392309219","https://openalex.org/W4400488260","https://openalex.org/W4407218945","https://openalex.org/W4409248416","https://openalex.org/W4411713636","https://openalex.org/W4413925532","https://openalex.org/W7103751830"],"related_works":[],"abstract_inverted_index":{"Fully":[0],"Homomorphic":[1],"Encryption":[2],"(FHE)":[3],"enables":[4],"arbitrary":[5],"computations":[6],"on":[7,58,154],"encrypted":[8,183],"data,":[9],"thereby":[10],"protecting":[11],"data":[12,107],"privacy":[13],"throughout":[14],"the":[15,19,46,59,125,128,152,178],"entire":[16],"processing.":[17],"However,":[18],"practical":[20],"deployment":[21],"of":[22,49,127,182],"FHE":[23,51],"is":[24],"severely":[25],"limited":[26],"by":[27],"its":[28,77],"high":[29],"computational":[30,110],"overhead,":[31],"especially":[32],"for":[33,69,137],"operations":[34,74,142],"such":[35],"as":[36],"polynomial":[37,70],"multiplication":[38,71],"and":[39,63,72,97,109,115,139,143,180],"Number-Theoretic":[40],"Transform":[41],"(NTT),":[42],"which":[43],"usually":[44],"become":[45],"performance":[47],"bottleneck":[48],"most":[50],"schemes.":[52],"In":[53,130],"this":[54],"paper,":[55],"we":[56,118,132],"focus":[57],"Brakerski/Fan-Vercauteren":[60],"(BFV)":[61],"scheme":[62],"propose":[64],"a":[65,82,87],"GPU-based":[66],"optimization":[67],"framework":[68,153],"NTT":[73,141],"to":[75,92,112,146],"accelerate":[76],"computations.":[78,184],"Our":[79],"approach":[80],"combines":[81],"pipelined":[83],"scheduling":[84],"strategy":[85],"with":[86,166],"producer-consumer":[88],"memory":[89],"management":[90],"model":[91],"maximize":[93],"GPU":[94,113],"resource":[95],"utilization":[96],"reduce":[98],"idle":[99],"time":[100],"between":[101],"computation":[102],"stages.":[103],"By":[104],"accurately":[105],"mapping":[106],"dependencies":[108],"tasks":[111],"threads":[114],"thread":[116],"blocks,":[117],"achieve":[119],"efficient":[120],"parallel":[121],"execution":[122],"while":[123,176],"ensuring":[124],"correctness":[126,181],"results.":[129],"addition,":[131],"integrate":[133],"optimized":[134,170],"kernel":[135],"implementations":[136],"forward":[138],"inverse":[140],"other":[144],"techniques":[145],"further":[147],"improve":[148],"efficiency.":[149],"We":[150],"evaluate":[151],"an":[155],"NVIDIA":[156],"RTX":[157],"4060":[158],"GPU.":[159],"The":[160],"experimental":[161],"results":[162],"show":[163],"that,":[164],"compared":[165],"traditional":[167],"implementations,":[168],"our":[169],"implementation":[171],"significantly":[172],"reduces":[173],"system":[174],"latency":[175],"maintaining":[177],"integrity":[179]},"counts_by_year":[],"updated_date":"2026-04-02T13:53:19.096889","created_date":"2026-04-02T00:00:00"}
