{"id":"https://openalex.org/W7154214557","doi":"https://doi.org/10.48550/arxiv.2604.11659","title":"GPU Acceleration of Sparse Fully Homomorphic Encrypted DNNs","display_name":"GPU Acceleration of Sparse Fully Homomorphic Encrypted DNNs","publication_year":2026,"publication_date":"2026-04-13","ids":{"openalex":"https://openalex.org/W7154214557","doi":"https://doi.org/10.48550/arxiv.2604.11659"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.11659","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.11659","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.11659","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5116867492","display_name":"Lara D'Agata","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"D'Agata, Lara","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119217842","display_name":"Carlos Agull\u00f3-Domingo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Agull\u00f3-Domingo, Carlos","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119217843","display_name":"\u00d3scar Vera-L\u00f3pez","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vera-L\u00f3pez, \u00d3scar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087616265","display_name":"Kaustubh Shivdikar","orcid":"https://orcid.org/0000-0002-4449-7974"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shivdikar, Kaustubh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134864293","display_name":"Ardhi W. B. Yudha","orcid":"https://orcid.org/0000-0002-1946-0555"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yudha, Ardhi W. B.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133559547","display_name":"Ferhat Yaman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yaman, Ferhat","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133574686","display_name":"David Kaeli","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kaeli, David","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133594463","display_name":"Jos\u00e9 L. Abell\u00e1n","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abell\u00e1n, Jos\u00e9 L.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072053383","display_name":"Ian Colbert","orcid":"https://orcid.org/0000-0002-1669-5519"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Colbert, Ian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133567628","display_name":"Jos\u00e9 Cano","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cano, Jos\u00e9","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10237","display_name":"Cryptography and Data Security","score":0.8920999765396118,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10237","display_name":"Cryptography and Data Security","score":0.8920999765396118,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11693","display_name":"Cryptography and Residue Arithmetic","score":0.06260000169277191,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10951","display_name":"Cryptographic Implementations and Security","score":0.006899999920278788,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/homomorphic-encryption","display_name":"Homomorphic encryption","score":0.8733999729156494},{"id":"https://openalex.org/keywords/matrix-multiplication","display_name":"Matrix multiplication","score":0.5526999831199646},{"id":"https://openalex.org/keywords/cryptography","display_name":"Cryptography","score":0.5117999911308289},{"id":"https://openalex.org/keywords/encryption","display_name":"Encryption","score":0.4952999949455261},{"id":"https://openalex.org/keywords/ciphertext","display_name":"Ciphertext","score":0.4803999960422516},{"id":"https://openalex.org/keywords/acceleration","display_name":"Acceleration","score":0.47920000553131104},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.41830000281333923},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.3937000036239624},{"id":"https://openalex.org/keywords/multiplication","display_name":"Multiplication (music)","score":0.35030001401901245}],"concepts":[{"id":"https://openalex.org/C158338273","wikidata":"https://www.wikidata.org/wiki/Q2154943","display_name":"Homomorphic encryption","level":3,"score":0.8733999729156494},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.847100019454956},{"id":"https://openalex.org/C17349429","wikidata":"https://www.wikidata.org/wiki/Q1049914","display_name":"Matrix multiplication","level":3,"score":0.5526999831199646},{"id":"https://openalex.org/C178489894","wikidata":"https://www.wikidata.org/wiki/Q8789","display_name":"Cryptography","level":2,"score":0.5117999911308289},{"id":"https://openalex.org/C148730421","wikidata":"https://www.wikidata.org/wiki/Q141090","display_name":"Encryption","level":2,"score":0.4952999949455261},{"id":"https://openalex.org/C93974786","wikidata":"https://www.wikidata.org/wiki/Q1589480","display_name":"Ciphertext","level":3,"score":0.4803999960422516},{"id":"https://openalex.org/C117896860","wikidata":"https://www.wikidata.org/wiki/Q11376","display_name":"Acceleration","level":2,"score":0.47920000553131104},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.41830000281333923},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4171000123023987},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.40610000491142273},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3937000036239624},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.36579999327659607},{"id":"https://openalex.org/C2780595030","wikidata":"https://www.wikidata.org/wiki/Q3860309","display_name":"Multiplication (music)","level":2,"score":0.35030001401901245},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3465999960899353},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.34540000557899475},{"id":"https://openalex.org/C56372850","wikidata":"https://www.wikidata.org/wiki/Q1050404","display_name":"Sparse matrix","level":3,"score":0.3434999883174896},{"id":"https://openalex.org/C49154492","wikidata":"https://www.wikidata.org/wiki/Q5300","display_name":"Central processing unit","level":2,"score":0.3386000096797943},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3253999948501587},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.32440000772476196},{"id":"https://openalex.org/C186633575","wikidata":"https://www.wikidata.org/wiki/Q845060","display_name":"Maxima and minima","level":2,"score":0.3192000091075897},{"id":"https://openalex.org/C15927051","wikidata":"https://www.wikidata.org/wiki/Q246593","display_name":"Cryptographic primitive","level":4,"score":0.3046000003814697},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.2854999899864197},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.2793000042438507},{"id":"https://openalex.org/C2989134064","wikidata":"https://www.wikidata.org/wiki/Q288510","display_name":"Execution time","level":2,"score":0.2759999930858612},{"id":"https://openalex.org/C13164978","wikidata":"https://www.wikidata.org/wiki/Q600158","display_name":"Hardware acceleration","level":3,"score":0.26499998569488525},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.2606000006198883},{"id":"https://openalex.org/C100980136","wikidata":"https://www.wikidata.org/wiki/Q4668956","display_name":"Malleability","level":4,"score":0.2581999897956848},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.25270000100135803}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.11659","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.11659","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.11659","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.11659","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Fully":[0],"homomorphic":[1],"encryption":[2],"(FHE)":[3],"has":[4],"recently":[5],"attracted":[6],"significant":[7],"attention":[8],"as":[9],"both":[10,98],"a":[11,15,27,53,69,85],"cryptographic":[12],"primitive":[13],"and":[14,59,77,112],"systems":[16],"challenge.":[17],"Given":[18],"the":[19,43,75,114],"latest":[20],"advances":[21],"in":[22,48,97],"accelerated":[23],"computing,":[24],"FHE":[25,88,126],"presents":[26],"promising":[28],"opportunity":[29],"for":[30,62,92],"progress,":[31],"with":[32],"applications":[33],"ranging":[34],"from":[35,52,117],"machine":[36],"learning":[37],"to":[38,110,119],"information":[39],"security.":[40],"We":[41,67],"target":[42],"most":[44],"computationally":[45],"intensive":[46],"operation":[47],"deep":[49],"neural":[50],"networks":[51],"hardware":[54],"perspective,":[55],"matrix":[56],"multiplication":[57],"(matmul),":[58],"adapt":[60],"it":[61],"execution":[63],"on":[64],"AMD":[65],"GPUs.":[66,93],"propose":[68],"new":[70],"optimized":[71],"method":[72],"that":[73],"improves":[74],"runtime":[76],"complexity":[78,116],"of":[79],"ciphertext":[80],"matmul":[81,102,127],"by":[82,108],"using":[83],"FIDESlib,":[84],"recent":[86],"open-source":[87],"library":[89],"designed":[90],"specifically":[91],"By":[94],"exploiting":[95],"sparsity":[96],"operands,":[99],"our":[100],"sparse":[101],"implementation":[103],"outperforms":[104],"its":[105],"CPU":[106],"counterpart":[107],"up":[109],"$3.0\\times$":[111],"reduces":[113],"time":[115],"cubic":[118],"semi-linear,":[120],"demonstrating":[121],"an":[122],"improvement":[123],"over":[124],"existing":[125],"implementations.":[128]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-15T00:00:00"}
