{"id":"https://openalex.org/W4388581101","doi":"https://doi.org/10.1145/3624062.3624223","title":"Enabling Quantum Computer Simulations on AMD GPUs: a HIP Backend for Google's qsim","display_name":"Enabling Quantum Computer Simulations on AMD GPUs: a HIP Backend for Google's qsim","publication_year":2023,"publication_date":"2023-11-10","ids":{"openalex":"https://openalex.org/W4388581101","doi":"https://doi.org/10.1145/3624062.3624223"},"language":"en","primary_location":{"id":"doi:10.1145/3624062.3624223","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3624062.3624223","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3624062.3624223","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SC '23 Workshops of the International Conference on High Performance Computing, Network, Storage, and Analysis","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3624062.3624223","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085178088","display_name":"Stefano Markidis","orcid":"https://orcid.org/0000-0003-0639-0639"},"institutions":[{"id":"https://openalex.org/I86987016","display_name":"KTH Royal Institute of Technology","ror":"https://ror.org/026vcq606","country_code":"SE","type":"education","lineage":["https://openalex.org/I86987016"]}],"countries":["SE"],"is_corresponding":true,"raw_author_name":"Stefano Markidis","raw_affiliation_strings":["KTH Royal Institute of Technology, Sweden, Sweden"],"affiliations":[{"raw_affiliation_string":"KTH Royal Institute of Technology, Sweden, Sweden","institution_ids":["https://openalex.org/I86987016"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5085178088"],"corresponding_institution_ids":["https://openalex.org/I86987016"],"apc_list":null,"apc_paid":null,"fwci":0.8641,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.79494649,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1478","last_page":"1486"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10682","display_name":"Quantum Computing Algorithms and Architecture","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10020","display_name":"Quantum Information and Cryptography","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13182","display_name":"Quantum-Dot Cellular Automata","score":0.9869999885559082,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8510897159576416},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.6652238965034485},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5481141805648804},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.49336639046669006},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.46185600757598877},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.43381935358047485},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.4033430814743042},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.1385849416255951},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.13034239411354065}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8510897159576416},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.6652238965034485},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5481141805648804},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.49336639046669006},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.46185600757598877},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.43381935358047485},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.4033430814743042},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.1385849416255951},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.13034239411354065},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3624062.3624223","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3624062.3624223","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3624062.3624223","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SC '23 Workshops of the International Conference on High Performance Computing, Network, Storage, and Analysis","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3624062.3624223","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3624062.3624223","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3624062.3624223","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SC '23 Workshops of the International Conference on High Performance Computing, Network, Storage, and Analysis","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.47999998927116394,"display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G3165808449","display_name":null,"funder_award_id":"022-06725","funder_id":"https://openalex.org/F4320322581","funder_display_name":"Vetenskapsr\u00e5det"},{"id":"https://openalex.org/G4493597635","display_name":null,"funder_award_id":"NAISS","funder_id":"https://openalex.org/F4320322581","funder_display_name":"Vetenskapsr\u00e5det"},{"id":"https://openalex.org/G8338695050","display_name":null,"funder_award_id":"2022-0672","funder_id":"https://openalex.org/F4320322581","funder_display_name":"Vetenskapsr\u00e5det"},{"id":"https://openalex.org/G8531805188","display_name":"Plasma Exascale-Performance Simulations CoE - Pushing flagship plasma simulations codes to tackle exascale-enabled Grand Challenges via performance optimisation and codesign","funder_award_id":"101093261","funder_id":"https://openalex.org/F4320320300","funder_display_name":"European Commission"},{"id":"https://openalex.org/G8869864247","display_name":null,"funder_award_id":"2022-06725","funder_id":"https://openalex.org/F4320322581","funder_display_name":"Vetenskapsr\u00e5det"}],"funders":[{"id":"https://openalex.org/F4320320300","display_name":"European Commission","ror":"https://ror.org/00k4n6c32"},{"id":"https://openalex.org/F4320322581","display_name":"Vetenskapsr\u00e5det","ror":"https://ror.org/03zttf063"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4388581101.pdf"},"referenced_works_count":30,"referenced_works":["https://openalex.org/W1480958225","https://openalex.org/W1631356911","https://openalex.org/W2072969317","https://openalex.org/W2158138673","https://openalex.org/W2607213325","https://openalex.org/W2800906530","https://openalex.org/W2904368027","https://openalex.org/W2920893842","https://openalex.org/W2944581240","https://openalex.org/W2946582523","https://openalex.org/W2963212486","https://openalex.org/W3003732914","https://openalex.org/W3016555448","https://openalex.org/W3041333143","https://openalex.org/W3099332271","https://openalex.org/W3100200555","https://openalex.org/W3101479050","https://openalex.org/W3108987040","https://openalex.org/W3128354053","https://openalex.org/W3135510046","https://openalex.org/W3181290353","https://openalex.org/W4205110008","https://openalex.org/W4206951734","https://openalex.org/W4234592442","https://openalex.org/W4307872100","https://openalex.org/W6931031300","https://openalex.org/W6931468768","https://openalex.org/W6950286395","https://openalex.org/W6950480785","https://openalex.org/W6969035171"],"related_works":["https://openalex.org/W66594024","https://openalex.org/W1963859303","https://openalex.org/W2364044215","https://openalex.org/W2389600408","https://openalex.org/W240129890","https://openalex.org/W3048701459","https://openalex.org/W2149078538","https://openalex.org/W2080146221","https://openalex.org/W2370314112","https://openalex.org/W1912958759"],"abstract_inverted_index":{"Quantum":[0,88],"computer":[1,27],"simulators":[2],"play":[3],"a":[4,25,49,69,94,111,157,162,166,171,192,208],"critical":[5],"role":[6],"in":[7],"supporting":[8],"the":[9,37,44,63,74,79,86,107,128,140,179,197,201],"development":[10],"and":[11,16,42,78,131,144],"validation":[12],"of":[13,183],"quantum":[14,26,185],"algorithms":[15],"hardware.":[17],"This":[18],"study":[19],"focuses":[20],"on":[21,61,68,103,127],"porting":[22],"Google\u2019s":[23],"qsim,":[24],"simulator,":[28],"to":[29,47,116,196],"AMD":[30,55,75,80,104,132,141,202],"Graphics":[31],"Processing":[32],"Units":[33],"(GPUs).":[34],"We":[35,84],"leverage":[36],"existing":[38],"qsim":[39,50,100,198,204],"CUDA":[40,199],"backend":[41,52,102,205],"harness":[43],"HIPIFY":[45],"tool":[46],"provide":[48],"HIP":[51,64,101,203],"tailored":[53],"for":[54,212],"GPUs.":[56,134],"Our":[57,121,176],"performance":[58,126,146,174,181,193],"analysis":[59],"centers":[60],"evaluating":[62],"backend\u2019s":[65],"capabilities,":[66],"executed":[67],"computing":[70],"node":[71],"equipped":[72],"with":[73,150],"MI250X":[76,133],"GPU":[77,105],"EPYC":[81],"Trento":[82],"CPU.":[83],"use":[85],"Random":[87],"Circuit":[89],"(RQC)":[90],"sampling":[91],"benchmark,":[92],"employing":[93],"circuit":[95],"featuring":[96],"30":[97],"qubits.":[98],"The":[99,135],"outperforms":[106,139],"CPU":[108,189],"version":[109],"by":[110],"remarkable":[112],"margin,":[113],"achieving":[114],"seven":[115],"nine":[117],"times":[118],"faster":[119],"speeds.":[120],"investigation":[122],"also":[123],"compares":[124],"qsim\u2019s":[125],"Nvidia":[129,136],"A100":[130,137],"consistently":[138],"MI250x":[142],"counterpart,":[143],"this":[145],"gap":[147],"further":[148,213],"widens":[149],"optimal":[151],"gate":[152],"fusion":[153,159,168],"configurations.":[154],"For":[155],"instance,":[156],"two-gate":[158],"configuration":[160],"exhibits":[161],"5%":[163],"difference,":[164],"whereas":[165],"four-gate":[167],"setup":[169],"reveals":[170],"large":[172],"44%":[173],"gap.":[175],"work":[177],"highlights":[178],"substantial":[180],"advantage":[182],"GPU-based":[184],"simulation":[186],"over":[187],"traditional":[188],"approaches.":[190],"Despite":[191],"lag":[194],"compared":[195],"backend,":[200],"emerges":[206],"as":[207],"competitive":[209],"alternative":[210],"poised":[211],"optimization.":[214]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
