{"id":"https://openalex.org/W4388581228","doi":"https://doi.org/10.1145/3624062.3625534","title":"Hardware Specialization: Estimating Monte Carlo Cross-Section Lookup Kernel Performance and Area","display_name":"Hardware Specialization: Estimating Monte Carlo Cross-Section Lookup Kernel Performance and Area","publication_year":2023,"publication_date":"2023-11-10","ids":{"openalex":"https://openalex.org/W4388581228","doi":"https://doi.org/10.1145/3624062.3625534"},"language":"en","primary_location":{"id":"doi:10.1145/3624062.3625534","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3624062.3625534","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SC '23 Workshops of the International Conference on High Performance Computing, Network, Storage, and Analysis","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5032371884","display_name":"Kazutomo Yoshii","orcid":"https://orcid.org/0000-0003-1904-5383"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Kazutomo Yoshii","raw_affiliation_strings":["Argonne National Laboratory, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019482956","display_name":"John Tramm","orcid":"https://orcid.org/0000-0002-5397-4402"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"John Tramm","raw_affiliation_strings":["Argonne National Laboratory, United States of America"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, United States of America","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020047116","display_name":"Bryce Allen","orcid":"https://orcid.org/0000-0001-7081-3267"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bryce Allen","raw_affiliation_strings":["Argonne National Laboratory, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103033249","display_name":"Tomohiro Ueno","orcid":"https://orcid.org/0000-0002-0228-0566"},"institutions":[{"id":"https://openalex.org/I4210129730","display_name":"RIKEN Center for Computational Science","ror":"https://ror.org/03r519674","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210129730"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tomohiro Ueno","raw_affiliation_strings":["RIKEN Center for Computational Science (R-CCS), Japan"],"affiliations":[{"raw_affiliation_string":"RIKEN Center for Computational Science (R-CCS), Japan","institution_ids":["https://openalex.org/I4210129730"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081752237","display_name":"Kentaro Sano","orcid":"https://orcid.org/0000-0002-6681-4192"},"institutions":[{"id":"https://openalex.org/I4210129730","display_name":"RIKEN Center for Computational Science","ror":"https://ror.org/03r519674","country_code":"JP","type":"facility","lineage":["https://openalex.org/I4210110652","https://openalex.org/I4210129730"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kentaro Sano","raw_affiliation_strings":["RIKEN Center for Computational Science (R-CCS), Japan"],"affiliations":[{"raw_affiliation_string":"RIKEN Center for Computational Science (R-CCS), Japan","institution_ids":["https://openalex.org/I4210129730"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002070572","display_name":"Andrew Siegel","orcid":"https://orcid.org/0009-0002-6552-0982"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrew Siegel","raw_affiliation_strings":["Argonne National Laboratory, USA"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, USA","institution_ids":["https://openalex.org/I1282105669"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038177319","display_name":"Pete Beckman","orcid":"https://orcid.org/0000-0002-9428-7801"},"institutions":[{"id":"https://openalex.org/I1282105669","display_name":"Argonne National Laboratory","ror":"https://ror.org/05gvnxz63","country_code":"US","type":"facility","lineage":["https://openalex.org/I1282105669","https://openalex.org/I1330989302","https://openalex.org/I39565521","https://openalex.org/I40347166"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Pete Beckman","raw_affiliation_strings":["Argonne National Laboratory, United States of America"],"affiliations":[{"raw_affiliation_string":"Argonne National Laboratory, United States of America","institution_ids":["https://openalex.org/I1282105669"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5032371884"],"corresponding_institution_ids":["https://openalex.org/I1282105669"],"apc_list":null,"apc_paid":null,"fwci":0.6151,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.64604271,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1274","last_page":"1278"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7957309484481812},{"id":"https://openalex.org/keywords/kernel","display_name":"Kernel (algebra)","score":0.6682320833206177},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6615928411483765},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.5647770166397095},{"id":"https://openalex.org/keywords/monte-carlo-method","display_name":"Monte Carlo method","score":0.5240219235420227},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.5107157230377197},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.48536717891693115},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.43608468770980835},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.4314861595630646},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.3220423460006714},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.16413089632987976}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7957309484481812},{"id":"https://openalex.org/C74193536","wikidata":"https://www.wikidata.org/wiki/Q574844","display_name":"Kernel (algebra)","level":2,"score":0.6682320833206177},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6615928411483765},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5647770166397095},{"id":"https://openalex.org/C19499675","wikidata":"https://www.wikidata.org/wiki/Q232207","display_name":"Monte Carlo method","level":2,"score":0.5240219235420227},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.5107157230377197},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.48536717891693115},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.43608468770980835},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.4314861595630646},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.3220423460006714},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.16413089632987976},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3624062.3625534","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3624062.3625534","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SC '23 Workshops of the International Conference on High Performance Computing, Network, Storage, and Analysis","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W2013248679","https://openalex.org/W2085012105","https://openalex.org/W2162385899","https://openalex.org/W2176890627","https://openalex.org/W2222609946","https://openalex.org/W2512569446","https://openalex.org/W2524971917","https://openalex.org/W2983971024","https://openalex.org/W3209739359","https://openalex.org/W3216238950","https://openalex.org/W4293023438"],"related_works":["https://openalex.org/W1981780420","https://openalex.org/W2182707996","https://openalex.org/W45233828","https://openalex.org/W2964988449","https://openalex.org/W2111241003","https://openalex.org/W2397952901","https://openalex.org/W2029380707","https://openalex.org/W1967938402","https://openalex.org/W2386041993","https://openalex.org/W1608572506"],"abstract_inverted_index":{"Hardware":[0],"specialization":[1,19],"is":[2,13,111],"one":[3],"of":[4,33,87,136],"the":[5,9,30,48,88,92,108,117,137],"promising":[6],"directions":[7],"in":[8,91],"post-Moore":[10],"era.":[11],"It":[12],"imperative":[14],"to":[15,65,75],"understand":[16],"how":[17],"hardware":[18,41,81],"paradigms":[20],"can":[21],"benefit":[22],"HPC.":[23],"An":[24],"essential":[25],"question":[26],"revolves":[27],"around":[28],"estimating":[29],"theoretical":[31],"performance":[32],"an":[34],"optimally":[35],"specialized":[36,68],"architecture":[37],"without":[38],"requiring":[39],"extensive":[40],"development":[42],"expertise":[43],"and":[44,71,96,124],"efforts.":[45],"Focusing":[46],"on":[47],"Monte":[49],"Carlo":[50],"cross-section":[51],"lookup":[52,115],"kernel,":[53],"known":[54],"for":[55,100],"its":[56],"notably":[57],"low":[58],"resource":[59,73,101],"utilization,":[60],"we":[61],"develop":[62],"a":[63,67,125,131],"workflow":[64],"simulate":[66],"architecture\u2019s":[69],"timing":[70],"estimate":[72],"usage":[74],"answer":[76],"these":[77],"questions,":[78],"leveraging":[79],"open-source":[80],"tools.":[82],"We":[83],"implement":[84],"building":[85],"blocks":[86],"kernel":[89,109],"pipeline":[90,128],"Chisel":[93],"construction":[94],"language":[95],"generate":[97],"Verilog":[98],"codes":[99],"estimation.":[102],"Our":[103],"late-breaking":[104],"results":[105],"show":[106],"that":[107],"latency":[110],"46":[112],"cycles":[113],"per":[114],"while":[116],"optimized":[118],"CPU":[119],"code":[120],"takes":[121],"680":[122],"cycles,":[123],"potential":[126],"15k":[127],"copies":[129],"within":[130],"698":[132],"mm2":[133],"die,":[134],"reflective":[135],"Intel":[138],"Xeon":[139],"Platinum":[140],"8180":[141],"dimensions.":[142]},"counts_by_year":[{"year":2025,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
