{"id":"https://openalex.org/W4390880528","doi":"https://doi.org/10.1145/3640464","title":"LL-GNN: Low Latency Graph Neural Networks on FPGAs for High Energy Physics","display_name":"LL-GNN: Low Latency Graph Neural Networks on FPGAs for High Energy Physics","publication_year":2024,"publication_date":"2024-01-15","ids":{"openalex":"https://openalex.org/W4390880528","doi":"https://doi.org/10.1145/3640464"},"language":"en","primary_location":{"id":"doi:10.1145/3640464","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3640464","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3640464","source":{"id":"https://openalex.org/S136160450","display_name":"ACM Transactions on Embedded Computing Systems","issn_l":"1539-9087","issn":["1539-9087","1558-3465"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Embedded Computing Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3640464","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054475218","display_name":"Zhiqiang Que","orcid":"https://orcid.org/0000-0002-9263-6529"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Zhiqiang Que","raw_affiliation_strings":["Department of Computing, Imperial College London, London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Computing, Imperial College London, London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057043409","display_name":"Hongxiang Fan","orcid":"https://orcid.org/0000-0003-2387-5611"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Hongxiang Fan","raw_affiliation_strings":["Department of Computing, Imperial College London, London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Computing, Imperial College London, London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015420000","display_name":"Marcus H. Loo","orcid":"https://orcid.org/0009-0006-1254-8120"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Marcus Loo","raw_affiliation_strings":["Department of Computing, Imperial College London, London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Computing, Imperial College London, London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100317850","display_name":"He Li","orcid":"https://orcid.org/0000-0002-1540-189X"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"He Li","raw_affiliation_strings":["School of Electronic and Engineering, Southeast University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic and Engineering, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031107943","display_name":"Michaela Blott","orcid":"https://orcid.org/0000-0002-7833-4057"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Michaela Blott","raw_affiliation_strings":["AMD Adaptive and Embedded Computing Group (AECG) Labs, Dublin, Ireland"],"affiliations":[{"raw_affiliation_string":"AMD Adaptive and Embedded Computing Group (AECG) Labs, Dublin, Ireland","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106315352","display_name":"M. Pierini","orcid":"https://orcid.org/0000-0003-1939-4268"},"institutions":[{"id":"https://openalex.org/I67311998","display_name":"European Organization for Nuclear Research","ror":"https://ror.org/01ggx4157","country_code":"CH","type":"facility","lineage":["https://openalex.org/I67311998"]}],"countries":["CH"],"is_corresponding":false,"raw_author_name":"Maurizio Pierini","raw_affiliation_strings":["European Organization for Nuclear Research (CERN), Geneva, Switzerland"],"affiliations":[{"raw_affiliation_string":"European Organization for Nuclear Research (CERN), Geneva, Switzerland","institution_ids":["https://openalex.org/I67311998"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064345784","display_name":"A. Tapper","orcid":"https://orcid.org/0000-0003-4543-864X"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Alexander Tapper","raw_affiliation_strings":["Department of Physics, Imperial College London, London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Physics, Imperial College London, London, UK","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057940557","display_name":"Wayne Luk","orcid":"https://orcid.org/0000-0002-6750-927X"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Wayne Luk","raw_affiliation_strings":["Department of Computing, Imperial College London, London, UK"],"affiliations":[{"raw_affiliation_string":"Department of Computing, Imperial College London, London, UK","institution_ids":["https://openalex.org/I47508984"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5054475218"],"corresponding_institution_ids":["https://openalex.org/I47508984"],"apc_list":null,"apc_paid":null,"fwci":4.4871,"has_fulltext":true,"cited_by_count":19,"citation_normalized_percentile":{"value":0.954829,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"23","issue":"2","first_page":"1","last_page":"28"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14347","display_name":"Big Data and Digital Economy","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9873999953269958,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.8064958453178406},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8021502494812012},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.6123257279396057},{"id":"https://openalex.org/keywords/low-latency","display_name":"Low latency (capital markets)","score":0.528788149356842},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4765232801437378},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.38124769926071167},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.3223339021205902},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3146096169948578},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2534950375556946},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.14900940656661987},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.14050984382629395}],"concepts":[{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.8064958453178406},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8021502494812012},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.6123257279396057},{"id":"https://openalex.org/C46637626","wikidata":"https://www.wikidata.org/wiki/Q6693015","display_name":"Low latency (capital markets)","level":2,"score":0.528788149356842},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4765232801437378},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.38124769926071167},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3223339021205902},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3146096169948578},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2534950375556946},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.14900940656661987},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.14050984382629395}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3640464","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3640464","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3640464","source":{"id":"https://openalex.org/S136160450","display_name":"ACM Transactions on Embedded Computing Systems","issn_l":"1539-9087","issn":["1539-9087","1558-3465"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Embedded Computing Systems","raw_type":"journal-article"},{"id":"pmh:oai:cds.cern.ch:2933200","is_oa":true,"landing_page_url":"http://cds.cern.ch/record/2933200","pdf_url":"https://cds.cern.ch/record/2933200/files/Published version.pdf","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":null}],"best_oa_location":{"id":"doi:10.1145/3640464","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3640464","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3640464","source":{"id":"https://openalex.org/S136160450","display_name":"ACM Transactions on Embedded Computing Systems","issn_l":"1539-9087","issn":["1539-9087","1558-3465"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Embedded Computing Systems","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2562028074","display_name":null,"funder_award_id":"ST/V005936/1","funder_id":"https://openalex.org/F4320334632","funder_display_name":"Science and Technology Facilities Council"},{"id":"https://openalex.org/G2784140359","display_name":"Application Customisation: Enhancing Design Quality and Developer Productivity","funder_award_id":"EP/P010040/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G3496335909","display_name":"Centre for Spatial Computational Learning","funder_award_id":"EP/S030069/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G4587427570","display_name":null,"funder_award_id":"EP/S030069/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G514660964","display_name":"DART: Design Accelerators by Regulating Transformations","funder_award_id":"EP/V028251/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G5201431165","display_name":"EPSRC Centre for Doctoral Training in High Performance Embedded and Distributed Systems","funder_award_id":"EP/L016796/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G5248561189","display_name":"Event-based parallel computing - partially ordered event-triggered systems (POETS)","funder_award_id":"EP/N031768/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G6653872853","display_name":null,"funder_award_id":"EP/L016","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G7493804148","display_name":null,"funder_award_id":"EP/N031768/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G774180880","display_name":null,"funder_award_id":"EP/P010040/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G8051675292","display_name":null,"funder_award_id":"EP/V028251/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G8719353587","display_name":null,"funder_award_id":"EP/P0","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320313559","display_name":"CERN","ror":"https://ror.org/01ggx4157"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"},{"id":"https://openalex.org/F4320334632","display_name":"Science and Technology Facilities Council","ror":"https://ror.org/057g20z61"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4390880528.pdf","grobid_xml":"https://content.openalex.org/works/W4390880528.grobid-xml"},"referenced_works_count":38,"referenced_works":["https://openalex.org/W2433841930","https://openalex.org/W2594183968","https://openalex.org/W2798084934","https://openalex.org/W2807021761","https://openalex.org/W2883927138","https://openalex.org/W2891946740","https://openalex.org/W2911708692","https://openalex.org/W2914721378","https://openalex.org/W2916639378","https://openalex.org/W2964571482","https://openalex.org/W2968312879","https://openalex.org/W3000310304","https://openalex.org/W3002851826","https://openalex.org/W3047846843","https://openalex.org/W3048084597","https://openalex.org/W3092940566","https://openalex.org/W3100848837","https://openalex.org/W3101493857","https://openalex.org/W3105412497","https://openalex.org/W3106125969","https://openalex.org/W3119613749","https://openalex.org/W3175548485","https://openalex.org/W3177366646","https://openalex.org/W3183056907","https://openalex.org/W3202404106","https://openalex.org/W4200157451","https://openalex.org/W4221029921","https://openalex.org/W4221155008","https://openalex.org/W4282011755","https://openalex.org/W4293243633","https://openalex.org/W4295365496","https://openalex.org/W4308083831","https://openalex.org/W4360831960","https://openalex.org/W4377715555","https://openalex.org/W4388214761","https://openalex.org/W4393923520","https://openalex.org/W4394057280","https://openalex.org/W7051956745"],"related_works":["https://openalex.org/W1967938402","https://openalex.org/W2386041993","https://openalex.org/W1608572506","https://openalex.org/W3205411230","https://openalex.org/W4286899009","https://openalex.org/W3163341049","https://openalex.org/W9168048","https://openalex.org/W4300849822","https://openalex.org/W4376480820","https://openalex.org/W3155891479"],"abstract_inverted_index":{"This":[0,67],"work":[1,238],"presents":[2,29],"a":[3,30,47,70,87,95,124,141,152,155,162,173,201,228,262],"novel":[4,71],"reconfigurable":[5],"architecture":[6,182],"for":[7,15,42,99,176],"Low":[8],"Latency":[9],"Graph":[10],"Neural":[11],"Network":[12],"(LL-GNN)":[13],"designs":[14,195],"particle":[16,27],"detectors,":[17],"delivering":[18],"unprecedented":[19],"low":[20,178,255],"latency":[21,37,118,135,158,168,179,248],"performance.":[22],"Incorporating":[23],"FPGA-based":[24],"GNNs":[25,260],"into":[26],"detectors":[28],"unique":[31],"challenge":[32],"since":[33],"it":[34,269],"requires":[35],"sub-microsecond":[36],"to":[38,116,129,214,221,232,241,256,270,290],"deploy":[39],"the":[40,57,61,82,100,106,132,190,233,247,280],"networks":[41],"online":[43],"event":[44],"selection":[45],"with":[46,154,196],"data":[48,89,293],"rate":[49],"of":[50,52,113,192,249,259,283],"hundreds":[51],"terabytes":[53],"per":[54],"second":[55],"in":[56,261],"Level-1":[58],"triggers":[59],"at":[60],"CERN":[62],"Large":[63],"Hadron":[64],"Collider":[65],"experiments.":[66],"article":[68],"proposes":[69],"outer-product":[72],"based":[73],"matrix":[74,85,101],"multiplication":[75,102],"approach,":[76],"which":[77,104,148,188],"is":[78,127,146,212,253],"enhanced":[79],"by":[80,136,286],"exploiting":[81],"structured":[83,107],"adjacency":[84,114],"and":[86,110,119,186,218],"column-major":[88],"layout.":[90],"In":[91],"addition,":[92],"we":[93],"propose":[94],"custom":[96],"code":[97],"transformation":[98],"operations,":[103],"leverages":[105],"sparsity":[108],"patterns":[109],"binary":[111],"features":[112],"matrices":[115],"reduce":[117,131],"improve":[120],"hardware":[121,181],"efficiency.":[122],"Moreover,":[123,246],"fusion":[125],"step":[126],"introduced":[128],"further":[130],"end-to-end":[133],"design":[134,153,165,252,278],"eliminating":[137],"unnecessary":[138],"boundaries.":[139],"Furthermore,":[140],"GNN-specific":[142],"algorithm-hardware":[143],"co-design":[144],"approach":[145],"presented":[147],"not":[149],"only":[150],"finds":[151,161],"much":[156],"better":[157],"but":[159],"also":[160],"high":[163],"accuracy":[164],"under":[166],"given":[167],"constraints.":[169],"To":[170],"facilitate":[171],"this,":[172],"customizable":[174],"template":[175],"this":[177,237],"GNN":[180],"has":[183],"been":[184],"designed":[185],"open-sourced,":[187],"enables":[189],"generation":[191,282],"low-latency":[193],"FPGA":[194,210,235,251],"efficient":[197],"resource":[198],"utilization":[199],"using":[200],"high-level":[202],"synthesis":[203],"tool.":[204],"Evaluation":[205],"results":[206],"show":[207],"that":[208],"our":[209,250],"implementation":[211],"up":[213,220],"9.0":[215],"times":[216,223,243],"faster":[217],"achieves":[219,239],"13.1":[222],"higher":[224],"power":[225],"efficiency":[226],"than":[227],"GPU":[229],"implementation.":[230],"Compared":[231],"previous":[234],"implementations,":[236],"6.51":[240],"16.7":[242],"lower":[244],"latency.":[245],"sufficiently":[254],"enable":[257],"deployment":[258],"sub-microsecond,":[263],"real-time":[264],"collider":[265],"trigger":[266,284],"system,":[267],"enabling":[268,287],"benefit":[271],"from":[272],"improved":[273],"accuracy.":[274],"The":[275],"proposed":[276],"LL-GNN":[277],"advances":[279],"next":[281],"systems":[285],"sophisticated":[288],"algorithms":[289],"process":[291],"experimental":[292],"efficiently.":[294]},"counts_by_year":[{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
