{"id":"https://openalex.org/W4408256689","doi":"https://doi.org/10.1145/3722219","title":"Gator: Accelerating Graph Attention Networks by Jointly Optimizing Attention and Graph Processing","display_name":"Gator: Accelerating Graph Attention Networks by Jointly Optimizing Attention and Graph Processing","publication_year":2025,"publication_date":"2025-03-08","ids":{"openalex":"https://openalex.org/W4408256689","doi":"https://doi.org/10.1145/3722219"},"language":"en","primary_location":{"id":"doi:10.1145/3722219","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3722219","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3722219","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3722219","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004560818","display_name":"Xiaobo Lu","orcid":"https://orcid.org/0009-0005-2673-8673"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiaobo Lu","raw_affiliation_strings":["National University of Defense Technology","National University of Defense Technology,  Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology","institution_ids":["https://openalex.org/I170215575"]},{"raw_affiliation_string":"National University of Defense Technology,  Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083171604","display_name":"Jianbin Fang","orcid":"https://orcid.org/0000-0003-3542-4869"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianbin Fang","raw_affiliation_strings":["National University of Defense Technology","National University of Defense Technology,  Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology","institution_ids":["https://openalex.org/I170215575"]},{"raw_affiliation_string":"National University of Defense Technology,  Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103142055","display_name":"Peng Lin","orcid":"https://orcid.org/0000-0002-6828-3364"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Peng","raw_affiliation_strings":["National University of Defense Technology","National University of Defense Technology,  Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology","institution_ids":["https://openalex.org/I170215575"]},{"raw_affiliation_string":"National University of Defense Technology,  Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101626850","display_name":"Chun Huang","orcid":"https://orcid.org/0000-0002-0317-8192"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chun Huang","raw_affiliation_strings":["National University of Defense Technology","National University of Defense Technology,  Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology","institution_ids":["https://openalex.org/I170215575"]},{"raw_affiliation_string":"National University of Defense Technology,  Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111043550","display_name":"Zixiao Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zixiao Yu","raw_affiliation_strings":["National University of Defense Technology","National University of Defense Technology,  Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology","institution_ids":["https://openalex.org/I170215575"]},{"raw_affiliation_string":"National University of Defense Technology,  Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055015632","display_name":"Tiejun Li","orcid":"https://orcid.org/0000-0003-3381-3027"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tiejun Li","raw_affiliation_strings":["National University of Defense Technology","National University of Defense Technology,  Changsha, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology","institution_ids":["https://openalex.org/I170215575"]},{"raw_affiliation_string":"National University of Defense Technology,  Changsha, China","institution_ids":["https://openalex.org/I170215575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5004560818"],"corresponding_institution_ids":["https://openalex.org/I170215575"],"apc_list":null,"apc_paid":null,"fwci":0.7467,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.69213475,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"22","issue":"2","first_page":"1","last_page":"24"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10429","display_name":"EEG and Brain-Computer Interfaces","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8663648366928101},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.6589173078536987},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.36902350187301636},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3219561278820038}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8663648366928101},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.6589173078536987},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.36902350187301636},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3219561278820038}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3722219","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3722219","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3722219","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3722219","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3722219","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3722219","source":{"id":"https://openalex.org/S26056741","display_name":"ACM Transactions on Architecture and Code Optimization","issn_l":"1544-3566","issn":["1544-3566","1544-3973"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Architecture and Code Optimization","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4408256689.pdf"},"referenced_works_count":52,"referenced_works":["https://openalex.org/W1977661221","https://openalex.org/W1983394510","https://openalex.org/W2070232376","https://openalex.org/W2120000030","https://openalex.org/W2725159389","https://openalex.org/W2761132374","https://openalex.org/W2908404712","https://openalex.org/W2945623882","https://openalex.org/W2945827377","https://openalex.org/W3009233884","https://openalex.org/W3015616869","https://openalex.org/W3017024317","https://openalex.org/W3017228913","https://openalex.org/W3024534448","https://openalex.org/W3045613009","https://openalex.org/W3086821706","https://openalex.org/W3093563174","https://openalex.org/W3101553402","https://openalex.org/W3103168911","https://openalex.org/W3105753905","https://openalex.org/W3111142806","https://openalex.org/W3116604690","https://openalex.org/W3135280793","https://openalex.org/W3144812654","https://openalex.org/W3155936517","https://openalex.org/W3157609068","https://openalex.org/W3158126894","https://openalex.org/W3158371160","https://openalex.org/W3159727696","https://openalex.org/W3175201128","https://openalex.org/W3189877953","https://openalex.org/W3205531882","https://openalex.org/W3206453033","https://openalex.org/W4200042293","https://openalex.org/W4211165432","https://openalex.org/W4214686755","https://openalex.org/W4224267386","https://openalex.org/W4226137788","https://openalex.org/W4293025165","https://openalex.org/W4312076502","https://openalex.org/W4315977496","https://openalex.org/W4318541578","https://openalex.org/W4318686642","https://openalex.org/W4321446145","https://openalex.org/W4321466207","https://openalex.org/W4360831816","https://openalex.org/W4360831960","https://openalex.org/W4380881077","https://openalex.org/W4385801275","https://openalex.org/W4389476227","https://openalex.org/W4400410020","https://openalex.org/W6921559792"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Graph":[0],"attention":[1,14,49],"networks":[2,20],"(GATs)":[3],"have":[4,40],"advanced":[5],"performance":[6,54],"in":[7,52,168],"various":[8,120],"application":[9],"domains":[10],"by":[11,122],"introducing":[12],"the":[13,17,44,48,77,92,101,105,109],"mechanism":[15],"into":[16],"graph":[18,83,94],"neural":[19],"(GNNs).":[21],"The":[22],"inefficiency":[23],"of":[24,104,157],"running":[25],"GATs":[26],"on":[27,42],"CPUs":[28],"or":[29,47],"GPUs":[30],"necessitates":[31],"specialized":[32,37],"hardware":[33,110],"designs.":[34],"Unfortunately,":[35],"previous":[36],"architecture":[38,46],"designs":[39,113],"focused":[41],"either":[43],"GNN":[45],"mechanism,":[50],"resulting":[51],"limited":[53],"and":[55,85,99,128,153],"leaving":[56],"ample":[57],"room":[58],"for":[59,73,132],"improvement.":[60],"This":[61],"article":[62],"presents":[63],"Gator":[64,80,112],",":[65],"a":[66,114,124,129,155,163],"joint":[67],"optimization":[68],"approach":[69,142],"with":[70,162,177],"software\u2013hardware":[71],"co-designs":[72],"GAT":[74],"inference.":[75],"On":[76,108],"software":[78],"level,":[79,111],"leverages":[81],"degree-weighted":[82],"partitioning":[84],"parameter-adaptive":[86],"feature":[87],"selection":[88],"techniques":[89],"to":[90,118,149,159,165,173],"preprocess":[91],"input":[93],"data,":[95],"mining":[96],"subgraph-level":[97],"parallelism":[98],"mitigating":[100],"computation":[102,126],"bottleneck":[103],"dedicated":[106],"dataflow.":[107],"unified":[115],"processing":[116],"engine":[117],"support":[119],"kernels":[121],"extracting":[123],"common":[125],"pattern":[127],"dimension-aware":[130],"microarchitecture":[131],"efficient":[133],"partial":[134],"sum":[135],"reduction.":[136],"Extensive":[137],"experiments":[138],"show":[139],"that":[140],"our":[141],"can":[143],"achieve":[144],"11.5\u00d7":[145],"more":[146],"efficiency":[147],"compared":[148,172],"NVIDIA":[150],"RTX":[151],"4090":[152],"provide":[154],"speedup":[156],"3\u00d7":[158],"9.4\u00d7,":[160],"along":[161],"2.6\u00d7":[164],"4.7\u00d7":[166],"reduction":[167],"memory":[169],"traffic,":[170],"when":[171],"six":[174],"state-of-the-art":[175],"methods,":[176],"minimal":[178],"accuracy":[179],"loss.":[180]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2025-12-23T23:11:35.936235","created_date":"2025-10-10T00:00:00"}
