{"id":"https://openalex.org/W4387848944","doi":"https://doi.org/10.1145/3583780.3615206","title":"A Flash Attention Transformer for Multi-Behaviour Recommendation","display_name":"A Flash Attention Transformer for Multi-Behaviour Recommendation","publication_year":2023,"publication_date":"2023-10-21","ids":{"openalex":"https://openalex.org/W4387848944","doi":"https://doi.org/10.1145/3583780.3615206"},"language":"en","primary_location":{"id":"doi:10.1145/3583780.3615206","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3583780.3615206","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3583780.3615206","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3583780.3615206","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075946456","display_name":"Tendai Mukande","orcid":"https://orcid.org/0000-0002-0654-7141"},"institutions":[{"id":"https://openalex.org/I42934936","display_name":"Dublin City University","ror":"https://ror.org/04a1a1e81","country_code":"IE","type":"education","lineage":["https://openalex.org/I42934936"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Tendai Mukande","raw_affiliation_strings":["Dublin City University, Dublin, Ireland"],"raw_orcid":"https://orcid.org/0000-0002-0654-7141","affiliations":[{"raw_affiliation_string":"Dublin City University, Dublin, Ireland","institution_ids":["https://openalex.org/I42934936"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004314068","display_name":"Esraa Ali","orcid":"https://orcid.org/0000-0003-1600-3161"},"institutions":[{"id":"https://openalex.org/I42934936","display_name":"Dublin City University","ror":"https://ror.org/04a1a1e81","country_code":"IE","type":"education","lineage":["https://openalex.org/I42934936"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Esraa Ali","raw_affiliation_strings":["Dublin City University, Dublin, Ireland"],"raw_orcid":"https://orcid.org/0000-0003-1600-3161","affiliations":[{"raw_affiliation_string":"Dublin City University, Dublin, Ireland","institution_ids":["https://openalex.org/I42934936"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061679230","display_name":"Annalina Caputo","orcid":"https://orcid.org/0000-0002-7144-8545"},"institutions":[{"id":"https://openalex.org/I42934936","display_name":"Dublin City University","ror":"https://ror.org/04a1a1e81","country_code":"IE","type":"education","lineage":["https://openalex.org/I42934936"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Annalina Caputo","raw_affiliation_strings":["Dublin City University, Dublin, Ireland"],"raw_orcid":"https://orcid.org/0000-0002-7144-8545","affiliations":[{"raw_affiliation_string":"Dublin City University, Dublin, Ireland","institution_ids":["https://openalex.org/I42934936"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009000289","display_name":"Ruihai Dong","orcid":"https://orcid.org/0000-0002-2509-1370"},"institutions":[{"id":"https://openalex.org/I100930933","display_name":"University College Dublin","ror":"https://ror.org/05m7pjf47","country_code":"IE","type":"education","lineage":["https://openalex.org/I100930933"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Ruihai Dong","raw_affiliation_strings":["University College Dublin, Dublin, Ireland"],"raw_orcid":"https://orcid.org/0000-0002-2509-1370","affiliations":[{"raw_affiliation_string":"University College Dublin, Dublin, Ireland","institution_ids":["https://openalex.org/I100930933"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5106498523","display_name":"Noel E. O\u2019Connor","orcid":"https://orcid.org/0000-0002-4033-9135"},"institutions":[{"id":"https://openalex.org/I42934936","display_name":"Dublin City University","ror":"https://ror.org/04a1a1e81","country_code":"IE","type":"education","lineage":["https://openalex.org/I42934936"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Noel E. O'Connor","raw_affiliation_strings":["Dublin City University, Dublin, Ireland"],"raw_orcid":"https://orcid.org/0000-0002-4033-9135","affiliations":[{"raw_affiliation_string":"Dublin City University, Dublin, Ireland","institution_ids":["https://openalex.org/I42934936"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4285,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.69659949,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"4210","last_page":"4214"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.988099992275238,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8191137909889221},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6273418664932251},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.5723317861557007},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44551610946655273},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.44438040256500244},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.42421725392341614},{"id":"https://openalex.org/keywords/high-memory","display_name":"High memory","score":0.42385134100914},{"id":"https://openalex.org/keywords/attention-network","display_name":"Attention network","score":0.4130491316318512},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.40435171127319336},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.11963284015655518}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8191137909889221},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6273418664932251},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.5723317861557007},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44551610946655273},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.44438040256500244},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.42421725392341614},{"id":"https://openalex.org/C2781357197","wikidata":"https://www.wikidata.org/wiki/Q5757597","display_name":"High memory","level":2,"score":0.42385134100914},{"id":"https://openalex.org/C2993807640","wikidata":"https://www.wikidata.org/wiki/Q103709453","display_name":"Attention network","level":2,"score":0.4130491316318512},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.40435171127319336},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.11963284015655518},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3583780.3615206","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3583780.3615206","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3583780.3615206","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},{"id":"pmh:oai:doras.dcu.ie:32650","is_oa":true,"landing_page_url":"https://orcid.org/0000-0002-0654-7141>,","pdf_url":"https://doras.dcu.ie/32650/1/shp2686.pdf","source":{"id":"https://openalex.org/S4306401511","display_name":"Dublin City University Open Access Institutional Repository (Dublin City University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I42934936","host_organization_name":"Dublin City University","host_organization_lineage":["https://openalex.org/I42934936"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"PeerReviewed"}],"best_oa_location":{"id":"doi:10.1145/3583780.3615206","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3583780.3615206","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3583780.3615206","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7316039843","display_name":"SFI Centre for Research Training in Machine Learning","funder_award_id":"18/CRT/6183","funder_id":"https://openalex.org/F4320320847","funder_display_name":"Science Foundation Ireland"}],"funders":[{"id":"https://openalex.org/F4320320847","display_name":"Science Foundation Ireland","ror":"https://ror.org/0271asj38"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4387848944.pdf","grobid_xml":"https://content.openalex.org/works/W4387848944.grobid-xml"},"referenced_works_count":27,"referenced_works":["https://openalex.org/W2606722458","https://openalex.org/W2740920897","https://openalex.org/W2783272285","https://openalex.org/W2892880750","https://openalex.org/W2911286998","https://openalex.org/W2951369132","https://openalex.org/W2963367478","https://openalex.org/W2974594200","https://openalex.org/W2984100107","https://openalex.org/W3015661699","https://openalex.org/W3035287707","https://openalex.org/W3035666843","https://openalex.org/W3081304929","https://openalex.org/W3085131702","https://openalex.org/W3085139254","https://openalex.org/W3131922516","https://openalex.org/W3175450343","https://openalex.org/W3207257408","https://openalex.org/W3208227120","https://openalex.org/W4214540501","https://openalex.org/W4243552710","https://openalex.org/W4281758439","https://openalex.org/W4284668205","https://openalex.org/W4285252216","https://openalex.org/W4285428788","https://openalex.org/W6775837273","https://openalex.org/W6782808188"],"related_works":["https://openalex.org/W4390273403","https://openalex.org/W4386781444","https://openalex.org/W2150182025","https://openalex.org/W3092950680","https://openalex.org/W3197542405","https://openalex.org/W2056712470","https://openalex.org/W3125580266","https://openalex.org/W4317039510","https://openalex.org/W4238861846","https://openalex.org/W4200094402"],"abstract_inverted_index":{"\\beginabstract":[0],"Recently,":[1],"modelling":[2],"heterogeneous":[3],"interactions":[4,18],"in":[5,39,69,103,110,158],"recommender":[6],"systems":[7],"has":[8],"attracted":[9],"research":[10],"interest.":[11],"Real-world":[12],"scenarios":[13],"involve":[14],"sequential":[15,44],"multi-type":[16],"user-item":[17,45,72,136],"such":[19],"as":[20],"''shape":[21,23,25,28],"view'',":[22],"add-to-favourites'',":[24],"add-to-cart''":[26],"and":[27,57,93,106,149],"purchase''.":[29],"Graph":[30],"Neural":[31],"Network":[32],"(GNN)":[33],"methods":[34,64],"have":[35,49],"been":[36,50],"widely":[37],"adopted":[38],"Representation":[40],"Learning":[41],"of":[42,55,86],"similar":[43],"interactions.":[46],"Promising":[47],"results":[48,102,140],"achieved":[51],"by":[52],"the":[53,90,120,130,146,151,161,163],"integration":[54],"GNNs":[56],"transformers":[58],"for":[59,76],"self-attention.":[60],"However,":[61],"GNN":[62],"based":[63],"suffer":[65],"from":[66],"limited":[67],"capability":[68],"handling":[70],"global":[71],"interaction":[73,137],"dependencies,":[74],"particularly":[75],"long":[77],"sequences.":[78,138],"Moreover,":[79],"these":[80,116],"models":[81],"require":[82],"high":[83],"computational":[84,111],"cost":[85],"transformers,":[87],"due":[88],"to":[89,98,128],"quadratic":[91],"memory":[92,104,132,152],"time":[94],"complexity":[95],"with":[96,154,160],"respect":[97],"sequence":[99],"length.":[100],"This":[101],"bottlenecks":[105],"slow":[107],"training":[108,147],"especially":[109],"resource-constrained":[112],"environments.":[113],"To":[114],"address":[115],"challenges,":[117],"we":[118],"propose":[119],"FATH":[121],"model":[122,144],"which":[123],"employs":[124],"Flash":[125],"Attention":[126],"mechanism":[127],"reduce":[129],"high-bandwidth":[131],"usage":[133,153],"over":[134],"higher-order":[135],"Experimental":[139],"show":[141],"that":[142],"our":[143],"improves":[145],"speed":[148],"reduces":[150],"better":[155],"recommendation":[156],"performance":[157],"comparison":[159],"state-of":[162],"art":[164],"baselines.":[165]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-22T08:00:12.763002","created_date":"2025-10-10T00:00:00"}
