{"id":"https://openalex.org/W4281782777","doi":"https://doi.org/10.1145/3477495.3531811","title":"Understanding Long Programming Languages with Structure-Aware Sparse Attention","display_name":"Understanding Long Programming Languages with Structure-Aware Sparse Attention","publication_year":2022,"publication_date":"2022-07-06","ids":{"openalex":"https://openalex.org/W4281782777","doi":"https://doi.org/10.1145/3477495.3531811"},"language":"en","primary_location":{"id":"doi:10.1145/3477495.3531811","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3477495.3531811","pdf_url":null,"source":{"id":"https://openalex.org/S4363608773","display_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100442032","display_name":"Tingting Liu","orcid":"https://orcid.org/0000-0002-8533-6202"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Tingting Liu","raw_affiliation_strings":["East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100373451","display_name":"Chengyu Wang","orcid":"https://orcid.org/0000-0003-1010-9678"},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengyu Wang","raw_affiliation_strings":["Alibaba Group, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Hangzhou, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114734448","display_name":"Cen Chen","orcid":"https://orcid.org/0000-0003-0325-1705"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cen Chen","raw_affiliation_strings":["East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075501144","display_name":"Ming Gao","orcid":"https://orcid.org/0000-0003-3397-5659"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ming Gao","raw_affiliation_strings":["East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101511862","display_name":"Aoying Zhou","orcid":"https://orcid.org/0000-0002-4665-7302"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Aoying Zhou","raw_affiliation_strings":["East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100442032"],"corresponding_institution_ids":["https://openalex.org/I66867065"],"apc_list":null,"apc_paid":null,"fwci":0.5821,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.65806265,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"2093","last_page":"2098"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10260","display_name":"Software Engineering Research","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9898999929428101,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8555161356925964},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.560854971408844},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.46475544571876526},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4485156834125519},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.44682565331459045},{"id":"https://openalex.org/keywords/abstract-syntax-tree","display_name":"Abstract syntax tree","score":0.43481960892677307},{"id":"https://openalex.org/keywords/computational-complexity-theory","display_name":"Computational complexity theory","score":0.42615553736686707},{"id":"https://openalex.org/keywords/tree-structure","display_name":"Tree structure","score":0.4136987328529358},{"id":"https://openalex.org/keywords/syntax","display_name":"Syntax","score":0.35399919748306274},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.34620967507362366},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.29637277126312256},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2611253261566162}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8555161356925964},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.560854971408844},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.46475544571876526},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4485156834125519},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.44682565331459045},{"id":"https://openalex.org/C58646249","wikidata":"https://www.wikidata.org/wiki/Q127380","display_name":"Abstract syntax tree","level":3,"score":0.43481960892677307},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.42615553736686707},{"id":"https://openalex.org/C163797641","wikidata":"https://www.wikidata.org/wiki/Q2067937","display_name":"Tree structure","level":3,"score":0.4136987328529358},{"id":"https://openalex.org/C60048249","wikidata":"https://www.wikidata.org/wiki/Q37437","display_name":"Syntax","level":2,"score":0.35399919748306274},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.34620967507362366},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.29637277126312256},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2611253261566162},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3477495.3531811","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3477495.3531811","pdf_url":null,"source":{"id":"https://openalex.org/S4363608773","display_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4264741699","display_name":null,"funder_award_id":"U1911203, 61877018","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2516621648","https://openalex.org/W2955426500","https://openalex.org/W2962739339","https://openalex.org/W2964110616","https://openalex.org/W2970120757","https://openalex.org/W3167354871","https://openalex.org/W3170092793","https://openalex.org/W3177492177","https://openalex.org/W3198685994","https://openalex.org/W3213368993","https://openalex.org/W4235670907","https://openalex.org/W4239249613","https://openalex.org/W4301168982"],"related_works":["https://openalex.org/W2077104824","https://openalex.org/W2536864162","https://openalex.org/W2390421503","https://openalex.org/W2364428493","https://openalex.org/W4400066978","https://openalex.org/W44541701","https://openalex.org/W2387926336","https://openalex.org/W2385522099","https://openalex.org/W2354135050","https://openalex.org/W2773378563"],"abstract_inverted_index":{"Programming-based":[0],"Pre-trained":[1],"Language":[2],"Models":[3],"(PPLMs)":[4],"such":[5,50],"as":[6,51],"CodeBERT":[7],"have":[8],"achieved":[9],"great":[10],"success":[11],"in":[12,25,44,66,92],"many":[13],"downstream":[14],"code-related":[15],"tasks.":[16,88],"Since":[17],"the":[18,26,31,37,79,109,123,127,130,138,161],"memory":[19],"and":[20,81,98],"computational":[21,120],"complexity":[22,80],"of":[23,129],"self-attention":[24],"Transformer":[27],"grow":[28],"quadratically":[29],"with":[30,117],"sequence":[32,140],"length,":[33],"PPLMs":[34],"typically":[35],"limit":[36],"code":[38,52,86,124,131,139],"length":[39],"to":[40,137],"512.":[41],"However,":[42],"codes":[43],"real-world":[45],"applications":[46],"are":[47,94],"generally":[48],"long,":[49],"searches,":[53],"which":[54,77,133],"cannot":[55],"be":[56,115],"processed":[57],"efficiently":[58],"by":[59],"existing":[60],"PPLMs.":[61],"To":[62],"solve":[63],"this":[64,67],"problem,":[65],"paper,":[68],"we":[69,142],"present":[70],"SASA,":[71],"a":[72,118,135],"Structure-Aware":[73],"Sparse":[74],"Attention":[75],"mechanism,":[76],"reduces":[78],"improves":[82],"performance":[83,159],"for":[84],"long":[85],"understanding":[87],"The":[89],"key":[90],"components":[91],"SASA":[93,156],"top-k":[95,106],"sparse":[96,107],"attention":[97,112],"Abstract":[99],"Syntax":[100],"Tree":[101],"(AST)-based":[102],"structure-aware":[103],"attention.":[104,148],"With":[105],"attention,":[108],"most":[110],"crucial":[111],"relation":[113],"can":[114],"obtained":[116],"lower":[119],"cost.":[121],"As":[122],"structure":[125],"represents":[126],"logic":[128],"statements,":[132],"is":[134],"complement":[136],"characteristics,":[141],"further":[143],"introduce":[144],"AST":[145],"structures":[146],"into":[147],"Extensive":[149],"experiments":[150],"on":[151],"CodeXGLUE":[152],"tasks":[153],"show":[154],"that":[155],"achieves":[157],"better":[158],"than":[160],"competing":[162],"baselines.":[163]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
