{"id":"https://openalex.org/W4409131810","doi":"https://doi.org/10.1109/hpec62836.2024.10938451","title":"Comparative Analysis of GCC and LLVM for Performance Optimization on Aarch64","display_name":"Comparative Analysis of GCC and LLVM for Performance Optimization on Aarch64","publication_year":2024,"publication_date":"2024-09-23","ids":{"openalex":"https://openalex.org/W4409131810","doi":"https://doi.org/10.1109/hpec62836.2024.10938451"},"language":"en","primary_location":{"id":"doi:10.1109/hpec62836.2024.10938451","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpec62836.2024.10938451","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE High Performance Extreme Computing Conference (HPEC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5116901167","display_name":"Mriganka Bezbaruah","orcid":null},"institutions":[{"id":"https://openalex.org/I1331500379","display_name":"Centre for Development of Advanced Computing","ror":"https://ror.org/022abst40","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1331500379","https://openalex.org/I4210121746"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Mriganka Bezbaruah","raw_affiliation_strings":["Centre for Development of Advanced Computing,Bengaluru,India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre for Development of Advanced Computing,Bengaluru,India","institution_ids":["https://openalex.org/I1331500379"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116901168","display_name":"Samruddhi Dhakulkar","orcid":null},"institutions":[{"id":"https://openalex.org/I1331500379","display_name":"Centre for Development of Advanced Computing","ror":"https://ror.org/022abst40","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1331500379","https://openalex.org/I4210121746"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Samruddhi Dhakulkar","raw_affiliation_strings":["Centre for Development of Advanced Computing,Bengaluru,India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre for Development of Advanced Computing,Bengaluru,India","institution_ids":["https://openalex.org/I1331500379"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101765211","display_name":"Prachi Pandey","orcid":"https://orcid.org/0000-0002-1826-9601"},"institutions":[{"id":"https://openalex.org/I1331500379","display_name":"Centre for Development of Advanced Computing","ror":"https://ror.org/022abst40","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1331500379","https://openalex.org/I4210121746"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Prachi Pandey","raw_affiliation_strings":["Centre for Development of Advanced Computing,Bengaluru,India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre for Development of Advanced Computing,Bengaluru,India","institution_ids":["https://openalex.org/I1331500379"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038622495","display_name":"P Haribabu","orcid":null},"institutions":[{"id":"https://openalex.org/I1331500379","display_name":"Centre for Development of Advanced Computing","ror":"https://ror.org/022abst40","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1331500379","https://openalex.org/I4210121746"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Haribabu P","raw_affiliation_strings":["Centre for Development of Advanced Computing,Bengaluru,India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre for Development of Advanced Computing,Bengaluru,India","institution_ids":["https://openalex.org/I1331500379"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101957775","display_name":"Sathish Kumar","orcid":"https://orcid.org/0000-0002-3162-2211"},"institutions":[{"id":"https://openalex.org/I1331500379","display_name":"Centre for Development of Advanced Computing","ror":"https://ror.org/022abst40","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1331500379","https://openalex.org/I4210121746"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"S A Kumar","raw_affiliation_strings":["Centre for Development of Advanced Computing,Bengaluru,India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre for Development of Advanced Computing,Bengaluru,India","institution_ids":["https://openalex.org/I1331500379"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102868385","display_name":"S D Sudarsan","orcid":"https://orcid.org/0000-0002-7990-6686"},"institutions":[{"id":"https://openalex.org/I1331500379","display_name":"Centre for Development of Advanced Computing","ror":"https://ror.org/022abst40","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1331500379","https://openalex.org/I4210121746"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"S D Sudarsan","raw_affiliation_strings":["Centre for Development of Advanced Computing,Bengaluru,India"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Centre for Development of Advanced Computing,Bengaluru,India","institution_ids":["https://openalex.org/I1331500379"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I1331500379"],"apc_list":null,"apc_paid":null,"fwci":0.4312,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.66683217,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.5539000034332275,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.5539000034332275,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13717","display_name":"Advanced Algorithms and Applications","score":0.5151000022888184,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12941","display_name":"Embedded Systems and FPGA Design","score":0.4925000071525574,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6222051382064819}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6222051382064819}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpec62836.2024.10938451","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpec62836.2024.10938451","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE High Performance Extreme Computing Conference (HPEC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320312726","display_name":"University of Oregon","ror":"https://ror.org/0293rh119"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W2013156670","https://openalex.org/W2028843179","https://openalex.org/W2060422862","https://openalex.org/W2183278975","https://openalex.org/W2613264175","https://openalex.org/W2623993198","https://openalex.org/W2979513934","https://openalex.org/W3097636320","https://openalex.org/W3167137103","https://openalex.org/W3206873289","https://openalex.org/W3216357191","https://openalex.org/W4319067047","https://openalex.org/W6802181365"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"The":[0],"emergence":[1],"of":[2,14,27,57,88,107,127,156,164],"ARM-based":[3,41],"architectures":[4],"in":[5,45],"high-performance":[6],"computing":[7],"(HPC)":[8],"has":[9],"necessitated":[10],"a":[11],"closer":[12],"examination":[13],"compiler":[15,145],"behaviors":[16],"and":[17,24,29,50,63,97,110,121,136],"optimizations.":[18],"This":[19,147],"paper":[20],"investigates":[21],"the":[22,58,77,86,89,154,162],"performance":[23,87,119,163],"optimization":[25,123],"capabilities":[26],"GCC":[28,108],"LLVM":[30,111],"compilers":[31,90],"for":[32,80,143,153],"Aarch64":[33],"processors":[34,43],"on":[35,40,54,92],"HPC":[36,42,166],"workloads.":[37],"We":[38],"focus":[39],"used":[44],"systems":[46],"like":[47],"Grace":[48],"Hopper":[49],"Fujitsu":[51],"A64FX,":[52],"emphasizing":[53],"their":[55,114],"implementations":[56],"Scalable":[59],"Vector":[60],"Extension":[61],"(SVE)":[62],"other":[64],"architectural":[65],"features":[66],"that":[67],"enhance":[68],"performance.":[69],"Through":[70],"comprehensive":[71],"benchmarking,":[72],"including":[73],"vectorization":[74],"analysis":[75,126],"with":[76,113],"Test":[78],"Suite":[79],"Vectorizing":[81],"Compilers":[82],"(TSVC),":[83],"we":[84,117],"evaluate":[85],"based":[91],"execution":[93],"times,":[94],"applied":[95],"optimizations,":[96],"code":[98,129],"portability":[99],"across":[100],"these":[101],"systems.":[102,167],"By":[103],"comparing":[104],"recent":[105],"versions":[106],"(v14)":[109],"(v18)":[112],"previous":[115],"versions,":[116],"highlight":[118],"improvements":[120],"identify":[122],"gaps.":[124],"Our":[125],"assembly":[128],"offers":[130],"insights":[131,152],"into":[132],"vectorization,":[133],"register":[134],"allocation,":[135],"SIMD":[137],"instruction":[138],"generation,":[139],"providing":[140],"valuable":[141],"recommendations":[142],"future":[144],"enhancements.":[146],"study":[148],"aims":[149],"to":[150],"give":[151],"development":[155],"more":[157],"efficient":[158],"compilers,":[159],"ultimately":[160],"advancing":[161],"Aarch64-based":[165]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
