{"id":"https://openalex.org/W2075537166","doi":"https://doi.org/10.1145/1964218.1964221","title":"Performance analysis of the OP2 framework on many-core architectures","display_name":"Performance analysis of the OP2 framework on many-core architectures","publication_year":2011,"publication_date":"2011-03-29","ids":{"openalex":"https://openalex.org/W2075537166","doi":"https://doi.org/10.1145/1964218.1964221","mag":"2075537166"},"language":"en","primary_location":{"id":"doi:10.1145/1964218.1964221","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1964218.1964221","pdf_url":null,"source":{"id":"https://openalex.org/S4210187660","display_name":"ACM SIGMETRICS Performance Evaluation Review","issn_l":"0163-5999","issn":["0163-5999","1557-9484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGMETRICS Performance Evaluation Review","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5056186758","display_name":"Michael B. Giles","orcid":"https://orcid.org/0000-0002-5445-3721"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"M. B. Giles","raw_affiliation_strings":["University of Oxford"],"affiliations":[{"raw_affiliation_string":"University of Oxford","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070789282","display_name":"Gihan R. Mudalige","orcid":"https://orcid.org/0000-0002-1398-5174"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"G. R. Mudalige","raw_affiliation_strings":["University of Oxford"],"affiliations":[{"raw_affiliation_string":"University of Oxford","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037791710","display_name":"Z. Sharif","orcid":null},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Z. Sharif","raw_affiliation_strings":["Imperial College London","Imperial College London,#TAB#"],"affiliations":[{"raw_affiliation_string":"Imperial College London","institution_ids":["https://openalex.org/I47508984"]},{"raw_affiliation_string":"Imperial College London,#TAB#","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083653923","display_name":"Graham Markall","orcid":"https://orcid.org/0009-0003-9005-1716"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"G. Markall","raw_affiliation_strings":["Imperial College London","Imperial College London,#TAB#"],"affiliations":[{"raw_affiliation_string":"Imperial College London","institution_ids":["https://openalex.org/I47508984"]},{"raw_affiliation_string":"Imperial College London,#TAB#","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000319133","display_name":"Paul H. J. Kelly","orcid":"https://orcid.org/0000-0001-5905-1804"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"P. H.J. Kelly","raw_affiliation_strings":["Imperial College London","Imperial College London,#TAB#"],"affiliations":[{"raw_affiliation_string":"Imperial College London","institution_ids":["https://openalex.org/I47508984"]},{"raw_affiliation_string":"Imperial College London,#TAB#","institution_ids":["https://openalex.org/I47508984"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5056186758"],"corresponding_institution_ids":["https://openalex.org/I40120149"],"apc_list":null,"apc_paid":null,"fwci":4.8787,"has_fulltext":false,"cited_by_count":43,"citation_normalized_percentile":{"value":0.95580924,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"38","issue":"4","first_page":"9","last_page":"15"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10715","display_name":"Distributed and Parallel Computing Systems","score":0.9912999868392944,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/x86","display_name":"x86","score":0.8388602137565613},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8254350423812866},{"id":"https://openalex.org/keywords/xeon","display_name":"Xeon","score":0.824845016002655},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7244281768798828},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.6990347504615784},{"id":"https://openalex.org/keywords/many-core","display_name":"Many core","score":0.5685166120529175},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.5564513802528381},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.5271536707878113},{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.466942697763443},{"id":"https://openalex.org/keywords/partition","display_name":"Partition (number theory)","score":0.4631367027759552},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.44313958287239075},{"id":"https://openalex.org/keywords/xeon-phi","display_name":"Xeon Phi","score":0.44044458866119385},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.24678978323936462},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.1751765012741089},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.15323060750961304}],"concepts":[{"id":"https://openalex.org/C170723468","wikidata":"https://www.wikidata.org/wiki/Q182933","display_name":"x86","level":3,"score":0.8388602137565613},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8254350423812866},{"id":"https://openalex.org/C145108525","wikidata":"https://www.wikidata.org/wiki/Q656154","display_name":"Xeon","level":2,"score":0.824845016002655},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7244281768798828},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.6990347504615784},{"id":"https://openalex.org/C3020431745","wikidata":"https://www.wikidata.org/wiki/Q25325220","display_name":"Many core","level":2,"score":0.5685166120529175},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.5564513802528381},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.5271536707878113},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.466942697763443},{"id":"https://openalex.org/C42812","wikidata":"https://www.wikidata.org/wiki/Q1082910","display_name":"Partition (number theory)","level":2,"score":0.4631367027759552},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.44313958287239075},{"id":"https://openalex.org/C96972482","wikidata":"https://www.wikidata.org/wiki/Q1049168","display_name":"Xeon Phi","level":2,"score":0.44044458866119385},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.24678978323936462},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.1751765012741089},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.15323060750961304},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1964218.1964221","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1964218.1964221","pdf_url":null,"source":{"id":"https://openalex.org/S4210187660","display_name":"ACM SIGMETRICS Performance Evaluation Review","issn_l":"0163-5999","issn":["0163-5999","1557-9484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGMETRICS Performance Evaluation Review","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.714.1505","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.714.1505","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.doc.ic.ac.uk/%7Egrm08/PMBS2010.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.5600000023841858,"display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G2249403966","display_name":null,"funder_award_id":"EP/I00677X/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G4452853771","display_name":null,"funder_award_id":"EP/G00210X/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G7583076630","display_name":null,"funder_award_id":"EP/I006079/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320309480","display_name":"Nvidia","ror":"https://ror.org/03jdj4y14"},{"id":"https://openalex.org/F4320320283","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10"},{"id":"https://openalex.org/F4320321979","display_name":"University of Surrey","ror":"https://ror.org/00ks66431"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":13,"referenced_works":["https://openalex.org/W1484160293","https://openalex.org/W1507090345","https://openalex.org/W1555233232","https://openalex.org/W1991106844","https://openalex.org/W2028262862","https://openalex.org/W2047287711","https://openalex.org/W2065080695","https://openalex.org/W2085123413","https://openalex.org/W2118055195","https://openalex.org/W2133755209","https://openalex.org/W2154968583","https://openalex.org/W2158640099","https://openalex.org/W4213211643"],"related_works":["https://openalex.org/W2740999212","https://openalex.org/W2188971969","https://openalex.org/W1994052277","https://openalex.org/W2769399951","https://openalex.org/W2024554511","https://openalex.org/W2588843388","https://openalex.org/W3042238487","https://openalex.org/W2885985254","https://openalex.org/W2599563411","https://openalex.org/W1964236241"],"abstract_inverted_index":{"We":[0],"present":[1],"a":[2,59,68],"performance":[3,45,54,104,148],"analysis":[4,100],"and":[5,43,87,91,111,140,149],"benchmarking":[6],"study":[7],"of":[8,21,33,70,108,126,135],"the":[9,19,30,34,48,75,84,102,106,117,133,137,143,146],"OP2":[10,26,66],"\"active\"":[11],"library,":[12],"which":[13],"provides":[14],"an":[15,120],"abstraction":[16],"framework":[17],"for":[18,58,116,153],"solution":[20,118],"parallel":[22,38,114],"unstructured":[23,61,123],"mesh":[24,62,124],"applications.":[25],"aims":[27],"to":[28,50],"decouple":[29],"scientific":[31],"specification":[32],"application":[35,63],"from":[36,79,94],"its":[37],"implementation,":[39],"achieving":[40],"code":[41],"longevity":[42],"near-optimal":[44],"through":[46],"re-targeting":[47],"back-end":[49],"different":[51],"hardware.":[52],"Runtime":[53],"results":[55],"are":[56],"presented":[57],"representative":[60],"written":[64],"using":[65],"on":[67,83,119],"variety":[69],"many-core":[71],"processor":[72],"systems,":[73],"including":[74],"traditional":[76],"X86":[77],"architectures":[78],"Intel":[80],"(Xeon":[81],"based":[82],"older":[85],"Penryn":[86],"current":[88],"Nehalem":[89],"micro-architectures)":[90],"GPU":[92,112,147],"offerings":[93],"NVIDIA":[95],"(GTX260,":[96],"Tesla":[97],"C2050).":[98],"Our":[99],"demonstrates":[101],"contrasting":[103],"between":[105],"use":[107],"CPU":[109],"(OpenMP)":[110],"(CUDA)":[113],"implementations":[115],"industrial":[121],"sized":[122],"consisting":[125],"about":[127],"1.5":[128],"million":[129],"edges.":[130],"Results":[131],"show":[132],"significance":[134],"choosing":[136],"correct":[138],"partition":[139],"thread-block":[141],"configuration,":[142],"factors":[144],"limiting":[145],"insights":[150],"into":[151],"optimizations":[152],"improved":[154],"performance.":[155]},"counts_by_year":[{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":8},{"year":2016,"cited_by_count":4},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":10}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
