{"id":"https://openalex.org/W2114297064","doi":"https://doi.org/10.1137/130943595","title":"Dynamic Autotuning of Adaptive Fast Multipole Methods on Hybrid Multicore CPU and GPU Systems","display_name":"Dynamic Autotuning of Adaptive Fast Multipole Methods on Hybrid Multicore CPU and GPU Systems","publication_year":2014,"publication_date":"2014-01-01","ids":{"openalex":"https://openalex.org/W2114297064","doi":"https://doi.org/10.1137/130943595","mag":"2114297064"},"language":"en","primary_location":{"id":"doi:10.1137/130943595","is_oa":false,"landing_page_url":"https://doi.org/10.1137/130943595","pdf_url":null,"source":{"id":"https://openalex.org/S165512578","display_name":"SIAM Journal on Scientific Computing","issn_l":"1064-8275","issn":["1064-8275","1095-7197"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320508","host_organization_name":"Society for Industrial and Applied Mathematics","host_organization_lineage":["https://openalex.org/P4310320508"],"host_organization_lineage_names":["Society for Industrial and Applied Mathematics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SIAM Journal on Scientific Computing","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/1311.1006","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Marcus Holm","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Marcus Holm","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Stefan Engblom","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stefan Engblom","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Anders Goude","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Anders Goude","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Sverker Holmgren","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sverker Holmgren","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4393,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.67173025,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"36","issue":"4","first_page":"C376","last_page":"C399"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10739","display_name":"Electromagnetic Scattering and Analysis","score":0.9275000095367432,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10739","display_name":"Electromagnetic Scattering and Analysis","score":0.9275000095367432,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11263","display_name":"Electromagnetic Simulation and Numerical Methods","score":0.022199999541044235,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11946","display_name":"Antenna Design and Optimization","score":0.005400000140070915,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/fast-multipole-method","display_name":"Fast multipole method","score":0.8267999887466431},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.7294999957084656},{"id":"https://openalex.org/keywords/multipole-expansion","display_name":"Multipole expansion","score":0.7152000069618225},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.7060999870300293},{"id":"https://openalex.org/keywords/central-processing-unit","display_name":"Central processing unit","score":0.4837999939918518},{"id":"https://openalex.org/keywords/execution-time","display_name":"Execution time","score":0.3547999858856201},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.33889999985694885}],"concepts":[{"id":"https://openalex.org/C135115559","wikidata":"https://www.wikidata.org/wiki/Q5437040","display_name":"Fast multipole method","level":3,"score":0.8267999887466431},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.7294999957084656},{"id":"https://openalex.org/C52765159","wikidata":"https://www.wikidata.org/wiki/Q1027847","display_name":"Multipole expansion","level":2,"score":0.7152000069618225},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.7060999870300293},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6345999836921692},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.548799991607666},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.5350000262260437},{"id":"https://openalex.org/C49154492","wikidata":"https://www.wikidata.org/wiki/Q5300","display_name":"Central processing unit","level":2,"score":0.4837999939918518},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.46309998631477356},{"id":"https://openalex.org/C2989134064","wikidata":"https://www.wikidata.org/wiki/Q288510","display_name":"Execution time","level":2,"score":0.3547999858856201},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.33889999985694885},{"id":"https://openalex.org/C2776003309","wikidata":"https://www.wikidata.org/wiki/Q1988072","display_name":"Adaptive algorithm","level":2,"score":0.3199000060558319},{"id":"https://openalex.org/C48753275","wikidata":"https://www.wikidata.org/wiki/Q11216","display_name":"Numerical analysis","level":2,"score":0.30250000953674316},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.30230000615119934},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.2874999940395355},{"id":"https://openalex.org/C2780033567","wikidata":"https://www.wikidata.org/wiki/Q6823720","display_name":"Method of moments (probability theory)","level":3,"score":0.2770000100135803},{"id":"https://openalex.org/C2780365336","wikidata":"https://www.wikidata.org/wiki/Q25047934","display_name":"Single-core","level":2,"score":0.26759999990463257},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.2605000138282776},{"id":"https://openalex.org/C106515295","wikidata":"https://www.wikidata.org/wiki/Q26806595","display_name":"Parallel processing","level":2,"score":0.257999986410141},{"id":"https://openalex.org/C50897621","wikidata":"https://www.wikidata.org/wiki/Q2665508","display_name":"Hybrid system","level":2,"score":0.2578999996185303}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1137/130943595","is_oa":false,"landing_page_url":"https://doi.org/10.1137/130943595","pdf_url":null,"source":{"id":"https://openalex.org/S165512578","display_name":"SIAM Journal on Scientific Computing","issn_l":"1064-8275","issn":["1064-8275","1095-7197"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320508","host_organization_name":"Society for Industrial and Applied Mathematics","host_organization_lineage":["https://openalex.org/P4310320508"],"host_organization_lineage_names":["Society for Industrial and Applied Mathematics"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"SIAM Journal on Scientific Computing","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:1311.1006","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1311.1006","pdf_url":"https://arxiv.org/pdf/1311.1006","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:1311.1006","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1311.1006","pdf_url":"https://arxiv.org/pdf/1311.1006","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W1988144251","https://openalex.org/W1992906507","https://openalex.org/W1993688432","https://openalex.org/W2017654099","https://openalex.org/W2029446187","https://openalex.org/W2035799855","https://openalex.org/W2050013934","https://openalex.org/W2054523422","https://openalex.org/W2068306188","https://openalex.org/W2069883496","https://openalex.org/W2077852080","https://openalex.org/W2080457038","https://openalex.org/W2083206954","https://openalex.org/W2168963553"],"related_works":[],"abstract_inverted_index":{"We":[0],"discuss":[1],"an":[2],"implementation":[3],"of":[4,22,25,79,85],"adaptive":[5],"fast":[6,27],"multipole":[7,28],"methods":[8],"targeting":[9],"hybrid":[10],"multicore":[11],"CPU-":[12],"and":[13,43,57,82],"GPU-systems.":[14],"From":[15],"previous":[16],"experiences":[17],"with":[18],"the":[19,26,35,38,47,52,55,68,76,80],"computational":[20],"profile":[21],"our":[23],"version":[24],"algorithm,":[29],"suitable":[30],"parts":[31,40],"are":[32,41,63],"off-loaded":[33],"to":[34,65],"GPU,":[36],"while":[37],"remaining":[39],"threaded":[42],"executed":[44],"concurrently":[45],"by":[46,58],"CPU.":[48],"The":[49],"parameters":[50],"defining":[51],"algorithm":[53,69],"affect":[54],"performance":[56],"measuring":[59],"this":[60],"effect":[61],"we":[62],"able":[64],"dynamically":[66],"balance":[67],"towards":[70],"optimal":[71],"performance.":[72],"Our":[73],"setup":[74],"uses":[75],"dynamic":[77],"nature":[78],"computations":[81],"is":[83],"therefore":[84],"general":[86],"character.":[87]},"counts_by_year":[{"year":2019,"cited_by_count":3},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1}],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2016-06-24T00:00:00"}
