{"id":"https://openalex.org/W2794543518","doi":"https://doi.org/10.3233/978-1-61499-843-3-339","title":"A Fast Implementation of a Spectral Finite Elements Method on CPU and GPU Applied to Ultrasound Propagation","display_name":"A Fast Implementation of a Spectral Finite Elements Method on CPU and GPU Applied to Ultrasound Propagation","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2794543518","doi":"https://doi.org/10.3233/978-1-61499-843-3-339","mag":"2794543518"},"language":"en","primary_location":{"id":"doi:10.3233/978-1-61499-843-3-339","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-61499-843-3-339","pdf_url":null,"source":{"id":"https://openalex.org/S4210175178","display_name":"Advances in parallel computing","issn_l":"0927-5452","issn":["0927-5452","1879-808X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advances in Parallel Computing","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hal.science/hal-01761605","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060096770","display_name":"Carlos Carrascal-Manzanares","orcid":null},"institutions":[{"id":"https://openalex.org/I2738703131","display_name":"Commissariat \u00e0 l'\u00c9nergie Atomique et aux \u00c9nergies Alternatives","ror":"https://ror.org/00jjx8s55","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131"]},{"id":"https://openalex.org/I4210085861","display_name":"Laboratoire d'Int\u00e9gration des Syst\u00e8mes et des Technologies","ror":"https://ror.org/000dbcc61","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131","https://openalex.org/I2738703131","https://openalex.org/I277688954","https://openalex.org/I4210085861","https://openalex.org/I4210117989"]},{"id":"https://openalex.org/I4210125654","display_name":"Maison de la Simulation","ror":"https://ror.org/03jv6w209","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I195731000","https://openalex.org/I2738703131","https://openalex.org/I2738703131","https://openalex.org/I277688954","https://openalex.org/I277688954","https://openalex.org/I4210113668","https://openalex.org/I4210125654","https://openalex.org/I4210159245"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Carrascal-Manzanares Carlos","raw_affiliation_strings":["ALSOC - Architecture et Logiciels pour Syst\u00e8mes Embarqu\u00e9s sur Puce (France)","DISC (CEA, LIST) - D\u00e9partement Imagerie et Simulation pour le Contr\u00f4le (CEA, LIST) (CEA SACLAY DIGITEO LABS B\u00e2t. 565 91191 GIF-SUR-YVETTE CEDEX - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"ALSOC - Architecture et Logiciels pour Syst\u00e8mes Embarqu\u00e9s sur Puce (France)","institution_ids":[]},{"raw_affiliation_string":"DISC (CEA, LIST) - D\u00e9partement Imagerie et Simulation pour le Contr\u00f4le (CEA, LIST) (CEA SACLAY DIGITEO LABS B\u00e2t. 565 91191 GIF-SUR-YVETTE CEDEX - France)","institution_ids":["https://openalex.org/I2738703131","https://openalex.org/I4210085861","https://openalex.org/I4210125654"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001170644","display_name":"Alexandre Imp\u00e9riale","orcid":"https://orcid.org/0000-0002-0561-0081"},"institutions":[{"id":"https://openalex.org/I2738703131","display_name":"Commissariat \u00e0 l'\u00c9nergie Atomique et aux \u00c9nergies Alternatives","ror":"https://ror.org/00jjx8s55","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131"]},{"id":"https://openalex.org/I4210085861","display_name":"Laboratoire d'Int\u00e9gration des Syst\u00e8mes et des Technologies","ror":"https://ror.org/000dbcc61","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131","https://openalex.org/I2738703131","https://openalex.org/I277688954","https://openalex.org/I4210085861","https://openalex.org/I4210117989"]},{"id":"https://openalex.org/I4210125654","display_name":"Maison de la Simulation","ror":"https://ror.org/03jv6w209","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I195731000","https://openalex.org/I2738703131","https://openalex.org/I2738703131","https://openalex.org/I277688954","https://openalex.org/I277688954","https://openalex.org/I4210113668","https://openalex.org/I4210125654","https://openalex.org/I4210159245"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Imperiale Alexandre","raw_affiliation_strings":["DISC (CEA, LIST) - D\u00e9partement Imagerie et Simulation pour le Contr\u00f4le (CEA, LIST) (CEA SACLAY DIGITEO LABS B\u00e2t. 565 91191 GIF-SUR-YVETTE CEDEX - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DISC (CEA, LIST) - D\u00e9partement Imagerie et Simulation pour le Contr\u00f4le (CEA, LIST) (CEA SACLAY DIGITEO LABS B\u00e2t. 565 91191 GIF-SUR-YVETTE CEDEX - France)","institution_ids":["https://openalex.org/I2738703131","https://openalex.org/I4210085861","https://openalex.org/I4210125654"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106082566","display_name":"Gilles Rougeron","orcid":null},"institutions":[{"id":"https://openalex.org/I2738703131","display_name":"Commissariat \u00e0 l'\u00c9nergie Atomique et aux \u00c9nergies Alternatives","ror":"https://ror.org/00jjx8s55","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131"]},{"id":"https://openalex.org/I4210085861","display_name":"Laboratoire d'Int\u00e9gration des Syst\u00e8mes et des Technologies","ror":"https://ror.org/000dbcc61","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131","https://openalex.org/I2738703131","https://openalex.org/I277688954","https://openalex.org/I4210085861","https://openalex.org/I4210117989"]},{"id":"https://openalex.org/I4210125654","display_name":"Maison de la Simulation","ror":"https://ror.org/03jv6w209","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I195731000","https://openalex.org/I2738703131","https://openalex.org/I2738703131","https://openalex.org/I277688954","https://openalex.org/I277688954","https://openalex.org/I4210113668","https://openalex.org/I4210125654","https://openalex.org/I4210159245"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Rougeron Gilles","raw_affiliation_strings":["DISC (CEA, LIST) - D\u00e9partement Imagerie et Simulation pour le Contr\u00f4le (CEA, LIST) (CEA SACLAY DIGITEO LABS B\u00e2t. 565 91191 GIF-SUR-YVETTE CEDEX - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DISC (CEA, LIST) - D\u00e9partement Imagerie et Simulation pour le Contr\u00f4le (CEA, LIST) (CEA SACLAY DIGITEO LABS B\u00e2t. 565 91191 GIF-SUR-YVETTE CEDEX - France)","institution_ids":["https://openalex.org/I2738703131","https://openalex.org/I4210085861","https://openalex.org/I4210125654"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083041090","display_name":"Vincent Bergeaud","orcid":null},"institutions":[{"id":"https://openalex.org/I2738703131","display_name":"Commissariat \u00e0 l'\u00c9nergie Atomique et aux \u00c9nergies Alternatives","ror":"https://ror.org/00jjx8s55","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131"]},{"id":"https://openalex.org/I4210085861","display_name":"Laboratoire d'Int\u00e9gration des Syst\u00e8mes et des Technologies","ror":"https://ror.org/000dbcc61","country_code":"FR","type":"government","lineage":["https://openalex.org/I2738703131","https://openalex.org/I2738703131","https://openalex.org/I277688954","https://openalex.org/I4210085861","https://openalex.org/I4210117989"]},{"id":"https://openalex.org/I4210125654","display_name":"Maison de la Simulation","ror":"https://ror.org/03jv6w209","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I195731000","https://openalex.org/I2738703131","https://openalex.org/I2738703131","https://openalex.org/I277688954","https://openalex.org/I277688954","https://openalex.org/I4210113668","https://openalex.org/I4210125654","https://openalex.org/I4210159245"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Bergeaud Vincent","raw_affiliation_strings":["DISC (CEA, LIST) - D\u00e9partement Imagerie et Simulation pour le Contr\u00f4le (CEA, LIST) (CEA SACLAY DIGITEO LABS B\u00e2t. 565 91191 GIF-SUR-YVETTE CEDEX - France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"DISC (CEA, LIST) - D\u00e9partement Imagerie et Simulation pour le Contr\u00f4le (CEA, LIST) (CEA SACLAY DIGITEO LABS B\u00e2t. 565 91191 GIF-SUR-YVETTE CEDEX - France)","institution_ids":["https://openalex.org/I2738703131","https://openalex.org/I4210085861","https://openalex.org/I4210125654"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086965094","display_name":"Lionel Lacassagne","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lacassagne Lionel","raw_affiliation_strings":["ALSOC - Architecture et Logiciels pour Syst\u00e8mes Embarqu\u00e9s sur Puce (France)"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"ALSOC - Architecture et Logiciels pour Syst\u00e8mes Embarqu\u00e9s sur Puce (France)","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.3679,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.86747871,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11263","display_name":"Electromagnetic Simulation and Numerical Methods","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11263","display_name":"Electromagnetic Simulation and Numerical Methods","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10271","display_name":"Seismic Imaging and Inversion Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1908","display_name":"Geophysics"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10739","display_name":"Electromagnetic Scattering and Analysis","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/simd","display_name":"SIMD","score":0.7890185117721558},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7452772855758667},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.7167807817459106},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5949735045433044},{"id":"https://openalex.org/keywords/scalar","display_name":"Scalar (mathematics)","score":0.5646039843559265},{"id":"https://openalex.org/keywords/central-processing-unit","display_name":"Central processing unit","score":0.5133787393569946},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.4688231647014618},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.415549099445343},{"id":"https://openalex.org/keywords/floating-point","display_name":"Floating point","score":0.4110748767852783},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2602616548538208},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.22882071137428284},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11456769704818726},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.07725951075553894}],"concepts":[{"id":"https://openalex.org/C150552126","wikidata":"https://www.wikidata.org/wiki/Q339387","display_name":"SIMD","level":2,"score":0.7890185117721558},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7452772855758667},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.7167807817459106},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5949735045433044},{"id":"https://openalex.org/C57691317","wikidata":"https://www.wikidata.org/wiki/Q1289248","display_name":"Scalar (mathematics)","level":2,"score":0.5646039843559265},{"id":"https://openalex.org/C49154492","wikidata":"https://www.wikidata.org/wiki/Q5300","display_name":"Central processing unit","level":2,"score":0.5133787393569946},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.4688231647014618},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.415549099445343},{"id":"https://openalex.org/C84211073","wikidata":"https://www.wikidata.org/wiki/Q117879","display_name":"Floating point","level":2,"score":0.4110748767852783},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2602616548538208},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.22882071137428284},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11456769704818726},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.07725951075553894},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3233/978-1-61499-843-3-339","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-61499-843-3-339","pdf_url":null,"source":{"id":"https://openalex.org/S4210175178","display_name":"Advances in parallel computing","issn_l":"0927-5452","issn":["0927-5452","1879-808X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advances in Parallel Computing","raw_type":"book-chapter"},{"id":"pmh:oai:HAL:hal-01761605v1","is_oa":true,"landing_page_url":"https://hal.science/hal-01761605","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"www.parco.org","raw_type":"Conference papers"}],"best_oa_location":{"id":"pmh:oai:HAL:hal-01761605v1","is_oa":true,"landing_page_url":"https://hal.science/hal-01761605","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"www.parco.org","raw_type":"Conference papers"},"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.47999998927116394,"id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W46533625","https://openalex.org/W1494930385","https://openalex.org/W1975243156","https://openalex.org/W1975462624","https://openalex.org/W1977052086","https://openalex.org/W2011638694","https://openalex.org/W2021157069","https://openalex.org/W2021261510","https://openalex.org/W2057630513","https://openalex.org/W2075768929","https://openalex.org/W2104951519","https://openalex.org/W2114929171","https://openalex.org/W2148631859","https://openalex.org/W2159094357","https://openalex.org/W2310513352","https://openalex.org/W2731650325","https://openalex.org/W2801789732"],"related_works":["https://openalex.org/W2565725308","https://openalex.org/W2593628307","https://openalex.org/W3091978438","https://openalex.org/W4226248541","https://openalex.org/W4312862090","https://openalex.org/W4232853593","https://openalex.org/W2022441525","https://openalex.org/W2331916929","https://openalex.org/W2897504747","https://openalex.org/W2402775763"],"abstract_inverted_index":{"In":[0],"this":[1],"paper":[2],"we":[3,62],"present":[4,72],"an":[5],"optimization":[6],"of":[7,20,24,33,67,83],"a":[8,64,91],"spectral":[9],"finite":[10],"element":[11],"method":[12],"implementation.":[13],"The":[14,40],"improvements":[15],"consisted":[16],"in":[17,30],"the":[18,21,25,31,34,57,75,80],"modification":[19],"memory":[22],"layout":[23],"main":[26],"algorithmic":[27],"kernels":[28],"and":[29,49],"augmentation":[32],"arithmetic":[35],"intensity":[36],"via":[37],"loop":[38],"transformations.":[39],"code":[41,77],"has":[42],"been":[43],"deployed":[44],"on":[45,69,86],"multi-core":[46],"SIMD":[47],"machines":[48],"GPU.":[50],"Compared":[51],"to":[52],"our":[53,84],"starting":[54],"point,":[55],"i.e.":[56],"original":[58],"scalar":[59],"sequential":[60],"code,":[61],"achieved":[63],"speed":[65],"up":[66],"&amp;times;228":[68],"CPU.":[70],"We":[71],"comparisons":[73],"with":[74],"SPECFEM2D":[76],"that":[78],"prove":[79],"good":[81],"performances":[82],"implementation":[85],"similar":[87],"cases.":[88],"On":[89],"GPU,":[90],"hybrid":[92],"solution":[93],"is":[94],"investigated.":[95]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2018-04-06T00:00:00"}
