{"id":"https://openalex.org/W2563989965","doi":"https://doi.org/10.3233/978-1-61499-621-7-237","title":"Exploring the Offload Execution Model in the Intel Xeon Phi via Matrix Inversion","display_name":"Exploring the Offload Execution Model in the Intel Xeon Phi via Matrix Inversion","publication_year":2016,"publication_date":"2016-01-01","ids":{"openalex":"https://openalex.org/W2563989965","doi":"https://doi.org/10.3233/978-1-61499-621-7-237","mag":"2563989965"},"language":"en","primary_location":{"id":"doi:10.3233/978-1-61499-621-7-237","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-61499-621-7-237","pdf_url":null,"source":{"id":"https://openalex.org/S4210175178","display_name":"Advances in parallel computing","issn_l":"0927-5452","issn":["0927-5452","1879-808X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advances in Parallel Computing","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Benner Peter","orcid":null},"institutions":[{"id":"https://openalex.org/I149899117","display_name":"Max Planck Society","ror":"https://ror.org/01hhn8329","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I149899117"]},{"id":"https://openalex.org/I4210127568","display_name":"Max Planck Institute for Dynamics of Complex Technical Systems","ror":"https://ror.org/030h7k016","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210127568"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Benner Peter","raw_affiliation_strings":["Computational Methods in Systems and Control Theory, Max Planck Institute for Dynamics of Complex Technical Systems, Max Planck Society"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computational Methods in Systems and Control Theory, Max Planck Institute for Dynamics of Complex Technical Systems, Max Planck Society","institution_ids":["https://openalex.org/I4210127568","https://openalex.org/I149899117"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039665879","display_name":"Pablo Ezzatti","orcid":"https://orcid.org/0000-0002-2368-8907"},"institutions":[{"id":"https://openalex.org/I180910786","display_name":"Universidad de la Rep\u00fablica de Uruguay","ror":"https://ror.org/030bbe882","country_code":"UY","type":"education","lineage":["https://openalex.org/I180910786"]}],"countries":["UY"],"is_corresponding":false,"raw_author_name":"Ezzatti Pablo","raw_affiliation_strings":["Instituto de Computaci\u00f3n, Universidad de la Rep\u00fablica, 11300-Montevideo, Uruguay#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Instituto de Computaci\u00f3n, Universidad de la Rep\u00fablica, 11300-Montevideo, Uruguay#TAB#","institution_ids":["https://openalex.org/I180910786"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012806004","display_name":"Enrique S. Quintana\u2013Ort\u0301\u0131","orcid":"https://orcid.org/0000-0002-5454-165X"},"institutions":[{"id":"https://openalex.org/I10902133","display_name":"Universitat Jaume I","ror":"https://ror.org/02ws1xc11","country_code":"ES","type":"education","lineage":["https://openalex.org/I10902133"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Quintana-Ort&iacute; Enrique S.","raw_affiliation_strings":["Universitat Jaume I Castell\u00f3n, Spain#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universitat Jaume I Castell\u00f3n, Spain#TAB#","institution_ids":["https://openalex.org/I10902133"]}]},{"author_position":"last","author":{"id":null,"display_name":"Rem&oacute;n Alfredo","orcid":null},"institutions":[{"id":"https://openalex.org/I149899117","display_name":"Max Planck Society","ror":"https://ror.org/01hhn8329","country_code":"DE","type":"nonprofit","lineage":["https://openalex.org/I149899117"]},{"id":"https://openalex.org/I4210127568","display_name":"Max Planck Institute for Dynamics of Complex Technical Systems","ror":"https://ror.org/030h7k016","country_code":"DE","type":"facility","lineage":["https://openalex.org/I149899117","https://openalex.org/I4210127568"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Rem&oacute;n Alfredo","raw_affiliation_strings":["Computational Methods in Systems and Control Theory, Max Planck Institute for Dynamics of Complex Technical Systems, Max Planck Society"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computational Methods in Systems and Control Theory, Max Planck Institute for Dynamics of Complex Technical Systems, Max Planck Society","institution_ids":["https://openalex.org/I4210127568","https://openalex.org/I149899117"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I149899117","https://openalex.org/I4210127568"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.27425373,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10904","display_name":"Embedded Systems Design Techniques","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/xeon-phi","display_name":"Xeon Phi","score":0.8553204536437988},{"id":"https://openalex.org/keywords/inversion","display_name":"Inversion (geology)","score":0.7162653207778931},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.6491857767105103},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.620765745639801},{"id":"https://openalex.org/keywords/xeon","display_name":"Xeon","score":0.6059019565582275},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.39362674951553345},{"id":"https://openalex.org/keywords/geology","display_name":"Geology","score":0.06901389360427856}],"concepts":[{"id":"https://openalex.org/C96972482","wikidata":"https://www.wikidata.org/wiki/Q1049168","display_name":"Xeon Phi","level":2,"score":0.8553204536437988},{"id":"https://openalex.org/C1893757","wikidata":"https://www.wikidata.org/wiki/Q3653001","display_name":"Inversion (geology)","level":3,"score":0.7162653207778931},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.6491857767105103},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.620765745639801},{"id":"https://openalex.org/C145108525","wikidata":"https://www.wikidata.org/wiki/Q656154","display_name":"Xeon","level":2,"score":0.6059019565582275},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.39362674951553345},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.06901389360427856},{"id":"https://openalex.org/C109007969","wikidata":"https://www.wikidata.org/wiki/Q749565","display_name":"Structural basin","level":2,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.3233/978-1-61499-621-7-237","is_oa":false,"landing_page_url":"https://doi.org/10.3233/978-1-61499-621-7-237","pdf_url":null,"source":{"id":"https://openalex.org/S4210175178","display_name":"Advances in parallel computing","issn_l":"0927-5452","issn":["0927-5452","1879-808X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"book series"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advances in Parallel Computing","raw_type":"book-chapter"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2526069705","https://openalex.org/W2024016913","https://openalex.org/W2214459866","https://openalex.org/W2035419609","https://openalex.org/W2773471004","https://openalex.org/W2898398754","https://openalex.org/W2749903484","https://openalex.org/W2204115394","https://openalex.org/W2936534257","https://openalex.org/W2090306017"],"abstract_inverted_index":{"The":[0],"explicit":[1],"inversion":[2,49],"of":[3,26,54,83,108,134],"dense":[4],"matrices":[5],"appears":[6],"in":[7],"a":[8,105,117],"numerous":[9],"key":[10],"scientific":[11],"and":[12,31,78,125],"engineering":[13],"applications":[14],"such":[15,63],"as":[16,64],"model":[17,95],"reduction":[18],"or":[19,68],"optimal":[20],"control,":[21],"asking":[22],"for":[23,47,60],"the":[24,34,69,92,98,109,112,132,138],"exploitation":[25],"high":[27],"performance":[28],"computing":[29],"techniques":[30],"architectures":[32],"when":[33],"problem":[35],"dimension":[36],"is":[37,42],"large.":[38],"Gauss-Jordan":[39],"elimination":[40],"(GJE)":[41],"an":[43,126],"efficient":[44,140],"in-place":[45],"method":[46],"matrix":[48],"that":[50,89],"exposes":[51],"large":[52],"amounts":[53],"dataparallelism,":[55],"making":[56],"it":[57],"very":[58],"convenient":[59],"hardware":[61],"accelerators":[62],"graphics":[65],"processors":[66,124],"(GPUs)":[67],"Intel":[70,99,121,127],"Xeon":[71,100,122,128],"Phi.":[72],"In":[73],"this":[74],"paper,":[75],"we":[76],"present":[77],"evaluate":[79],"several":[80],"practical":[81],"implementations":[82],"GJE,":[84],"with":[85,119,137],"partial":[86],"row":[87],"pivoting,":[88],"especially":[90],"exploit":[91],"off-load":[93],"execution":[94],"available":[96],"on":[97,111,116],"Phi":[101,129],"to":[102],"carry":[103],"out":[104],"significant":[106],"fraction":[107],"computations":[110],"accelerator.":[113],"Numerical":[114],"experiments":[115],"system":[118],"two":[120],"E5-2640v3":[123],"7120P":[130],"compare":[131],"efficiency":[133],"these":[135],"implementations,":[136],"most":[139],"case":[141],"delivering":[142],"about":[143],"700":[144],"billions":[145],"double-precision":[146],"floating-point":[147],"operations":[148],"per":[149],"second.":[150]},"counts_by_year":[],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2017-01-06T00:00:00"}
