{"id":"https://openalex.org/W2808635636","doi":"https://doi.org/10.1504/ijac.2018.10013770","title":"WT_DMDA new scheduling strategy for conjugate gradient solver on heterogeneous architecture","display_name":"WT_DMDA new scheduling strategy for conjugate gradient solver on heterogeneous architecture","publication_year":2018,"publication_date":"2018-01-01","ids":{"openalex":"https://openalex.org/W2808635636","doi":"https://doi.org/10.1504/ijac.2018.10013770","mag":"2808635636"},"language":"en","primary_location":{"id":"doi:10.1504/ijac.2018.10013770","is_oa":false,"landing_page_url":"https://doi.org/10.1504/ijac.2018.10013770","pdf_url":null,"source":{"id":"https://openalex.org/S8724992","display_name":"International Journal of Autonomic Computing","issn_l":"1741-8569","issn":["1741-8569","1741-8577"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Autonomic Computing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019027943","display_name":"Pierre Manneback","orcid":"https://orcid.org/0000-0003-3990-3621"},"institutions":[{"id":"https://openalex.org/I126477371","display_name":"Mohammed V University","ror":"https://ror.org/00r8w8f84","country_code":"MA","type":"education","lineage":["https://openalex.org/I126477371"]}],"countries":["MA"],"is_corresponding":false,"raw_author_name":"Pierre Manneback","raw_affiliation_strings":["ENSIAS, Mohammed V University  Rabat Morocco"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"ENSIAS, Mohammed V University  Rabat Morocco","institution_ids":["https://openalex.org/I126477371"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026980527","display_name":"Sidi Ahmed Mahmoudi","orcid":"https://orcid.org/0000-0002-1530-9524"},"institutions":[{"id":"https://openalex.org/I126477371","display_name":"Mohammed V University","ror":"https://ror.org/00r8w8f84","country_code":"MA","type":"education","lineage":["https://openalex.org/I126477371"]}],"countries":["MA"],"is_corresponding":false,"raw_author_name":"Sidi Ahmed Mahmoudi","raw_affiliation_strings":["ENSIAS, Mohammed V University  Rabat Morocco"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"ENSIAS, Mohammed V University  Rabat Morocco","institution_ids":["https://openalex.org/I126477371"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048332059","display_name":"Najlae Kasmi","orcid":null},"institutions":[{"id":"https://openalex.org/I130929987","display_name":"University of Mons","ror":"https://ror.org/02qnnz951","country_code":"BE","type":"education","lineage":["https://openalex.org/I130929987"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Najlae Kasmi","raw_affiliation_strings":["Faculty of Engineering, University of Mons (UMONS), 20, Place du Parc, Mons, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, University of Mons (UMONS), 20, Place du Parc, Mons, Belgium","institution_ids":["https://openalex.org/I130929987"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112733980","display_name":"Mostapha Zbakh","orcid":"https://orcid.org/0000-0002-1408-3850"},"institutions":[{"id":"https://openalex.org/I130929987","display_name":"University of Mons","ror":"https://ror.org/02qnnz951","country_code":"BE","type":"education","lineage":["https://openalex.org/I130929987"]}],"countries":["BE"],"is_corresponding":false,"raw_author_name":"Mostapha Zbakh","raw_affiliation_strings":["Faculty of Engineering, University of Mons (UMONS), 20, Place du Parc, Mons, Belgium"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Engineering, University of Mons (UMONS), 20, Place du Parc, Mons, Belgium","institution_ids":["https://openalex.org/I130929987"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.10092294,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"3","issue":"1","first_page":"52","last_page":"52"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10792","display_name":"Matrix Theory and Algorithms","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9904999732971191,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9807000160217285,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7057961225509644},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.5887399911880493},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.5599492788314819},{"id":"https://openalex.org/keywords/conjugate-gradient-method","display_name":"Conjugate gradient method","score":0.5550108551979065},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.5432459115982056},{"id":"https://openalex.org/keywords/conjugate","display_name":"Conjugate","score":0.5147523880004883},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.36186033487319946},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.34308546781539917},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3364581763744354},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.20498380064964294},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.20419448614120483},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.10496193170547485}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7057961225509644},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.5887399911880493},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.5599492788314819},{"id":"https://openalex.org/C81184566","wikidata":"https://www.wikidata.org/wiki/Q1191895","display_name":"Conjugate gradient method","level":2,"score":0.5550108551979065},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.5432459115982056},{"id":"https://openalex.org/C197336794","wikidata":"https://www.wikidata.org/wiki/Q5161150","display_name":"Conjugate","level":2,"score":0.5147523880004883},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.36186033487319946},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.34308546781539917},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3364581763744354},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.20498380064964294},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.20419448614120483},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.10496193170547485},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1504/ijac.2018.10013770","is_oa":false,"landing_page_url":"https://doi.org/10.1504/ijac.2018.10013770","pdf_url":null,"source":{"id":"https://openalex.org/S8724992","display_name":"International Journal of Autonomic Computing","issn_l":"1741-8569","issn":["1741-8569","1741-8577"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Autonomic Computing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2143004018","https://openalex.org/W2330362314","https://openalex.org/W2435669318","https://openalex.org/W1995639836","https://openalex.org/W1543576583","https://openalex.org/W2754988198","https://openalex.org/W2052516204","https://openalex.org/W2107387898","https://openalex.org/W1993252583","https://openalex.org/W2952417160"],"abstract_inverted_index":{"Heterogeneous":[0],"systems":[1],"which":[2,65,103],"are":[3,10,40],"composed":[4],"of":[5,24,87,109,128,136,160,176,182],"multiple":[6],"CPUs":[7],"and":[8,12,31,36,90,141,166,180],"GPUs":[9,42,140],"more":[11,13,38],"attractive":[14],"as":[15,43],"platforms":[16],"for":[17],"high":[18],"performance":[19,48,108,169],"computing.":[20],"With":[21],"the":[22,56,60,83,88,91,107,110,126,129,168,174],"evolution":[23],"general":[25],"purpose":[26],"computation":[27],"on":[28,131],"GPU":[29],"(GPGPU)":[30],"corresponding":[32],"programming":[33],"frameworks":[34],"(OpenCL":[35],"CUDA),":[37],"applications":[39],"using":[41,54],"a":[44,73,98,132],"co-processor":[45],"to":[46,72,82,105,124,151,157],"achieve":[47],"that":[49,147,167],"could":[50],"not":[51],"be":[52,70,154],"accomplished":[53],"just":[55],"traditional":[57],"processors.":[58],"However,":[59],"main":[61],"problem":[62,77],"is":[63,78,170,185],"identifying":[64],"task":[66],"or":[67],"job":[68],"should":[69],"allocated":[71],"particular":[74],"device.":[75],"The":[76],"even":[79],"complicated":[80],"due":[81],"dissimilar":[84],"computational":[85,133],"power":[86],"CPU":[89],"GPU.":[92],"In":[93],"this":[94],"work":[95],"we":[96],"propose":[97],"new":[99],"scheduling":[100],"strategy":[101],"WT_DMDA":[102],"aims":[104],"optimise":[106],"preconditioned":[111],"conjugate":[112],"gradient":[113],"solver,":[114],"in":[115],"CPU-GPU":[116],"heterogeneous":[117],"environment.":[118],"We":[119,145],"use":[120],"StarPU":[121],"runtime":[122],"system":[123],"assess":[125],"efficiency":[127],"approach":[130],"platform":[134],"consisting":[135],"three":[137],"NVIDIA":[138],"Fermi":[139],"12":[142],"Intel":[143],"CPUs.":[144],"show":[146],"important":[148],"speedups":[149],"(up":[150],"5.13\u00d7)":[152],"may":[153],"reached":[155],"(relatively":[156],"default":[158],"scheduler":[159],"StarPU)":[161],"when":[162,172],"processing":[163],"large":[164],"matrices":[165],"advantageous":[171],"changing":[173],"granularity":[175],"tasks.":[177],"An":[178],"analysis":[179],"evaluation":[181],"these":[183],"results":[184],"discussed.":[186]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
