{"id":"https://openalex.org/W3116059414","doi":"https://doi.org/10.1109/tpds.2020.3046870","title":"iMLBench: A Machine Learning Benchmark Suite for CPU-GPU Integrated Architectures","display_name":"iMLBench: A Machine Learning Benchmark Suite for CPU-GPU Integrated Architectures","publication_year":2020,"publication_date":"2020-12-23","ids":{"openalex":"https://openalex.org/W3116059414","doi":"https://doi.org/10.1109/tpds.2020.3046870","mag":"3116059414"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2020.3046870","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2020.3046870","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100337319","display_name":"Chenyang Zhang","orcid":"https://orcid.org/0000-0002-7627-6359"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chenyang Zhang","raw_affiliation_strings":["Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091139467","display_name":"Feng Zhang","orcid":"https://orcid.org/0000-0003-1983-7321"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Zhang","raw_affiliation_strings":["Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024519576","display_name":"Xiaoguang Guo","orcid":"https://orcid.org/0000-0003-2795-2856"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoguang Guo","raw_affiliation_strings":["Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039946576","display_name":"Bingsheng He","orcid":"https://orcid.org/0000-0001-8618-4581"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Bingsheng He","raw_affiliation_strings":["School of Computing, National University of Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"School of Computing, National University of Singapore, Singapore","institution_ids":["https://openalex.org/I165932596"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100320957","display_name":"Xiao Zhang","orcid":"https://orcid.org/0009-0001-1857-1368"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao Zhang","raw_affiliation_strings":["Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008721449","display_name":"Xiaoyong Du","orcid":"https://orcid.org/0000-0002-5757-9135"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyong Du","raw_affiliation_strings":["Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Data Engineering and Knowledge Engineering (MOE), School of Information, Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100337319"],"corresponding_institution_ids":["https://openalex.org/I78988378"],"apc_list":null,"apc_paid":null,"fwci":3.0035,"has_fulltext":false,"cited_by_count":27,"citation_normalized_percentile":{"value":0.91855401,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"32","issue":"7","first_page":"1740","last_page":"1752"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8607107400894165},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7351576685905457},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5790322422981262},{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.5778540968894958},{"id":"https://openalex.org/keywords/pci-express","display_name":"PCI Express","score":0.5146649479866028},{"id":"https://openalex.org/keywords/central-processing-unit","display_name":"Central processing unit","score":0.43431979417800903},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.4277113676071167},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.39701318740844727},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.337067574262619},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.3256916403770447},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.2637786269187927}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8607107400894165},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7351576685905457},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5790322422981262},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.5778540968894958},{"id":"https://openalex.org/C64270927","wikidata":"https://www.wikidata.org/wiki/Q206924","display_name":"PCI Express","level":3,"score":0.5146649479866028},{"id":"https://openalex.org/C49154492","wikidata":"https://www.wikidata.org/wiki/Q5300","display_name":"Central processing unit","level":2,"score":0.43431979417800903},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.4277113676071167},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.39701318740844727},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.337067574262619},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.3256916403770447},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.2637786269187927},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2020.3046870","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2020.3046870","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.8899999856948853,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G1974609568","display_name":null,"funder_award_id":"61972403","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2029957150","display_name":null,"funder_award_id":"61732014","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5480676819","display_name":null,"funder_award_id":"62072459","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8057543385","display_name":null,"funder_award_id":"U1911203","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G992000842","display_name":null,"funder_award_id":"61802412","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W1502544429","https://openalex.org/W1669896463","https://openalex.org/W1815597787","https://openalex.org/W1991126176","https://openalex.org/W2033597569","https://openalex.org/W2034714579","https://openalex.org/W2080592089","https://openalex.org/W2103006842","https://openalex.org/W2118447204","https://openalex.org/W2129817042","https://openalex.org/W2149234156","https://openalex.org/W2165039583","https://openalex.org/W2169875292","https://openalex.org/W2172654076","https://openalex.org/W2273440736","https://openalex.org/W2339666327","https://openalex.org/W2416330002","https://openalex.org/W2461316586","https://openalex.org/W2489886790","https://openalex.org/W2527036487","https://openalex.org/W2548579001","https://openalex.org/W2591922920","https://openalex.org/W2592258897","https://openalex.org/W2593535610","https://openalex.org/W2593649365","https://openalex.org/W2605301016","https://openalex.org/W2616033262","https://openalex.org/W2740589650","https://openalex.org/W2766839578","https://openalex.org/W2767829706","https://openalex.org/W2769464294","https://openalex.org/W2883981356","https://openalex.org/W2887504043","https://openalex.org/W2946101992","https://openalex.org/W2972347634","https://openalex.org/W2980665882","https://openalex.org/W2994206871","https://openalex.org/W2998957070","https://openalex.org/W3006708286","https://openalex.org/W3006945411","https://openalex.org/W3008591352","https://openalex.org/W3012519163","https://openalex.org/W3013888980","https://openalex.org/W3025871655","https://openalex.org/W3032604551","https://openalex.org/W3043428597","https://openalex.org/W3098379356","https://openalex.org/W4248767818","https://openalex.org/W4253901332","https://openalex.org/W4285719527","https://openalex.org/W6629990375","https://openalex.org/W6694513646","https://openalex.org/W6735918857","https://openalex.org/W6741613141","https://openalex.org/W6745499037","https://openalex.org/W6769276135","https://openalex.org/W6775587188","https://openalex.org/W6780969450"],"related_works":["https://openalex.org/W4385894176","https://openalex.org/W2347371119","https://openalex.org/W2612768808","https://openalex.org/W3131402800","https://openalex.org/W2388965158","https://openalex.org/W2808480228","https://openalex.org/W2366201982","https://openalex.org/W2593071546","https://openalex.org/W1564576805","https://openalex.org/W2984905932"],"abstract_inverted_index":{"Utilizing":[0],"heterogeneous":[1],"accelerators,":[2],"especially":[3],"GPUs,":[4],"to":[5,12,25,136],"accelerate":[6],"machine":[7,26,35,54,81,95,120,140],"learning":[8,27,55,82,96,121,141],"tasks":[9,122],"has":[10,116],"shown":[11],"be":[13],"a":[14,77,91,138],"great":[15],"success":[16],"in":[17,53],"recent":[18],"years.":[19],"GPUs":[20],"bring":[21],"huge":[22],"performance":[23,157,169],"improvements":[24],"and":[28,98,123,131,171,185],"greatly":[29],"promote":[30],"the":[31,38,49,113,129,132,150,160,164],"widespread":[32],"adoption":[33],"of":[34,94],"learning.":[36],"However,":[37],"discrete":[39,197],"CPU-GPU":[40,65,85],"architecture":[41,152],"design":[42,76,166],"with":[43,68],"high":[44],"PCIe":[45,114],"transmission":[46],"overhead":[47,115],"decreases":[48],"GPU":[50,133],"computing":[51],"benefits":[52],"training":[56,83],"tasks.":[57],"To":[58],"overcome":[59],"such":[60],"limitations,":[61],"hardware":[62],"vendors":[63],"release":[64],"integrated":[66,86,106,151,177],"architectures":[67,178],"shared":[69],"unified":[70],"memory.":[71],"In":[72],"this":[73],"article,":[74],"we":[75],"benchmark":[78,200],"suite":[79],"for":[80,119],"on":[84,105,146],"architectures,":[87],"called":[88],"iMLBench,":[89],"covering":[90],"wide":[92],"range":[93],"applications":[97],"kernels.":[99],"We":[100],"mainly":[101],"explore":[102],"two":[103],"features":[104],"architectures:":[107],"1)":[108],"zero-copy,":[109],"which":[110,126],"means":[111,127],"that":[112,128,149],"been":[117],"eliminated":[118],"2)":[124],"co-running,":[125],"CPU":[130],"co-run":[134],"together":[135],"process":[137],"single":[139],"task.":[142],"Our":[143],"experimental":[144],"results":[145,181],"iMLBench":[147],"show":[148],"brings":[153,167,173],"an":[154],"average":[155],"7.1\u00d7":[156],"improvement":[158],"over":[159,196],"original":[161],"implementations.":[162],"Specifically,":[163],"zero-copy":[165],"4.65\u00d7":[168],"improvement,":[170],"co-running":[172],"1.78\u00d7":[174],"improvement.":[175],"Moreover,":[176],"exhibit":[179],"promising":[180],"from":[182],"both":[183],"performance-per-dollar":[184],"energy":[186,194],"perspectives,":[187],"achieving":[188],"6.50\u00d7":[189],"performance-price":[190],"ratio":[191],"while":[192],"4.06\u00d7":[193],"efficiency":[195],"GPUs.":[198],"The":[199],"is":[201],"open-sourced":[202],"at":[203],"https://github.com/ChenyangZhang-cs/iMLBench.":[204]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
