{"id":"https://openalex.org/W2969656814","doi":"https://doi.org/10.1109/icufn.2019.8806196","title":"Development of an Open ISA GPGPU for Edge Device Machine Learning Applications","display_name":"Development of an Open ISA GPGPU for Edge Device Machine Learning Applications","publication_year":2019,"publication_date":"2019-07-01","ids":{"openalex":"https://openalex.org/W2969656814","doi":"https://doi.org/10.1109/icufn.2019.8806196","mag":"2969656814"},"language":"en","primary_location":{"id":"doi:10.1109/icufn.2019.8806196","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icufn.2019.8806196","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 Eleventh International Conference on Ubiquitous and Future Networks (ICUFN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046574849","display_name":"Yu-Xiang Su","orcid":null},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yu-Xiang Su","raw_affiliation_strings":["Dept. of Electrical Engineering and Inst. of Computer & Communication Engineering, National Cheng Kung University, Tainan, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dept. of Electrical Engineering and Inst. of Computer & Communication Engineering, National Cheng Kung University, Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036995962","display_name":"Jhi-Han Jheng","orcid":null},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Jhi-Han Jheng","raw_affiliation_strings":["Dept. of Electrical Engineering and Inst. of Computer & Communication Engineering, National Cheng Kung University, Tainan, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dept. of Electrical Engineering and Inst. of Computer & Communication Engineering, National Cheng Kung University, Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028815027","display_name":"Dun-Jie Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Dun-Jie Chen","raw_affiliation_strings":["Dept. of Electrical Engineering and Inst. of Computer & Communication Engineering, National Cheng Kung University, Tainan, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dept. of Electrical Engineering and Inst. of Computer & Communication Engineering, National Cheng Kung University, Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111582905","display_name":"Chung\u2010Ho Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I91807558","display_name":"National Cheng Kung University","ror":"https://ror.org/01b8kcc49","country_code":"TW","type":"education","lineage":["https://openalex.org/I91807558"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chung-Ho Chen","raw_affiliation_strings":["Dept. of Electrical Engineering and Inst. of Computer & Communication Engineering, National Cheng Kung University, Tainan, Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Dept. of Electrical Engineering and Inst. of Computer & Communication Engineering, National Cheng Kung University, Tainan, Taiwan","institution_ids":["https://openalex.org/I91807558"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.186,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.55719481,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"214","last_page":"217"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9822999835014343,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8670833110809326},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.7885359525680542},{"id":"https://openalex.org/keywords/general-purpose-computing-on-graphics-processing-units","display_name":"General-purpose computing on graphics processing units","score":0.7377421855926514},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.5954605937004089},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.5920277833938599},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5374259352684021},{"id":"https://openalex.org/keywords/instruction-set","display_name":"Instruction set","score":0.5085824728012085},{"id":"https://openalex.org/keywords/edge-computing","display_name":"Edge computing","score":0.4740681052207947},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.42582160234451294},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4197397232055664},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.4125417172908783},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.4109051823616028},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.382931649684906},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.32693150639533997},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2951301336288452},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.24185311794281006},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.10079246759414673},{"id":"https://openalex.org/keywords/graphics","display_name":"Graphics","score":0.08420568704605103}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8670833110809326},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.7885359525680542},{"id":"https://openalex.org/C50630238","wikidata":"https://www.wikidata.org/wiki/Q971505","display_name":"General-purpose computing on graphics processing units","level":3,"score":0.7377421855926514},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.5954605937004089},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.5920277833938599},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5374259352684021},{"id":"https://openalex.org/C202491316","wikidata":"https://www.wikidata.org/wiki/Q272683","display_name":"Instruction set","level":2,"score":0.5085824728012085},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.4740681052207947},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.42582160234451294},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4197397232055664},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.4125417172908783},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.4109051823616028},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.382931649684906},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.32693150639533997},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2951301336288452},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.24185311794281006},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.10079246759414673},{"id":"https://openalex.org/C21442007","wikidata":"https://www.wikidata.org/wiki/Q1027879","display_name":"Graphics","level":2,"score":0.08420568704605103},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icufn.2019.8806196","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icufn.2019.8806196","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 Eleventh International Conference on Ubiquitous and Future Networks (ICUFN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":1,"referenced_works":["https://openalex.org/W2615663338"],"related_works":["https://openalex.org/W1963859303","https://openalex.org/W2364044215","https://openalex.org/W2389600408","https://openalex.org/W240129890","https://openalex.org/W3048701459","https://openalex.org/W2149078538","https://openalex.org/W2080146221","https://openalex.org/W2370314112","https://openalex.org/W1912958759","https://openalex.org/W2792081825"],"abstract_inverted_index":{"Hosting":[0],"the":[1,6,11,35,38,52,105,129,132,135],"deep":[2],"learning":[3,33,110],"model":[4],"on":[5,34],"cloud":[7],"may":[8],"not":[9],"be":[10],"best":[12],"solution":[13],"in":[14,117],"many":[15],"cases,":[16],"for":[17,82],"instance,":[18],"IoT":[19],"applications":[20],"or":[21,27],"autonomous":[22],"system":[23],"where":[24],"low":[25],"latency":[26],"enhanced":[28],"security":[29],"is":[30,115],"desirable.":[31],"Deep":[32],"edge":[36,66],"alleviates":[37],"above":[39],"issues,":[40],"and":[41,78,111,131],"provides":[42],"benefits":[43],"of":[44,54,108,128,134],"local":[45],"computation.":[46,67],"In":[47],"this":[48],"paper,":[49],"we":[50],"present":[51],"development":[53],"an":[55],"open":[56],"ISA":[57,76],"(instruction":[58],"set":[59],"architecture)":[60],"general":[61],"purpose":[62],"GPU":[63,86,95,114,123,136],"aimed":[64],"at":[65],"Our":[68],"GPU,":[69,71,130],"CASLab":[70,85,94],"uses":[72],"license-free,":[73],"royalty-free":[74],"HSAIL":[75],"specification":[77],"supports":[79,88],"OpenCL1.2/2.0":[80],"APIs":[81],"heterogeneous":[83],"computing.":[84],"also":[87],"TensorFlow":[89],"framework":[90],"with":[91,97],"CUDA-on-CL":[92],"technology.":[93],"IP":[96],"configurable":[98],"SIMT":[99],"Core":[100],"design":[101,119],"tailors":[102],"directly":[103],"to":[104],"computing":[106],"need":[107],"on-device":[109],"inference.":[112],"The":[113],"developed":[116],"ESL":[118],"methodology":[120],"which":[121],"incorporates":[122],"micro-architecture":[124],"exploration,":[125],"power":[126],"modelling":[127],"co-simulation":[133],"software":[137],"stack.":[138]},"counts_by_year":[{"year":2019,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
