{"id":"https://openalex.org/W4288059664","doi":"https://doi.org/10.1109/tpds.2022.3193867","title":"Accelerating Tensor Swapping in GPUs With Self-Tuning Compression","display_name":"Accelerating Tensor Swapping in GPUs With Self-Tuning Compression","publication_year":2022,"publication_date":"2022-07-26","ids":{"openalex":"https://openalex.org/W4288059664","doi":"https://doi.org/10.1109/tpds.2022.3193867"},"language":"en","primary_location":{"id":"doi:10.1109/tpds.2022.3193867","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2022.3193867","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101585958","display_name":"Ping Chen","orcid":"https://orcid.org/0000-0001-6973-0755"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]},{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ping Chen","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Hangzhou, China","Zhejiang Laboratory, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I168879160"]},{"raw_affiliation_string":"Zhejiang Laboratory, Hangzhou, China","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004997843","display_name":"Shuibing He","orcid":"https://orcid.org/0000-0002-7075-4153"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]},{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuibing He","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Hangzhou, China","Zhejiang Laboratory, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I168879160"]},{"raw_affiliation_string":"Zhejiang Laboratory, Hangzhou, China","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084907146","display_name":"Xuechen Zhang","orcid":"https://orcid.org/0000-0002-3730-8901"},"institutions":[{"id":"https://openalex.org/I137317281","display_name":"Washington State University Vancouver","ror":"https://ror.org/00g2fk805","country_code":"US","type":"education","lineage":["https://openalex.org/I137317281","https://openalex.org/I72951846"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xuechen Zhang","raw_affiliation_strings":["School of Engineering and Computer Science, Washington State University Vancouver, Vancouver, WA, USA"],"affiliations":[{"raw_affiliation_string":"School of Engineering and Computer Science, Washington State University Vancouver, Vancouver, WA, USA","institution_ids":["https://openalex.org/I137317281"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071132411","display_name":"Shuaiben Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]},{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuaiben Chen","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Hangzhou, China","Zhejiang Laboratory, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I168879160"]},{"raw_affiliation_string":"Zhejiang Laboratory, Hangzhou, China","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046080015","display_name":"Peiyi Hong","orcid":"https://orcid.org/0009-0001-6046-4988"},"institutions":[{"id":"https://openalex.org/I4210123185","display_name":"Zhejiang Lab","ror":"https://ror.org/02m2h7991","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210123185"]},{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peiyi Hong","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Hangzhou, China","Zhejiang Laboratory, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I168879160"]},{"raw_affiliation_string":"Zhejiang Laboratory, Hangzhou, China","institution_ids":["https://openalex.org/I4210123185"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101508047","display_name":"Yanlong Yin","orcid":"https://orcid.org/0009-0004-1505-4295"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yanlong Yin","raw_affiliation_strings":["Institute of Open Source Chip, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Open Source Chip, Beijing, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057665558","display_name":"Xian\u2010He Sun","orcid":"https://orcid.org/0000-0002-1093-0792"},"institutions":[{"id":"https://openalex.org/I180949307","display_name":"Illinois Institute of Technology","ror":"https://ror.org/037t3ry66","country_code":"US","type":"education","lineage":["https://openalex.org/I180949307"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xian-He Sun","raw_affiliation_strings":["Department of Computer Science, Illinois Institute of Technology, Chicago, IL, USA"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, Illinois Institute of Technology, Chicago, IL, USA","institution_ids":["https://openalex.org/I180949307"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101585958"],"corresponding_institution_ids":["https://openalex.org/I168879160","https://openalex.org/I4210123185"],"apc_list":null,"apc_paid":null,"fwci":1.1347,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.75860785,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"33","issue":"12","first_page":"4484","last_page":"4498"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12303","display_name":"Tensor decomposition and applications","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2605","display_name":"Computational Mathematics"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8167904615402222},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.677387535572052},{"id":"https://openalex.org/keywords/lossy-compression","display_name":"Lossy compression","score":0.6035688519477844},{"id":"https://openalex.org/keywords/software-portability","display_name":"Software portability","score":0.580987811088562},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.575955331325531},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.5267828106880188},{"id":"https://openalex.org/keywords/lossless-compression","display_name":"Lossless compression","score":0.5220541954040527},{"id":"https://openalex.org/keywords/data-compression-ratio","display_name":"Data compression ratio","score":0.45980966091156006},{"id":"https://openalex.org/keywords/tensor","display_name":"Tensor (intrinsic definition)","score":0.4581138491630554},{"id":"https://openalex.org/keywords/compression-ratio","display_name":"Compression ratio","score":0.44596612453460693},{"id":"https://openalex.org/keywords/cuda","display_name":"CUDA","score":0.4429045021533966},{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.4221719205379486},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.4161013662815094},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.413303941488266},{"id":"https://openalex.org/keywords/computational-science","display_name":"Computational science","score":0.37086179852485657},{"id":"https://openalex.org/keywords/computer-engineering","display_name":"Computer engineering","score":0.33444786071777344},{"id":"https://openalex.org/keywords/image-compression","display_name":"Image compression","score":0.30981314182281494},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.24923253059387207},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.22490882873535156},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.18408054113388062},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.08871975541114807}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8167904615402222},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.677387535572052},{"id":"https://openalex.org/C165021410","wikidata":"https://www.wikidata.org/wiki/Q55564","display_name":"Lossy compression","level":2,"score":0.6035688519477844},{"id":"https://openalex.org/C63000827","wikidata":"https://www.wikidata.org/wiki/Q3080428","display_name":"Software portability","level":2,"score":0.580987811088562},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.575955331325531},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.5267828106880188},{"id":"https://openalex.org/C81081738","wikidata":"https://www.wikidata.org/wiki/Q55542","display_name":"Lossless compression","level":3,"score":0.5220541954040527},{"id":"https://openalex.org/C94835093","wikidata":"https://www.wikidata.org/wiki/Q3113333","display_name":"Data compression ratio","level":5,"score":0.45980966091156006},{"id":"https://openalex.org/C155281189","wikidata":"https://www.wikidata.org/wiki/Q3518150","display_name":"Tensor (intrinsic definition)","level":2,"score":0.4581138491630554},{"id":"https://openalex.org/C25797200","wikidata":"https://www.wikidata.org/wiki/Q828137","display_name":"Compression ratio","level":3,"score":0.44596612453460693},{"id":"https://openalex.org/C2778119891","wikidata":"https://www.wikidata.org/wiki/Q477690","display_name":"CUDA","level":2,"score":0.4429045021533966},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.4221719205379486},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.4161013662815094},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.413303941488266},{"id":"https://openalex.org/C459310","wikidata":"https://www.wikidata.org/wiki/Q117801","display_name":"Computational science","level":1,"score":0.37086179852485657},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.33444786071777344},{"id":"https://openalex.org/C13481523","wikidata":"https://www.wikidata.org/wiki/Q412438","display_name":"Image compression","level":4,"score":0.30981314182281494},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.24923253059387207},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.22490882873535156},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.18408054113388062},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.08871975541114807},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C171146098","wikidata":"https://www.wikidata.org/wiki/Q124192","display_name":"Automotive engineering","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C511840579","wikidata":"https://www.wikidata.org/wiki/Q12757","display_name":"Internal combustion engine","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tpds.2022.3193867","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpds.2022.3193867","pdf_url":null,"source":{"id":"https://openalex.org/S97130795","display_name":"IEEE Transactions on Parallel and Distributed Systems","issn_l":"1045-9219","issn":["1045-9219","1558-2183","2161-9883"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Parallel and Distributed Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4065653633","display_name":null,"funder_award_id":"CNS 1906541","funder_id":"https://openalex.org/F4320335353","funder_display_name":"National Science Foundation of Sri Lanka"},{"id":"https://openalex.org/G4779957870","display_name":null,"funder_award_id":"62172361","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335353","display_name":"National Science Foundation of Sri Lanka","ror":"https://ror.org/010xaa060"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":60,"referenced_works":["https://openalex.org/W1677182931","https://openalex.org/W1686810756","https://openalex.org/W1800261609","https://openalex.org/W1919191429","https://openalex.org/W1921523184","https://openalex.org/W1964940342","https://openalex.org/W1994211684","https://openalex.org/W2057331441","https://openalex.org/W2071460053","https://openalex.org/W2102003408","https://openalex.org/W2108598243","https://openalex.org/W2125283600","https://openalex.org/W2142265837","https://openalex.org/W2194775991","https://openalex.org/W2279098554","https://openalex.org/W2489529491","https://openalex.org/W2618530766","https://openalex.org/W2746416407","https://openalex.org/W2788728386","https://openalex.org/W2792643794","https://openalex.org/W2798707674","https://openalex.org/W2809901035","https://openalex.org/W2886851211","https://openalex.org/W2896457183","https://openalex.org/W2911892981","https://openalex.org/W2962821792","https://openalex.org/W2963285578","https://openalex.org/W2964350391","https://openalex.org/W2971843695","https://openalex.org/W2973031157","https://openalex.org/W2979690924","https://openalex.org/W3010830594","https://openalex.org/W3012479151","https://openalex.org/W3012514909","https://openalex.org/W3043494828","https://openalex.org/W3044837714","https://openalex.org/W3103572230","https://openalex.org/W3106011734","https://openalex.org/W3118608800","https://openalex.org/W3124675547","https://openalex.org/W3167436278","https://openalex.org/W3206867815","https://openalex.org/W4200309432","https://openalex.org/W4285148475","https://openalex.org/W4293718192","https://openalex.org/W4297775537","https://openalex.org/W4301361180","https://openalex.org/W6637373629","https://openalex.org/W6640185926","https://openalex.org/W6676297131","https://openalex.org/W6685562342","https://openalex.org/W6694260854","https://openalex.org/W6695314431","https://openalex.org/W6732520560","https://openalex.org/W6737664043","https://openalex.org/W6749029207","https://openalex.org/W6752790953","https://openalex.org/W6755207826","https://openalex.org/W6767971408","https://openalex.org/W6787972765"],"related_works":["https://openalex.org/W3020739840","https://openalex.org/W2913998709","https://openalex.org/W4386875822","https://openalex.org/W3177128669","https://openalex.org/W4388483283","https://openalex.org/W4385574943","https://openalex.org/W4381744720","https://openalex.org/W2088378984","https://openalex.org/W3080614128","https://openalex.org/W4200061735"],"abstract_inverted_index":{"Data":[0,34],"swapping":[1,35,59,221],"between":[2],"CPUs":[3],"and":[4,98,100,139,144,170,227,238],"GPUs":[5,54,72,135],"is":[6,43,145],"widely":[7],"used":[8],"to":[9,103,162,179,181,214,225],"address":[10],"the":[11,46,57,68,127,171,205],"GPU":[12,31,149],"memory":[13,27,70,88,129],"shortage":[14],"issue":[15],"when":[16,40],"training":[17,200],"deep":[18],"neural":[19],"networks":[20],"(DNNs)":[21],"requiring":[22],"a":[23,30,38,115],"larger":[24],"amount":[25],"of":[26,48,71,78,131,173],"than":[28,45],"that":[29,159],"may":[32,36],"have.":[33],"become":[37],"bottleneck":[39],"its":[41,81],"latency":[42,47,222],"longer":[44],"DNN":[49,182,211,234],"computations.":[50],"Tensor":[51],"compression":[52,91,96,118,156,167,174,192],"in":[53,67,87],"can":[55],"reduce":[56],"data":[58],"time.":[60],"However,":[61],"existing":[62],"works":[63],"on":[64,110,148,157],"compressing":[65],"tensors":[66,105,158,195],"virtual":[69,128],"have":[73],"three":[74],"major":[75],"issues:":[76],"lack":[77],"portability":[79,143],"because":[80,106],"implementation":[82],"requires":[83],"additional":[84],"(de)compression":[85,137],"units":[86],"controllers,":[89],"sub-optimal":[90],"performance":[92],"for":[93,125,136,193,233],"varying":[94],"tensor":[95,117,220],"ratios":[97],"sizes,":[99],"poor":[101],"adaptation":[102],"dense":[104,185,194,239],"they":[107],"only":[108,154],"focus":[109],"sparse":[111,237],"tensors.":[112],"We":[113,203],"propose":[114],"self-tuning":[116],"framework,":[119],"named":[120],"<sc":[121,216],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[122,217],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">CSwap+</small>":[123,218],",":[124],"improving":[126],"management":[130],"GPUs.":[132],"It":[133],"uses":[134],"directly":[138],"thus":[140],"has":[141],"high":[142],"minimally":[146],"dependent":[147],"architecture":[150],"features.":[151],"Furthermore,":[152],"it":[153,187],"applies":[155],"are":[160],"deemed":[161],"be":[163],"cost-effective":[164,190],"considering":[165],"their":[166],"ratio,":[168],"size,":[169],"characteristics":[172],"algorithms":[175],"at":[176],"runtime.":[177],"Finally,":[178],"adapt":[180],"models":[183,235],"with":[184,196,229,236],"tensors,":[186,240],"also":[188],"supports":[189],"lossy":[191],"nearly":[197],"no":[198],"model":[199],"accuracy":[201],"degradation.":[202],"conduct":[204],"experiments":[206],"through":[207],"six":[208],"representative":[209],"memory-intensive":[210],"models.":[212],"Compared":[213],"vDNN,":[215],"reduces":[219],"by":[223],"up":[224],"50.9%":[226],"46.1%":[228],"NVIDIA":[230],"V100":[231],"GPU,":[232],"respectively.":[241]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
