{"id":"https://openalex.org/W3205985359","doi":"https://doi.org/10.23919/apnoms52696.2021.9562651","title":"Text-to-Speech with Model Compression on Edge Devices","display_name":"Text-to-Speech with Model Compression on Edge Devices","publication_year":2021,"publication_date":"2021-09-08","ids":{"openalex":"https://openalex.org/W3205985359","doi":"https://doi.org/10.23919/apnoms52696.2021.9562651","mag":"3205985359"},"language":"en","primary_location":{"id":"doi:10.23919/apnoms52696.2021.9562651","is_oa":false,"landing_page_url":"https://doi.org/10.23919/apnoms52696.2021.9562651","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 22nd Asia-Pacific Network Operations and Management Symposium (APNOMS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033123977","display_name":"Wai-Wan Koc","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":true,"raw_author_name":"Wai-Wan Koc","raw_affiliation_strings":["Department of Computer Science, College of Computer Science National Yang Ming Chiao Tung University, Hsinchu City, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, College of Computer Science National Yang Ming Chiao Tung University, Hsinchu City, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103713471","display_name":"Yung\u2010Ting Chang","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yung-Ting Chang","raw_affiliation_strings":["Department of Computer Science, College of Computer Science National Yang Ming Chiao Tung University, Hsinchu City, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, College of Computer Science National Yang Ming Chiao Tung University, Hsinchu City, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001803568","display_name":"Jian-Yu Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Jian-Yu Yu","raw_affiliation_strings":["Department of Computer Science, College of Computer Science National Yang Ming Chiao Tung University, Hsinchu City, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, College of Computer Science National Yang Ming Chiao Tung University, Hsinchu City, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050823674","display_name":"Ts\u00ec-U\u00ed \u0130k","orcid":"https://orcid.org/0000-0001-6432-9161"},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Tsi-Ui Ik","raw_affiliation_strings":["Department of Computer Science, College of Computer Science National Yang Ming Chiao Tung University, Hsinchu City, Taiwan"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science, College of Computer Science National Yang Ming Chiao Tung University, Hsinchu City, Taiwan","institution_ids":["https://openalex.org/I148366613"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5033123977"],"corresponding_institution_ids":["https://openalex.org/I148366613"],"apc_list":null,"apc_paid":null,"fwci":0.6798,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.76087869,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"114","last_page":"119"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9847000241279602,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/porting","display_name":"Porting","score":0.8321964740753174},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7884694337844849},{"id":"https://openalex.org/keywords/edge-device","display_name":"Edge device","score":0.7050991058349609},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.6538639068603516},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.629494845867157},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5683605670928955},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.525597095489502},{"id":"https://openalex.org/keywords/enhanced-data-rates-for-gsm-evolution","display_name":"Enhanced Data Rates for GSM Evolution","score":0.5170055627822876},{"id":"https://openalex.org/keywords/pruning","display_name":"Pruning","score":0.5161667466163635},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44314146041870117},{"id":"https://openalex.org/keywords/edge-computing","display_name":"Edge computing","score":0.43974217772483826}],"concepts":[{"id":"https://openalex.org/C106251023","wikidata":"https://www.wikidata.org/wiki/Q851989","display_name":"Porting","level":3,"score":0.8321964740753174},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7884694337844849},{"id":"https://openalex.org/C138236772","wikidata":"https://www.wikidata.org/wiki/Q25098575","display_name":"Edge device","level":3,"score":0.7050991058349609},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.6538639068603516},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.629494845867157},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5683605670928955},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.525597095489502},{"id":"https://openalex.org/C162307627","wikidata":"https://www.wikidata.org/wiki/Q204833","display_name":"Enhanced Data Rates for GSM Evolution","level":2,"score":0.5170055627822876},{"id":"https://openalex.org/C108010975","wikidata":"https://www.wikidata.org/wiki/Q500094","display_name":"Pruning","level":2,"score":0.5161667466163635},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44314146041870117},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.43974217772483826},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/apnoms52696.2021.9562651","is_oa":false,"landing_page_url":"https://doi.org/10.23919/apnoms52696.2021.9562651","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 22nd Asia-Pacific Network Operations and Management Symposium (APNOMS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.550000011920929,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G6611696618","display_name":null,"funder_award_id":"MOST109-2627-H-009-001,MOST110-2221-E-A49-063-MY3","funder_id":"https://openalex.org/F4320322795","funder_display_name":"Ministry of Science and Technology, Taiwan"}],"funders":[{"id":"https://openalex.org/F4320322795","display_name":"Ministry of Science and Technology, Taiwan","ror":"https://ror.org/02kv4zf79"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W2058641082","https://openalex.org/W2119144962","https://openalex.org/W2120847449","https://openalex.org/W2519091744","https://openalex.org/W2531207078","https://openalex.org/W2608554408","https://openalex.org/W2908511865","https://openalex.org/W2947963429","https://openalex.org/W2949382160","https://openalex.org/W2963000224","https://openalex.org/W2963122961","https://openalex.org/W2963140066","https://openalex.org/W2963363373","https://openalex.org/W2963609956","https://openalex.org/W2964243274","https://openalex.org/W2964299589","https://openalex.org/W2970418186","https://openalex.org/W2972885185","https://openalex.org/W4297689207","https://openalex.org/W6677580257","https://openalex.org/W6725543821","https://openalex.org/W6736780897"],"related_works":["https://openalex.org/W4322761281","https://openalex.org/W4238233472","https://openalex.org/W4313526662","https://openalex.org/W3111395152","https://openalex.org/W4312996489","https://openalex.org/W3106131444","https://openalex.org/W3216099748","https://openalex.org/W4205963435","https://openalex.org/W4313463379","https://openalex.org/W3214037210"],"abstract_inverted_index":{"The":[0,166],"application":[1],"of":[2,59,65,116,164,175,219,225],"voice":[3,15,35,134],"services":[4],"has":[5,68],"become":[6],"more":[7,130],"common":[8],"in":[9,37,207],"daily":[10],"life,":[11],"including":[12],"traffic":[13],"navigation,":[14],"assistants,":[16],"audio":[17],"books":[18],"and":[19,26,99,154,162,182,213],"so":[20],"on.":[21],"However,":[22],"considering":[23],"the":[24,53,57,62,104,114,117,139,158,173,189,199,205,217,220,222,226,240],"cost":[25],"variability,":[27],"it":[28,124],"is":[29,45,108,234,243],"difficult":[30],"to":[31,48,86,89,110,128,151,156,187],"fully":[32],"utilize":[33],"real":[34],"recordings":[36],"different":[38,91],"scenarios.":[39],"In":[40,136],"practice,":[41],"speech":[42,97,105,140,190,228],"synthesis":[43,106,141,191,229],"technology":[44],"usually":[46],"used":[47],"mimic":[49],"human":[50],"voices;":[51],"On":[52,198],"other":[54,200],"hand,":[55,201],"with":[56,113],"development":[58],"computer":[60],"equipment,":[61],"computing":[63],"power":[64],"edge":[66,87,111,152,196,232],"devices":[67,88],"also":[69],"gradually":[70],"improved,":[71],"which":[72],"enables":[73],"light":[74],"deep-learning":[75],"network":[76,107,142,192,230],"inference.":[77],"Currently,":[78],"many":[79],"deep":[80,176],"learning":[81,177],"technologies":[82],"have":[83],"been":[84],"ported":[85,109,150],"create":[90],"applications,":[92],"such":[93],"as":[94],"face":[95],"recognition,":[96,98],"photo":[100],"retouching.":[101],"Therefore,":[102],"if":[103],"devices,":[112],"advent":[115],"fifth":[118],"generation":[119,122],"mobile":[120],"communication":[121],"(5G),":[123],"would":[125,169],"be":[126,149,170],"able":[127],"provide":[129],"innovative":[131],"basis":[132],"for":[133],"services.":[135],"this":[137],"research,":[138],"Tacotron2":[143,227],"[1]":[144],"+":[145],"CBHG":[146],"[2]":[147],"will":[148],"device":[153,233],"aims":[155],"optimize":[157],"model":[159,167,241],"inference":[160,223],"time":[161],"amount":[163],"parameters.":[165],"optimization":[168],"based":[171],"on":[172,195,231],"compression":[174,218],"network,":[178],"quantization,":[179],"structured":[180],"pruning":[181],"low-rank":[183],"matrix":[184],"approximation":[185],"techniques":[186],"allow":[188],"working":[193],"effectively":[194],"devices.":[197],"we":[202],"get":[203],"over":[204],"difference":[206],"library":[208],"support":[209],"between":[210],"TensorFlow":[211,214],"1.5":[212],"Lite.":[215],"After":[216],"model,":[221],"speed":[224],"increased":[235],"by":[236,245],"1.91":[237],"times,":[238],"while":[239],"size":[242],"reduced":[244],"86%":[246],"respectively.":[247]},"counts_by_year":[{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
