{"id":"https://openalex.org/W4283824636","doi":"https://doi.org/10.21437/interspeech.2022-644","title":"TMGAN-PLC: Audio Packet Loss Concealment using Temporal Memory Generative Adversarial Network","display_name":"TMGAN-PLC: Audio Packet Loss Concealment using Temporal Memory Generative Adversarial Network","publication_year":2022,"publication_date":"2022-09-16","ids":{"openalex":"https://openalex.org/W4283824636","doi":"https://doi.org/10.21437/interspeech.2022-644"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2022-644","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2022-644","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2022","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020584403","display_name":"Yuansheng Guan","orcid":null},"institutions":[{"id":"https://openalex.org/I37987034","display_name":"Guangzhou University","ror":"https://ror.org/05ar8rn06","country_code":"CN","type":"education","lineage":["https://openalex.org/I37987034"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yuansheng Guan","raw_affiliation_strings":["School of Electronics and Communication Engineering, Guangzhou University, Guangzhou, China","Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Communication Engineering, Guangzhou University, Guangzhou, China","institution_ids":["https://openalex.org/I37987034"]},{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100568171","display_name":"Guochen Yu","orcid":null},"institutions":[{"id":"https://openalex.org/I75689368","display_name":"Communication University of China","ror":"https://ror.org/04facbs33","country_code":"CN","type":"education","lineage":["https://openalex.org/I75689368"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guochen Yu","raw_affiliation_strings":["Communication University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Communication University of China, Beijing, China","institution_ids":["https://openalex.org/I75689368"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053757616","display_name":"Andong Li","orcid":"https://orcid.org/0000-0003-4094-8448"},"institutions":[{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Andong Li","raw_affiliation_strings":["Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070266277","display_name":"Chengshi Zheng","orcid":"https://orcid.org/0000-0001-5656-994X"},"institutions":[{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chengshi Zheng","raw_affiliation_strings":["Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100440062","display_name":"Jie Wang","orcid":"https://orcid.org/0009-0009-2444-585X"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210099069","display_name":"Institute of Acoustics","ror":"https://ror.org/00v8rqv75","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210099069"]},{"id":"https://openalex.org/I37987034","display_name":"Guangzhou University","ror":"https://ror.org/05ar8rn06","country_code":"CN","type":"education","lineage":["https://openalex.org/I37987034"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Wang","raw_affiliation_strings":["School of Electronics and Communication Engineering, Guangzhou University, Guangzhou, China","Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Electronics and Communication Engineering, Guangzhou University, Guangzhou, China","institution_ids":["https://openalex.org/I37987034"]},{"raw_affiliation_string":"Key Laboratory of Noise and Vibration Research, Institute of Acoustics, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210099069","https://openalex.org/I19820366"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5020584403"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I37987034","https://openalex.org/I4210099069"],"apc_list":null,"apc_paid":null,"fwci":1.471,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.84612954,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":98},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10822","display_name":"Acoustic Wave Phenomena Research","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.989300012588501,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8198838829994202},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.6334140300750732},{"id":"https://openalex.org/keywords/network-packet","display_name":"Network packet","score":0.5493410229682922},{"id":"https://openalex.org/keywords/packet-loss","display_name":"Packet loss","score":0.49918198585510254},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.45266446471214294},{"id":"https://openalex.org/keywords/generative-adversarial-network","display_name":"Generative adversarial network","score":0.41813114285469055},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.35164323449134827},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.25804561376571655},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.18819338083267212}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8198838829994202},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.6334140300750732},{"id":"https://openalex.org/C158379750","wikidata":"https://www.wikidata.org/wiki/Q214111","display_name":"Network packet","level":2,"score":0.5493410229682922},{"id":"https://openalex.org/C54108766","wikidata":"https://www.wikidata.org/wiki/Q391064","display_name":"Packet loss","level":3,"score":0.49918198585510254},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.45266446471214294},{"id":"https://openalex.org/C2988773926","wikidata":"https://www.wikidata.org/wiki/Q25104379","display_name":"Generative adversarial network","level":3,"score":0.41813114285469055},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.35164323449134827},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.25804561376571655},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.18819338083267212}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2022-644","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2022-644","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2022","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.6499999761581421}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1552314771","https://openalex.org/W1677182931","https://openalex.org/W1836465849","https://openalex.org/W2067295501","https://openalex.org/W2094721231","https://openalex.org/W2131738223","https://openalex.org/W2137431935","https://openalex.org/W2145103350","https://openalex.org/W2243752967","https://openalex.org/W2476548250","https://openalex.org/W2799789537","https://openalex.org/W2940177920","https://openalex.org/W2963799213","https://openalex.org/W2970006822","https://openalex.org/W2971074500","https://openalex.org/W2972745527","https://openalex.org/W3011573174","https://openalex.org/W3015338123","https://openalex.org/W3022195800","https://openalex.org/W3025800305","https://openalex.org/W3094910704","https://openalex.org/W3096408984","https://openalex.org/W3097627357","https://openalex.org/W3160450938","https://openalex.org/W3197260772","https://openalex.org/W3207100935","https://openalex.org/W4205169642","https://openalex.org/W4288265053","https://openalex.org/W4294764252","https://openalex.org/W4296069296"],"related_works":["https://openalex.org/W2502115930","https://openalex.org/W4246396837","https://openalex.org/W3176240006","https://openalex.org/W3126451824","https://openalex.org/W2482350142","https://openalex.org/W1561927205","https://openalex.org/W4385421777","https://openalex.org/W2971552217","https://openalex.org/W3199712142","https://openalex.org/W2134402536"],"abstract_inverted_index":{"Real-time":[0],"communications":[1],"in":[2,9,22,112,167],"packet-switched":[3],"networks":[4],"have":[5,35],"become":[6],"widely":[7],"used":[8],"daily":[10],"communication,":[11],"while":[12],"they":[13],"inevitably":[14],"suffer":[15],"from":[16],"network":[17,81],"delays":[18],"and":[19,52,95,104,121,147,173],"data":[20],"losses":[21],"constrained":[23],"real-time":[24],"conditions.To":[25],"solve":[26],"these":[27],"problems,":[28],"audio":[29,83],"packet":[30,70],"loss":[31,134],"concealment":[32],"(PLC)":[33],"algorithms":[34],"been":[36],"developed":[37],"to":[38,61,115,142],"mitigate":[39],"voice":[40,64],"transmission":[41,50],"failures":[42],"by":[43,48,132],"reconstructing":[44],"the":[45,49,96,102,113,118,127,144,149,155,161],"lost":[46],"information.Limited":[47],"latency":[51],"device":[53],"memory,":[54],"it":[55],"is":[56,88,109],"still":[57],"intractable":[58],"for":[59,82],"PLC":[60,156],"accomplish":[62],"high-quality":[63],"reconstruction":[65],"using":[66],"a":[67,76,91,99],"relatively":[68],"small":[69],"buffer.In":[71],"this":[72],"paper,":[73],"we":[74,136],"propose":[75],"temporal":[77,105,124],"memory":[78],"generative":[79],"adversarial":[80],"PLC,":[84],"dubbed":[85],"TMGAN-PLC,":[86],"which":[87],"comprised":[89],"of":[90,101,169],"novel":[92],"nested-UNet":[93,103],"generator":[94,114],"time-domain/frequency-domain":[97],"discriminators.Specifically,":[98],"combination":[100],"featurewise":[106],"linear":[107],"modulation":[108],"elaborately":[110],"devised":[111],"finely":[116],"adjust":[117],"intra-frame":[119],"information":[120],"establish":[122],"inter-frame":[123],"dependencies.To":[125],"complement":[126],"missing":[128],"speech":[129,170],"content":[130,146],"caused":[131],"longer":[133],"bursts,":[135],"employ":[137],"multistage":[138],"gated":[139],"vector":[140],"quantizers":[141],"capture":[143],"correct":[145],"reconstruct":[148],"near-real":[150],"smooth":[151],"audio.Extensive":[152],"experiments":[153],"on":[154],"Challenge":[157],"dataset":[158],"demonstrate":[159],"that":[160],"proposed":[162],"method":[163],"yields":[164],"promising":[165],"performance":[166],"terms":[168],"quality,":[171],"intelligibility,":[172],"PLCMOS.":[174]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":6}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
