{"id":"https://openalex.org/W3206301866","doi":"https://doi.org/10.1145/3474085.3475463","title":"Towards Fast and High-Quality Sign Language Production","display_name":"Towards Fast and High-Quality Sign Language Production","publication_year":2021,"publication_date":"2021-10-17","ids":{"openalex":"https://openalex.org/W3206301866","doi":"https://doi.org/10.1145/3474085.3475463","mag":"3206301866"},"language":"en","primary_location":{"id":"doi:10.1145/3474085.3475463","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475463","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072986859","display_name":"Wencan Huang","orcid":"https://orcid.org/0000-0002-1555-3674"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wencan Huang","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058982791","display_name":"Wenwen Pan","orcid":"https://orcid.org/0000-0003-4300-7694"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenwen Pan","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079260216","display_name":"Zhou Zhao","orcid":"https://orcid.org/0000-0001-6121-0384"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhou Zhao","raw_affiliation_strings":["Zhejiang University, Hangzhou, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100393506","display_name":"Qi Tian","orcid":"https://orcid.org/0000-0002-7252-5047"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Tian","raw_affiliation_strings":["Huawei Cloud &amp; AI, Shenzhen, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Huawei Cloud &amp; AI, Shenzhen, China","institution_ids":["https://openalex.org/I2250955327"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5072986859"],"corresponding_institution_ids":["https://openalex.org/I76130692"],"apc_list":null,"apc_paid":null,"fwci":1.9713,"has_fulltext":false,"cited_by_count":36,"citation_normalized_percentile":{"value":0.86310884,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"3172","last_page":"3181"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11285","display_name":"Hearing Impairment and Communication","score":0.9800000190734863,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7963889837265015},{"id":"https://openalex.org/keywords/autoregressive-model","display_name":"Autoregressive model","score":0.6657612323760986},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5381781458854675},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4874594211578369},{"id":"https://openalex.org/keywords/sign-language","display_name":"Sign language","score":0.47572019696235657},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.41229814291000366},{"id":"https://openalex.org/keywords/sign","display_name":"Sign (mathematics)","score":0.4113216996192932},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3872326910495758},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3634818196296692},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3290271759033203},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10458624362945557}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7963889837265015},{"id":"https://openalex.org/C159877910","wikidata":"https://www.wikidata.org/wiki/Q2202883","display_name":"Autoregressive model","level":2,"score":0.6657612323760986},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5381781458854675},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4874594211578369},{"id":"https://openalex.org/C522192633","wikidata":"https://www.wikidata.org/wiki/Q34228","display_name":"Sign language","level":2,"score":0.47572019696235657},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.41229814291000366},{"id":"https://openalex.org/C139676723","wikidata":"https://www.wikidata.org/wiki/Q1193832","display_name":"Sign (mathematics)","level":2,"score":0.4113216996192932},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3872326910495758},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3634818196296692},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3290271759033203},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10458624362945557},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3474085.3475463","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3474085.3475463","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.6600000262260437}],"awards":[{"id":"https://openalex.org/G3846515262","display_name":null,"funder_award_id":"2020YFC0832505","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G755000837","display_name":null,"funder_award_id":"61836002,62072397,62077041","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W116902681","https://openalex.org/W1568066624","https://openalex.org/W1579853615","https://openalex.org/W1735317348","https://openalex.org/W1828163288","https://openalex.org/W1924770834","https://openalex.org/W2031334527","https://openalex.org/W2064675550","https://openalex.org/W2066601700","https://openalex.org/W2124934925","https://openalex.org/W2130942839","https://openalex.org/W2139359116","https://openalex.org/W2146502635","https://openalex.org/W2172140247","https://openalex.org/W2188882108","https://openalex.org/W2250342921","https://openalex.org/W2542835211","https://openalex.org/W2606862842","https://openalex.org/W2747329762","https://openalex.org/W2759302818","https://openalex.org/W2781902187","https://openalex.org/W2784435047","https://openalex.org/W2799020610","https://openalex.org/W2887738788","https://openalex.org/W2888163892","https://openalex.org/W2950304420","https://openalex.org/W2962730651","https://openalex.org/W2962795401","https://openalex.org/W2963076818","https://openalex.org/W2963403868","https://openalex.org/W2963684088","https://openalex.org/W2964199361","https://openalex.org/W2964308564","https://openalex.org/W2966391918","https://openalex.org/W2970730223","https://openalex.org/W2981618422","https://openalex.org/W2983796203","https://openalex.org/W2997573805","https://openalex.org/W2998508934","https://openalex.org/W3004835408","https://openalex.org/W3010590357","https://openalex.org/W3024396289","https://openalex.org/W3024732798","https://openalex.org/W3026874504","https://openalex.org/W3034363136","https://openalex.org/W3034765865","https://openalex.org/W3035490389","https://openalex.org/W3040942941","https://openalex.org/W3043621996","https://openalex.org/W3093337631","https://openalex.org/W3103017991","https://openalex.org/W3109174848","https://openalex.org/W3126473778","https://openalex.org/W3130016944","https://openalex.org/W4249279697","https://openalex.org/W4391156274"],"related_works":["https://openalex.org/W2953234277","https://openalex.org/W2626256601","https://openalex.org/W147410782","https://openalex.org/W2900413183","https://openalex.org/W4390975304","https://openalex.org/W3022252430","https://openalex.org/W4287804464","https://openalex.org/W3103989898","https://openalex.org/W3211292372","https://openalex.org/W1989687946"],"abstract_inverted_index":{"Sign":[0],"Language":[1],"Production":[2],"(SLP)":[3],"aims":[4],"to":[5,12,24,64,136,142,170],"automatically":[6],"translate":[7],"a":[8,93,99,133,160],"spoken":[9],"language":[10,16],"description":[11],"its":[13],"corresponding":[14],"sign":[15,26,30,149,154,176],"video.":[17],"The":[18],"core":[19],"procedure":[20],"of":[21,146,196],"SLP":[22],"is":[23,130],"transform":[25],"gloss":[27,126,140],"intermediaries":[28],"into":[29],"pose":[31,52,150,155,164,177],"sequences":[32],"(G2P).":[33],"Most":[34],"existing":[35],"methods":[36],"for":[37,109,125,152],"G2P":[38],"are":[39,62,83],"based":[40],"on":[41,55,182],"sequential":[42],"autoregression":[43],"or":[44],"sequence-to-sequence":[45],"encoder-decoder":[46],"learning.":[47,112],"However,":[48],"by":[49,86,121,132],"generating":[50],"target":[51,148],"frames":[53],"conditioned":[54],"the":[56,118,138,144,147,167],"previously":[57],"generated":[58],"ones,":[59],"these":[60],"models":[61,193],"prone":[63],"bringing":[65],"issues":[66,82],"such":[67,81],"as":[68,103,105],"error":[69],"accumulation":[70],"and":[71,173,198],"high":[72],"inference":[73],"latency.":[74],"In":[75],"this":[76],"paper,":[77],"we":[78,91,114,158],"argue":[79],"that":[80,186],"mainly":[84],"caused":[85],"adopting":[87],"autoregressive":[88,192],"manner.":[89],"Hence,":[90],"propose":[92],"novel":[94],"Non-AuToregressive":[95],"(NAT)":[96],"model":[97,169,189],"with":[98],"parallel":[100,153],"decoding":[101],"scheme,":[102],"well":[104],"an":[106],"External":[107],"Aligner":[108],"sequence":[110,141,151],"alignment":[111,123],"Specifically,":[113],"extract":[115],"alignments":[116],"from":[117],"external":[119],"aligner":[120],"monotonic":[122],"search":[124],"duration":[127],"prediction,":[128],"which":[129],"used":[131],"length":[134,145],"regulator":[135],"expand":[137],"source":[139],"match":[143],"generation.":[156],"Furthermore,":[157],"devise":[159],"spatial-temporal":[161],"graph":[162],"convolutional":[163],"generator":[165],"in":[166,194],"NAT":[168],"generate":[171],"smoother":[172],"more":[174],"natural":[175],"sequences.":[178],"Extensive":[179],"experiments":[180],"conducted":[181],"PHOENIX14T":[183],"dataset":[184],"show":[185],"our":[187],"proposed":[188],"outperforms":[190],"state-of-the-art":[191],"terms":[195],"speed":[197],"quality.":[199]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":18},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":1}],"updated_date":"2026-05-08T15:41:06.802602","created_date":"2025-10-10T00:00:00"}
