{"id":"https://openalex.org/W3009828227","doi":"https://doi.org/10.1109/wacv45572.2020.9093512","title":"Word-level Deep Sign Language Recognition from Video: A New Large-scale Dataset and Methods Comparison","display_name":"Word-level Deep Sign Language Recognition from Video: A New Large-scale Dataset and Methods Comparison","publication_year":2020,"publication_date":"2020-03-01","ids":{"openalex":"https://openalex.org/W3009828227","doi":"https://doi.org/10.1109/wacv45572.2020.9093512","mag":"3009828227"},"language":"en","primary_location":{"id":"doi:10.1109/wacv45572.2020.9093512","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv45572.2020.9093512","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100386792","display_name":"Dongxu Li","orcid":"https://orcid.org/0000-0001-8543-4761"},"institutions":[{"id":"https://openalex.org/I4210127558","display_name":"Australian Centre for Robotic Vision","ror":"https://ror.org/02zv9xv82","country_code":"AU","type":"facility","lineage":["https://openalex.org/I4210127558"]},{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]}],"countries":["AU"],"is_corresponding":true,"raw_author_name":"Dongxu Li","raw_affiliation_strings":["Australian Centre for Robotic Vision (ACRV), The Australian National University"],"affiliations":[{"raw_affiliation_string":"Australian Centre for Robotic Vision (ACRV), The Australian National University","institution_ids":["https://openalex.org/I4210127558","https://openalex.org/I118347636"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042672522","display_name":"Cristian Rodriguez Opazo","orcid":null},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]},{"id":"https://openalex.org/I4210127558","display_name":"Australian Centre for Robotic Vision","ror":"https://ror.org/02zv9xv82","country_code":"AU","type":"facility","lineage":["https://openalex.org/I4210127558"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Cristian Rodriguez Opazo","raw_affiliation_strings":["Australian Centre for Robotic Vision (ACRV), The Australian National University"],"affiliations":[{"raw_affiliation_string":"Australian Centre for Robotic Vision (ACRV), The Australian National University","institution_ids":["https://openalex.org/I4210127558","https://openalex.org/I118347636"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003076238","display_name":"Xin Yu","orcid":"https://orcid.org/0000-0002-0269-5649"},"institutions":[{"id":"https://openalex.org/I4210127558","display_name":"Australian Centre for Robotic Vision","ror":"https://ror.org/02zv9xv82","country_code":"AU","type":"facility","lineage":["https://openalex.org/I4210127558"]},{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Xin Yu","raw_affiliation_strings":["Australian Centre for Robotic Vision (ACRV), The Australian National University"],"affiliations":[{"raw_affiliation_string":"Australian Centre for Robotic Vision (ACRV), The Australian National University","institution_ids":["https://openalex.org/I4210127558","https://openalex.org/I118347636"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101819061","display_name":"Hongdong Li","orcid":"https://orcid.org/0000-0003-4125-1554"},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]},{"id":"https://openalex.org/I4210127558","display_name":"Australian Centre for Robotic Vision","ror":"https://ror.org/02zv9xv82","country_code":"AU","type":"facility","lineage":["https://openalex.org/I4210127558"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Hongdong Li","raw_affiliation_strings":["Australian Centre for Robotic Vision (ACRV), The Australian National University"],"affiliations":[{"raw_affiliation_string":"Australian Centre for Robotic Vision (ACRV), The Australian National University","institution_ids":["https://openalex.org/I4210127558","https://openalex.org/I118347636"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100386792"],"corresponding_institution_ids":["https://openalex.org/I118347636","https://openalex.org/I4210127558"],"apc_list":null,"apc_paid":null,"fwci":43.7604,"has_fulltext":false,"cited_by_count":553,"citation_normalized_percentile":{"value":0.99954065,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1448","last_page":"1458"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11285","display_name":"Hearing Impairment and Communication","score":0.9850999712944031,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8573026657104492},{"id":"https://openalex.org/keywords/sign-language","display_name":"Sign language","score":0.6603907942771912},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6319315433502197},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.624015212059021},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5762655735015869},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.548907995223999},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.5265179872512817},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5015454292297363},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4834385812282562},{"id":"https://openalex.org/keywords/american-sign-language","display_name":"American Sign Language","score":0.4780607521533966},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.47134894132614136},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.46406373381614685},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.442434161901474},{"id":"https://openalex.org/keywords/sign","display_name":"Sign (mathematics)","score":0.426065057516098},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3290383219718933},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32058799266815186}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8573026657104492},{"id":"https://openalex.org/C522192633","wikidata":"https://www.wikidata.org/wiki/Q34228","display_name":"Sign language","level":2,"score":0.6603907942771912},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6319315433502197},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.624015212059021},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5762655735015869},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.548907995223999},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.5265179872512817},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5015454292297363},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4834385812282562},{"id":"https://openalex.org/C2776737515","wikidata":"https://www.wikidata.org/wiki/Q14759","display_name":"American Sign Language","level":3,"score":0.4780607521533966},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.47134894132614136},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.46406373381614685},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.442434161901474},{"id":"https://openalex.org/C139676723","wikidata":"https://www.wikidata.org/wiki/Q1193832","display_name":"Sign (mathematics)","level":2,"score":0.426065057516098},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3290383219718933},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32058799266815186},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/wacv45572.2020.9093512","is_oa":false,"landing_page_url":"https://doi.org/10.1109/wacv45572.2020.9093512","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE Winter Conference on Applications of Computer Vision (WACV)","raw_type":"proceedings-article"},{"id":"pmh:oai:digital.library.adelaide.edu.au:2440/133224","is_oa":false,"landing_page_url":"https://hdl.handle.net/2440/133224","pdf_url":null,"source":{"id":"https://openalex.org/S4306401835","display_name":"Adelaide Research & Scholarship (AR&S) (University of Adelaide)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I5681781","host_organization_name":"The University of Adelaide","host_organization_lineage":["https://openalex.org/I5681781"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://ieeexplore.ieee.org/","raw_type":"Conference paper"},{"id":"pmh:oai:openresearch-repository.anu.edu.au:1885/311627","is_oa":false,"landing_page_url":"http://hdl.handle.net/1885/311627","pdf_url":null,"source":{"id":"https://openalex.org/S4306402539","display_name":"ANU Open Research (Australian National University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I118347636","host_organization_name":"Australian National University","host_organization_lineage":["https://openalex.org/I118347636"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2020 IEEE Winter Conference on Applications of Computer Vision (WACV)","raw_type":"Conference paper"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8100000023841858,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":94,"referenced_works":["https://openalex.org/W24089286","https://openalex.org/W276105310","https://openalex.org/W328363538","https://openalex.org/W1506441995","https://openalex.org/W1522301498","https://openalex.org/W1522734439","https://openalex.org/W1547391644","https://openalex.org/W1579818084","https://openalex.org/W1586730761","https://openalex.org/W1639784222","https://openalex.org/W1686810756","https://openalex.org/W1923404803","https://openalex.org/W1927052826","https://openalex.org/W1947481528","https://openalex.org/W1969724184","https://openalex.org/W1972034101","https://openalex.org/W1983364832","https://openalex.org/W1993229407","https://openalex.org/W1994529670","https://openalex.org/W2020163092","https://openalex.org/W2034014085","https://openalex.org/W2072096818","https://openalex.org/W2081983669","https://openalex.org/W2096733369","https://openalex.org/W2097117768","https://openalex.org/W2097151019","https://openalex.org/W2100526149","https://openalex.org/W2107603586","https://openalex.org/W2108274355","https://openalex.org/W2108333036","https://openalex.org/W2113325037","https://openalex.org/W2117539524","https://openalex.org/W2118244636","https://openalex.org/W2126179605","https://openalex.org/W2126574503","https://openalex.org/W2134983583","https://openalex.org/W2139857301","https://openalex.org/W2142194269","https://openalex.org/W2146221819","https://openalex.org/W2154790436","https://openalex.org/W2156303437","https://openalex.org/W2157331557","https://openalex.org/W2161755782","https://openalex.org/W2161969291","https://openalex.org/W2167876098","https://openalex.org/W2318037154","https://openalex.org/W2330154883","https://openalex.org/W2342890612","https://openalex.org/W2401084598","https://openalex.org/W2464305746","https://openalex.org/W2485310399","https://openalex.org/W2559085405","https://openalex.org/W2745933219","https://openalex.org/W2770128248","https://openalex.org/W2779380177","https://openalex.org/W2783892510","https://openalex.org/W2796347433","https://openalex.org/W2897163805","https://openalex.org/W2897208343","https://openalex.org/W2899768692","https://openalex.org/W2903314716","https://openalex.org/W2943447287","https://openalex.org/W2946677207","https://openalex.org/W2950339701","https://openalex.org/W2954798773","https://openalex.org/W2962730651","https://openalex.org/W2963065614","https://openalex.org/W2963474899","https://openalex.org/W2963524571","https://openalex.org/W2964105113","https://openalex.org/W2964121744","https://openalex.org/W2964203186","https://openalex.org/W3022360907","https://openalex.org/W3027573219","https://openalex.org/W3099206234","https://openalex.org/W4253468347","https://openalex.org/W4285719527","https://openalex.org/W4293584584","https://openalex.org/W6600983433","https://openalex.org/W6610312258","https://openalex.org/W6631190155","https://openalex.org/W6634737339","https://openalex.org/W6635099914","https://openalex.org/W6636759891","https://openalex.org/W6637373629","https://openalex.org/W6640257725","https://openalex.org/W6640295108","https://openalex.org/W6675871991","https://openalex.org/W6682864246","https://openalex.org/W6747909800","https://openalex.org/W6750227808","https://openalex.org/W6756633688","https://openalex.org/W6756891207","https://openalex.org/W6987011541"],"related_works":["https://openalex.org/W2089405242","https://openalex.org/W2004685257","https://openalex.org/W1977288663","https://openalex.org/W2115068291","https://openalex.org/W3010360921","https://openalex.org/W2100673443","https://openalex.org/W2897666773","https://openalex.org/W2226154349","https://openalex.org/W2963075127","https://openalex.org/W2947981379"],"abstract_inverted_index":{"Vision-based":[0],"sign":[1,17,94,115],"language":[2,18],"recognition":[3,95,116],"aims":[4],"at":[5,206,228],"helping":[6],"the":[7,30,77,86,154,186,189,213],"deaf":[8],"people":[9],"to":[10,22,29,76,91,106,204],"communicate":[11],"with":[12,108],"others.":[13],"However,":[14],"most":[15],"existing":[16],"datasets":[19,38],"are":[20,104,148,226],"limited":[21,31],"a":[23,49,163],"small":[24],"number":[25],"of":[26,188,217],"words.":[27],"Due":[28],"vocabulary":[32],"size,":[33],"models":[34,147,199,225],"learned":[35],"from":[36],"those":[37],"cannot":[39],"be":[40,72],"applied":[41],"in":[42,121,177],"practice.":[43],"In":[44],"this":[45,99],"paper,":[46],"we":[47,103,126,160],"introduce":[48],"new":[50,100],"large-scale":[51,101],"Word-Level":[52],"American":[53],"Sign":[54],"Language":[55],"(WLASL)":[56],"video":[57],"dataset,":[58,102],"containing":[59],"more":[60],"than":[61],"2000":[62],"words":[63],"performed":[64],"by":[65,84],"over":[66],"100":[67],"signers.":[68],"This":[69],"dataset":[70,90,221],"will":[71,152],"made":[73],"publicly":[74],"available":[75,227],"research":[78],"community.":[79],"To":[80],"our":[81,218],"knowledge,it":[82],"is":[83],"far":[85],"largest":[87],"public":[88],"ASL":[89],"facilitate":[92],"word-level":[93,114],"research.":[96],"Based":[97],"on":[98,209],"able":[105],"experiment":[107],"several":[109],"deep":[110,224],"learning":[111],"methods":[112],"for":[113,156],"and":[117,128,139,174,197,215,222],"evaluate":[118],"their":[119],"performances":[120,202],"large":[122],"scale":[123],"scenarios.":[124],"Specifically":[125],"implement":[127],"compare":[129],"two":[130],"different":[131],"models,i.e.,":[132],"(i)":[133],"holistic":[134],"visual":[135],"appearance":[136],"based":[137,144],"approach,":[138],"(ii)":[140],"2D":[141],"human":[142,178],"pose":[143,179],"approach.":[145],"Both":[146],"valuable":[149],"baselines":[150],"that":[151,171,195],"benefit":[153],"community":[155],"method":[157],"benchmarking.":[158],"Moreover,":[159],"also":[161],"propose":[162],"novel":[164],"pose-based":[165,190,196],"temporal":[166,175],"graph":[167],"convolution":[168],"networks":[169],"(Pose-TGCN)":[170],"model":[172],"spatial":[173],"dependencies":[176],"trajectories":[180],"simultaneously,":[181],"which":[182],"has":[183],"further":[184],"boosted":[185],"performance":[187],"method.":[191],"Our":[192,220],"results":[193],"show":[194],"appearance-based":[198],"achieve":[200],"comparable":[201],"up":[203],"62.63%":[205],"top-10":[207],"accuracy":[208],"2,000":[210],"words/glosses,":[211],"demonstrating":[212],"validity":[214],"challenges":[216],"dataset.":[219],"baseline":[223],"https://dxli94.github.io/WLASL/.":[229]},"counts_by_year":[{"year":2026,"cited_by_count":18},{"year":2025,"cited_by_count":128},{"year":2024,"cited_by_count":119},{"year":2023,"cited_by_count":118},{"year":2022,"cited_by_count":81},{"year":2021,"cited_by_count":69},{"year":2020,"cited_by_count":20}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
