{"id":"https://openalex.org/W7154445728","doi":"https://doi.org/10.1007/s11227-026-08481-x","title":"A multi-stage convolutional and self-attention architecture for high-precision sign language gesture recognition","display_name":"A multi-stage convolutional and self-attention architecture for high-precision sign language gesture recognition","publication_year":2026,"publication_date":"2026-04-16","ids":{"openalex":"https://openalex.org/W7154445728","doi":"https://doi.org/10.1007/s11227-026-08481-x"},"language":"en","primary_location":{"id":"doi:10.1007/s11227-026-08481-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11227-026-08481-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11227-026-08481-x.pdf","source":{"id":"https://openalex.org/S32326811","display_name":"The Journal of Supercomputing","issn_l":"0920-8542","issn":["0920-8542","1573-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Journal of Supercomputing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s11227-026-08481-x.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036652938","display_name":"Ahmed KASAPBA\u015eI","orcid":"https://orcid.org/0000-0003-2383-1774"},"institutions":[{"id":"https://openalex.org/I149218525","display_name":"Ankara University","ror":"https://ror.org/01wntqw50","country_code":"TR","type":"education","lineage":["https://openalex.org/I149218525"]},{"id":"https://openalex.org/I4210145505","display_name":"University of Turkish Aeronautical Association","ror":"https://ror.org/055p14r26","country_code":"TR","type":"education","lineage":["https://openalex.org/I4210145505"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"Ahmed Kasapba\u015f\u0131","raw_affiliation_strings":["Department of Electrical and Electronics Engineering, Faculty of Engineering, Turkish Aeronautical Association University, Ankara, Turkey","Department of Electrical and Electronics Engineering, Graduate School of Natural and Applied Sciences, Ankara Y\u0131ld\u0131r\u0131m Beyaz\u0131t University, Ankara, Turkey"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Electronics Engineering, Faculty of Engineering, Turkish Aeronautical Association University, Ankara, Turkey","institution_ids":["https://openalex.org/I4210145505"]},{"raw_affiliation_string":"Department of Electrical and Electronics Engineering, Graduate School of Natural and Applied Sciences, Ankara Y\u0131ld\u0131r\u0131m Beyaz\u0131t University, Ankara, Turkey","institution_ids":["https://openalex.org/I149218525"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002143603","display_name":"H\u00fcseyin Canbolat","orcid":"https://orcid.org/0000-0002-2577-0517"},"institutions":[{"id":"https://openalex.org/I149218525","display_name":"Ankara University","ror":"https://ror.org/01wntqw50","country_code":"TR","type":"education","lineage":["https://openalex.org/I149218525"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"H\u00fcseyin Canbolat","raw_affiliation_strings":["Department of Electrical and Electronics Engineering, Graduate School of Natural and Applied Sciences, Ankara Y\u0131ld\u0131r\u0131m Beyaz\u0131t University, Ankara, Turkey"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Electronics Engineering, Graduate School of Natural and Applied Sciences, Ankara Y\u0131ld\u0131r\u0131m Beyaz\u0131t University, Ankara, Turkey","institution_ids":["https://openalex.org/I149218525"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5036652938"],"corresponding_institution_ids":["https://openalex.org/I149218525","https://openalex.org/I4210145505"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.65490654,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"82","issue":"6","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9473000168800354,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9473000168800354,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.009399999864399433,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10789","display_name":"Interactive and Immersive Displays","score":0.007400000002235174,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6133999824523926},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5565999746322632},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5156999826431274},{"id":"https://openalex.org/keywords/gesture-recognition","display_name":"Gesture recognition","score":0.4803999960422516},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.438400000333786},{"id":"https://openalex.org/keywords/sign-language","display_name":"Sign language","score":0.4377000033855438},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.40869998931884766},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4058000147342682},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.359499990940094}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9301999807357788},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6133999824523926},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5565999746322632},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.555400013923645},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5156999826431274},{"id":"https://openalex.org/C159437735","wikidata":"https://www.wikidata.org/wiki/Q1519524","display_name":"Gesture recognition","level":3,"score":0.4803999960422516},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.438400000333786},{"id":"https://openalex.org/C522192633","wikidata":"https://www.wikidata.org/wiki/Q34228","display_name":"Sign language","level":2,"score":0.4377000033855438},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.41760000586509705},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.40869998931884766},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4058000147342682},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.359499990940094},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.3594000041484833},{"id":"https://openalex.org/C207347870","wikidata":"https://www.wikidata.org/wiki/Q371174","display_name":"Gesture","level":2,"score":0.3580999970436096},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.3452000021934509},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.3165999948978424},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3138999938964844},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.29809999465942383},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.29089999198913574},{"id":"https://openalex.org/C46743427","wikidata":"https://www.wikidata.org/wiki/Q1341685","display_name":"Inference engine","level":3,"score":0.28360000252723694},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2786000072956085},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.27730000019073486},{"id":"https://openalex.org/C119898033","wikidata":"https://www.wikidata.org/wiki/Q3433888","display_name":"Ensemble forecasting","level":2,"score":0.2612000107765198},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.26109999418258667},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s11227-026-08481-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11227-026-08481-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11227-026-08481-x.pdf","source":{"id":"https://openalex.org/S32326811","display_name":"The Journal of Supercomputing","issn_l":"0920-8542","issn":["0920-8542","1573-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Journal of Supercomputing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s11227-026-08481-x","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s11227-026-08481-x","pdf_url":"https://link.springer.com/content/pdf/10.1007/s11227-026-08481-x.pdf","source":{"id":"https://openalex.org/S32326811","display_name":"The Journal of Supercomputing","issn_l":"0920-8542","issn":["0920-8542","1573-0484"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Journal of Supercomputing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322626","display_name":"T\u00fcrkiye Bilimsel ve Teknolojik Ara\u015ft\u0131rma Kurumu","ror":"https://ror.org/04w9kkr77"},{"id":"https://openalex.org/F4320328664","display_name":"Ankara Y\u0131ld\u0131r\u0131m Beyaz\u0131t \u00dcniversitesi","ror":"https://ror.org/05ryemn72"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7154445728.pdf","grobid_xml":"https://content.openalex.org/works/W7154445728.grobid-xml"},"referenced_works_count":41,"referenced_works":["https://openalex.org/W1815076433","https://openalex.org/W2604319603","https://openalex.org/W2908510526","https://openalex.org/W2963263347","https://openalex.org/W3094502228","https://openalex.org/W3118895004","https://openalex.org/W3135806226","https://openalex.org/W3176939804","https://openalex.org/W4213009331","https://openalex.org/W4223508653","https://openalex.org/W4285803147","https://openalex.org/W4287116734","https://openalex.org/W4292367319","https://openalex.org/W4313855689","https://openalex.org/W4364295729","https://openalex.org/W4366261916","https://openalex.org/W4377699816","https://openalex.org/W4385555931","https://openalex.org/W4386002145","https://openalex.org/W4386498661","https://openalex.org/W4386522975","https://openalex.org/W4387741492","https://openalex.org/W4387819708","https://openalex.org/W4388918639","https://openalex.org/W4388942030","https://openalex.org/W4391930075","https://openalex.org/W4392513657","https://openalex.org/W4393260972","https://openalex.org/W4396856847","https://openalex.org/W4399897860","https://openalex.org/W4400779880","https://openalex.org/W4401914580","https://openalex.org/W4402523417","https://openalex.org/W4404491874","https://openalex.org/W4404494741","https://openalex.org/W4406612611","https://openalex.org/W4406897873","https://openalex.org/W4407252492","https://openalex.org/W4411453131","https://openalex.org/W4412063422","https://openalex.org/W7081948296"],"related_works":[],"abstract_inverted_index":{"Abstract":[0],"This":[1],"paper":[2],"presents":[3],"a":[4,203],"novel":[5],"composite":[6],"architecture":[7,184],"for":[8,139],"high-precision":[9],"sign":[10],"language":[11],"gesture":[12],"recognition":[13],"referred":[14],"to":[15,28,117,225],"as":[16,145],"ViTSLA.":[17],"The":[18,199,213],"model":[19,201],"integrates":[20],"convolutional":[21],"inductive":[22],"bias":[23],"with":[24,65,194],"transformer-based":[25],"global":[26],"attention":[27,93],"improve":[29],"predictive":[30,77,187],"accuracy":[31,62],"and":[32,47,72,87,95,101,112,122,148,158,171,210,228],"computational":[33,83,102,191,211],"efficiency.":[34],"Extensive":[35],"experiments":[36],"are":[37],"conducted":[38],"on":[39],"three":[40],"datasets":[41],"using":[42],"five-fold":[43],"cross-validation,":[44],"ablation":[45],"analysis,":[46],"comparative":[48],"evaluation":[49],"against":[50],"standard":[51],"vision":[52,197,246],"transformer":[53],"(ViT)":[54],"variants.":[55],"Experimental":[56],"results":[57,179,214],"demonstrate":[58,180,215],"consistently":[59],"high":[60,172,186],"classification":[61],"exceeding":[63],"99.5%":[64],"minimal":[66],"variance":[67],"across":[68,161],"folds,":[69],"confirming":[70],"robustness":[71],"balanced":[73],"class-wise":[74],"performance.":[75,230],"Beyond":[76],"performance,":[78],"this":[79],"work":[80],"addresses":[81],"the":[82,164,182,234,237,241],"demands":[84],"of":[85,236,243],"training":[86,106,157],"deploying":[88],"hybrid":[89,217],"deep":[90],"architectures.":[91],"Transformer-based":[92],"mechanisms":[94],"high-resolution":[96],"tokenization":[97],"increase":[98],"memory":[99],"consumption":[100],"complexity.":[103],"Therefore,":[104],"efficient":[105],"requires":[107],"parallel":[108],"processing,":[109],"GPU":[110],"acceleration,":[111],"high-performance":[113],"computing":[114],"(HPC)":[115],"environments":[116],"handle":[118],"large-scale":[119],"tensor":[120],"operations":[121],"multi-fold":[123],"cross-validation":[124],"experiments.":[125],"Furthermore,":[126],"real-time":[127,175],"inference":[128],"capability":[129],"is":[130,137],"maintained":[131],"at":[132],"over":[133],"300":[134],"FPS,":[135],"which":[136],"essential":[138],"deployment":[140,176],"in":[141],"latency-sensitive":[142],"applications":[143],"such":[144],"interactive":[146],"systems":[147],"intelligent":[149,196,245],"human\u2013computer":[150],"interfaces.":[151],"Distributed":[152],"computation":[153],"further":[154],"enables":[155],"scalable":[156,226],"stable":[159,168],"convergence":[160],"datasets.":[162],"Moreover,":[163],"low":[165],"mean":[166],"latency,":[167],"P95":[169],"behavior,":[170],"throughput":[173],"confirm":[174],"capability.":[177],"These":[178,231],"that":[181,216],"proposed":[183,238],"achieves":[185,202],"performance":[188],"while":[189],"maintaining":[190],"characteristics":[192],"aligned":[193],"supercomputing-driven":[195,244],"systems.":[198,247],"developed":[200],"favorable":[204],"balance":[205],"between":[206],"accuracy,":[207],"parameter":[208],"efficiency,":[209],"cost.":[212],"convolutional-attention":[218],"architectures":[219],"benefit":[220],"from":[221],"HPC-enabled":[222],"parallelism,":[223],"leading":[224],"optimization":[227],"deployment-ready":[229],"findings":[232],"establish":[233],"relevance":[235],"approach":[239],"within":[240],"domain":[242]},"counts_by_year":[],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2026-04-16T00:00:00"}
