{"id":"https://openalex.org/W4407692820","doi":"https://doi.org/10.1109/iceic64972.2025.10879747","title":"Segmentation and Recognition of Japanese Sign Language Syllables Using Frame Clustering in Video","display_name":"Segmentation and Recognition of Japanese Sign Language Syllables Using Frame Clustering in Video","publication_year":2025,"publication_date":"2025-01-19","ids":{"openalex":"https://openalex.org/W4407692820","doi":"https://doi.org/10.1109/iceic64972.2025.10879747"},"language":"en","primary_location":{"id":"doi:10.1109/iceic64972.2025.10879747","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iceic64972.2025.10879747","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Electronics, Information, and Communication (ICEIC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5095378514","display_name":"Tamon Kondo","orcid":"https://orcid.org/0009-0006-4394-4417"},"institutions":[{"id":"https://openalex.org/I31618427","display_name":"Tokyo Polytechnic University","ror":"https://ror.org/035kpke84","country_code":"JP","type":"education","lineage":["https://openalex.org/I31618427"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Tamon Kondo","raw_affiliation_strings":["Tokyo Polytechnic University,Graduate School of Engineering,Atsugi, Kanagawa,Japan"],"affiliations":[{"raw_affiliation_string":"Tokyo Polytechnic University,Graduate School of Engineering,Atsugi, Kanagawa,Japan","institution_ids":["https://openalex.org/I31618427"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000460972","display_name":"Ryota Murai","orcid":null},"institutions":[{"id":"https://openalex.org/I31618427","display_name":"Tokyo Polytechnic University","ror":"https://ror.org/035kpke84","country_code":"JP","type":"education","lineage":["https://openalex.org/I31618427"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Ryota Murai","raw_affiliation_strings":["Tokyo Polytechnic University,Dept. of Engineering,Atsugi, Kanagawa,Japan"],"affiliations":[{"raw_affiliation_string":"Tokyo Polytechnic University,Dept. of Engineering,Atsugi, Kanagawa,Japan","institution_ids":["https://openalex.org/I31618427"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030887727","display_name":"Yousun Kang","orcid":null},"institutions":[{"id":"https://openalex.org/I31618427","display_name":"Tokyo Polytechnic University","ror":"https://ror.org/035kpke84","country_code":"JP","type":"education","lineage":["https://openalex.org/I31618427"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yousun Kang","raw_affiliation_strings":["Tokyo Polytechnic University,Faculty of Engineering,Atsugi, Kanagawa,Japan"],"affiliations":[{"raw_affiliation_string":"Tokyo Polytechnic University,Faculty of Engineering,Atsugi, Kanagawa,Japan","institution_ids":["https://openalex.org/I31618427"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5095378514"],"corresponding_institution_ids":["https://openalex.org/I31618427"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.02274038,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13310","display_name":"Subtitles and Audiovisual Media","score":0.9336000084877014,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11285","display_name":"Hearing Impairment and Communication","score":0.916700005531311,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8117589354515076},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6767352819442749},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.64250648021698},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.6360306143760681},{"id":"https://openalex.org/keywords/sign-language","display_name":"Sign language","score":0.6114984154701233},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5319312810897827},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.4997844696044922},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.36588054895401},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3347676396369934},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.16674137115478516},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.07754993438720703}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8117589354515076},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6767352819442749},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.64250648021698},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.6360306143760681},{"id":"https://openalex.org/C522192633","wikidata":"https://www.wikidata.org/wiki/Q34228","display_name":"Sign language","level":2,"score":0.6114984154701233},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5319312810897827},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.4997844696044922},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.36588054895401},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3347676396369934},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.16674137115478516},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.07754993438720703},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iceic64972.2025.10879747","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iceic64972.2025.10879747","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Electronics, Information, and Communication (ICEIC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":4,"referenced_works":["https://openalex.org/W2782242894","https://openalex.org/W2809707231","https://openalex.org/W4323570550","https://openalex.org/W4401754348"],"related_works":["https://openalex.org/W4298130764","https://openalex.org/W2804364458","https://openalex.org/W4379621602","https://openalex.org/W4294690766","https://openalex.org/W2132641928","https://openalex.org/W4310225030","https://openalex.org/W2159815235","https://openalex.org/W2090259340","https://openalex.org/W3204710839","https://openalex.org/W1926736923"],"abstract_inverted_index":{"This":[0],"research":[1],"aims":[2],"to":[3,164],"develop":[4],"a":[5,15,35,114],"method":[6,94,112],"for":[7,130,138],"recognizing":[8],"sign":[9,22,37],"language":[10,23,38],"gestures":[11,121,132],"from":[12],"video,":[13],"with":[14,97,125],"focus":[16,154],"on":[17,26,34,155],"segmenting":[18,119],"and":[19,40,62,77,133,146,150,159],"identifying":[20],"individual":[21],"characters.":[24],"Building":[25],"previous":[27],"work,":[28],"the":[29,49,92,110,157],"proposed":[30],"model":[31],"was":[32,80],"trained":[33,83],"Japanese":[36],"dataset":[39,158],"evaluated":[41],"using":[42,55,82],"videos":[43],"of":[44,105,128],"an":[45,102,126],"experienced":[46],"signer":[47],"performing":[48],"gestures.":[50],"Gesture":[51],"features":[52],"were":[53,75],"extracted":[54],"Mediapipe,":[56],"capturing":[57],"40":[58],"finger":[59,168],"joint":[60],"angles":[61],"hand":[63],"tilt":[64],"measurements.":[65],"To":[66],"detect":[67],"transitions":[68],"between":[69],"syllables,":[70],"several":[71],"change-point":[72],"detection":[73],"methods":[74],"applied,":[76],"character":[78,99],"recognition":[79],"performed":[81],"Vision":[84],"Transformer":[85],"(ViT)":[86],"models.":[87],"Experimental":[88],"results":[89],"indicated":[90],"that":[91],"PELT":[93],"had":[95],"difficulties":[96],"accurate":[98],"segmentation,":[100],"achieving":[101],"overall":[103],"accuracy":[104,127],"only":[106],"31.7%.":[107],"In":[108],"contrast,":[109],"BottomUp":[111],"achieved":[113],"100%":[115],"success":[116],"rate":[117],"in":[118],"textbook":[120,131],"under":[122],"specific":[123],"conditions,":[124],"44.4%":[129],"37.0%":[134],"overall.":[135],"Challenges":[136],"remain":[137],"characters":[139],"such":[140],"as":[141],"<tex":[142,147],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[143,148],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$^{\\prime\\prime}\\mathcal{D}":[144],"(\\text{no})^{\\prime\\prime}$</tex>":[145],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$^{\\prime\\prime}\\mathcal{h}(\\text{nn}),^{\\prime\\prime}$</tex>":[149],"future":[151],"work":[152],"will":[153],"expanding":[156],"improving":[160],"feature":[161],"extraction":[162],"techniques":[163],"better":[165],"capture":[166],"everyday":[167],"movements.":[169]},"counts_by_year":[],"updated_date":"2025-12-21T23:12:01.093139","created_date":"2025-10-10T00:00:00"}
