{"id":"https://openalex.org/W7147222852","doi":"https://doi.org/10.1016/j.array.2026.100787","title":"Multimodal fusion of visual and auditory biomarkers: An epoch-wise stochastic modality masking framework for stroke detection using a CNN\u2013GRU network","display_name":"Multimodal fusion of visual and auditory biomarkers: An epoch-wise stochastic modality masking framework for stroke detection using a CNN\u2013GRU network","publication_year":2026,"publication_date":"2026-04-01","ids":{"openalex":"https://openalex.org/W7147222852","doi":"https://doi.org/10.1016/j.array.2026.100787"},"language":"en","primary_location":{"id":"doi:10.1016/j.array.2026.100787","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.array.2026.100787","pdf_url":null,"source":{"id":"https://openalex.org/S4210194039","display_name":"Array","issn_l":"2590-0056","issn":["2590-0056"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Array","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1016/j.array.2026.100787","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5106398750","display_name":"Sadman Sakib Alif","orcid":null},"institutions":[{"id":"https://openalex.org/I5518804","display_name":"BRAC University","ror":"https://ror.org/00sge8677","country_code":"BD","type":"education","lineage":["https://openalex.org/I5518804"]}],"countries":["BD"],"is_corresponding":false,"raw_author_name":"Sadman Sakib Alif","raw_affiliation_strings":["BRAC University, Dhaka, Bangladesh"],"raw_orcid":"https://orcid.org/0009-0008-3643-9134","affiliations":[{"raw_affiliation_string":"BRAC University, Dhaka, Bangladesh","institution_ids":["https://openalex.org/I5518804"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132695328","display_name":"Md. Yasin Arafat","orcid":null},"institutions":[{"id":"https://openalex.org/I157386601","display_name":"North South University","ror":"https://ror.org/05wdbfp45","country_code":"BD","type":"education","lineage":["https://openalex.org/I157386601"]}],"countries":["BD"],"is_corresponding":false,"raw_author_name":"Md. Yasin Arafat","raw_affiliation_strings":["North South University, Dhaka, Bangladesh"],"raw_orcid":"https://orcid.org/0009-0003-1791-5266","affiliations":[{"raw_affiliation_string":"North South University, Dhaka, Bangladesh","institution_ids":["https://openalex.org/I157386601"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132610724","display_name":"Md. Mazharul Islam Nibir","orcid":null},"institutions":[{"id":"https://openalex.org/I157386601","display_name":"North South University","ror":"https://ror.org/05wdbfp45","country_code":"BD","type":"education","lineage":["https://openalex.org/I157386601"]}],"countries":["BD"],"is_corresponding":false,"raw_author_name":"Md. Mazharul Islam Nibir","raw_affiliation_strings":["North South University, Dhaka, Bangladesh"],"raw_orcid":"https://orcid.org/0009-0005-9880-3833","affiliations":[{"raw_affiliation_string":"North South University, Dhaka, Bangladesh","institution_ids":["https://openalex.org/I157386601"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132550043","display_name":"Farhana Mehazbin Tusti","orcid":null},"institutions":[{"id":"https://openalex.org/I157386601","display_name":"North South University","ror":"https://ror.org/05wdbfp45","country_code":"BD","type":"education","lineage":["https://openalex.org/I157386601"]}],"countries":["BD"],"is_corresponding":false,"raw_author_name":"Farhana Mehazbin Tusti","raw_affiliation_strings":["North South University, Dhaka, Bangladesh"],"raw_orcid":"https://orcid.org/0009-0008-4423-3101","affiliations":[{"raw_affiliation_string":"North South University, Dhaka, Bangladesh","institution_ids":["https://openalex.org/I157386601"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024196830","display_name":"Aniqua Nusrat Zereen","orcid":"https://orcid.org/0000-0002-8655-8667"},"institutions":[{"id":"https://openalex.org/I25399158","display_name":"Mahidol University","ror":"https://ror.org/01znkr924","country_code":"TH","type":"education","lineage":["https://openalex.org/I25399158"]}],"countries":["TH"],"is_corresponding":true,"raw_author_name":"Aniqua Nusrat Zereen","raw_affiliation_strings":["Mahidol University, Salaya, Thailand"],"raw_orcid":"https://orcid.org/0000-0002-8655-8667","affiliations":[{"raw_affiliation_string":"Mahidol University, Salaya, Thailand","institution_ids":["https://openalex.org/I25399158"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5024196830"],"corresponding_institution_ids":["https://openalex.org/I25399158"],"apc_list":{"value":1350,"currency":"USD","value_usd":1350},"apc_paid":{"value":1350,"currency":"USD","value_usd":1350},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.75632611,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"30","issue":null,"first_page":"100787","last_page":"100787"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10863","display_name":"Voice and Speech Disorders","score":0.3515999913215637,"subfield":{"id":"https://openalex.org/subfields/2737","display_name":"Physiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T10863","display_name":"Voice and Speech Disorders","score":0.3515999913215637,"subfield":{"id":"https://openalex.org/subfields/2737","display_name":"Physiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10510","display_name":"Stroke Rehabilitation and Recovery","score":0.07370000332593918,"subfield":{"id":"https://openalex.org/subfields/2742","display_name":"Rehabilitation"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10227","display_name":"Acute Ischemic Stroke Management","score":0.0560000017285347,"subfield":{"id":"https://openalex.org/subfields/2713","display_name":"Epidemiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6355999708175659},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5807999968528748},{"id":"https://openalex.org/keywords/masking","display_name":"Masking (illustration)","score":0.527999997138977},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.521399974822998},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.36160001158714294},{"id":"https://openalex.org/keywords/facial-expression","display_name":"Facial expression","score":0.33149999380111694},{"id":"https://openalex.org/keywords/audio-visual","display_name":"Audio visual","score":0.3052999973297119}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7894999980926514},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6355999708175659},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.586899995803833},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5807999968528748},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5444999933242798},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.527999997138977},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.521399974822998},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.36160001158714294},{"id":"https://openalex.org/C195704467","wikidata":"https://www.wikidata.org/wiki/Q327968","display_name":"Facial expression","level":2,"score":0.33149999380111694},{"id":"https://openalex.org/C3017588708","wikidata":"https://www.wikidata.org/wiki/Q758901","display_name":"Audio visual","level":2,"score":0.3052999973297119},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3019999861717224},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.299699991941452},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.2955000102519989},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2928999960422516},{"id":"https://openalex.org/C108154423","wikidata":"https://www.wikidata.org/wiki/Q1469792","display_name":"Salience (neuroscience)","level":2,"score":0.2915000021457672},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.2750999927520752},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.2549999952316284},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.2547000050544739},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.25119999051094055},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2508000135421753}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1016/j.array.2026.100787","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.array.2026.100787","pdf_url":null,"source":{"id":"https://openalex.org/S4210194039","display_name":"Array","issn_l":"2590-0056","issn":["2590-0056"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Array","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:26a3aa7bf44d495a9daa723665e5617e","is_oa":true,"landing_page_url":"https://doaj.org/article/26a3aa7bf44d495a9daa723665e5617e","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Array, Vol 30, Iss , Pp 100787- (2026)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1016/j.array.2026.100787","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.array.2026.100787","pdf_url":null,"source":{"id":"https://openalex.org/S4210194039","display_name":"Array","issn_l":"2590-0056","issn":["2590-0056"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Array","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","score":0.5634048581123352,"display_name":"Industry, innovation and infrastructure"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W2018363392","https://openalex.org/W2095955991","https://openalex.org/W2157420555","https://openalex.org/W2167541413","https://openalex.org/W2508244509","https://openalex.org/W2803306216","https://openalex.org/W2899356990","https://openalex.org/W2919243131","https://openalex.org/W3082991707","https://openalex.org/W3092693034","https://openalex.org/W3158717660","https://openalex.org/W3164264239","https://openalex.org/W3204786284","https://openalex.org/W4205679663","https://openalex.org/W4224315877","https://openalex.org/W4283368621","https://openalex.org/W4283749599","https://openalex.org/W4287509666","https://openalex.org/W4294875228","https://openalex.org/W4303685860","https://openalex.org/W4311472318","https://openalex.org/W4361855690","https://openalex.org/W4362731103","https://openalex.org/W4388027483","https://openalex.org/W4389080144","https://openalex.org/W4391490171","https://openalex.org/W4393252960","https://openalex.org/W4393312849","https://openalex.org/W4399421915","https://openalex.org/W4399442744","https://openalex.org/W4400031023","https://openalex.org/W4401659386","https://openalex.org/W4401795618","https://openalex.org/W4405512582","https://openalex.org/W4407637717","https://openalex.org/W4408358703","https://openalex.org/W4409316841","https://openalex.org/W4411799683"],"related_works":[],"abstract_inverted_index":{"The":[0,183],"automated":[1],"identification":[2],"of":[3,18,51,105,126],"neurovascular":[4],"impairment,":[5],"particularly":[6],"ischemic":[7],"or":[8],"hemorrhagic":[9],"stroke,":[10],"remains":[11],"challenging":[12],"due":[13],"to":[14,66,159,169,219],"the":[15,55,72,85,103,113,157,167,188,200,211,217,227],"multimodal":[16,30,140,176,197],"nature":[17],"symptoms":[19],"such":[20],"as":[21],"facial":[22,58,86,143,149],"asymmetry":[23],"and":[24,36,41,87,95,145,151,163],"dysarthria.":[25],"This":[26,155],"study":[27],"introduces":[28],"a":[29,46,117,123],"diagnostic":[31],"framework":[32,190],"that":[33,187],"integrates":[34],"visual":[35,56],"auditory":[37,73],"streams":[38],"for":[39,229],"accurate":[40],"interpretable":[42],"stroke":[43,230],"detection,":[44],"with":[45],"focus":[47],"on":[48],"efficient":[49],"utilization":[50],"available":[52],"data.":[53],"On":[54],"side,":[57],"landmarks":[59,144,150],"are":[60,77],"derived":[61],"from":[62,91,135,223],"MediaPipe\u2019s":[63],"Face":[64],"Mesh":[65],"identify":[67],"unilateral":[68],"muscular":[69],"deficiencies.":[70],"For":[71],"streams,":[74],"speech":[75],"recordings":[76],"transformed":[78],"into":[79],"Mel-Frequency":[80],"Cepstral":[81],"Coefficients":[82],"(MFCC).":[83],"Notably,":[84],"audio":[88,146,153],"data":[89,128],"come":[90],"two":[92],"separate":[93],"sources":[94],"lack":[96],"patient-level":[97],"correspondence.":[98],"A":[99],"primary":[100],"innovation":[101],"is":[102,129,180],"incorporation":[104],"an":[106],"epoch-wise":[107],"stochastic":[108],"modality":[109,213],"masking":[110,214],"approach":[111,215],"within":[112],"training":[114,127],"loop,":[115],"utilizing":[116],"CNN\u2013GRU":[118],"scheme.":[119],"In":[120],"each":[121],"epoch,":[122],"new":[124],"batch":[125],"created":[130],"by":[131],"dynamically":[132],"combining":[133],"samples":[134],"three":[136],"different":[137],"categories:":[138],"complete":[139],"input":[141],"(both":[142],"MFCC),":[147],"only":[148,152],"MFCC.":[154],"compels":[156],"model":[158,218],"learn":[160,220],"both":[161],"unimodal":[162,201],"cross-modal":[164],"representations,":[165],"demonstrating":[166,226],"ability":[168],"leverage":[170],"multiple":[171],"modalities":[172],"even":[173],"when":[174],"true":[175],"correspondence":[177],"across":[178],"datasets":[179],"not":[181],"available.":[182],"empirical":[184],"results":[185],"show":[186,207],"developed":[189],"works":[191],"well,":[192],"achieving":[193],"95.33%":[194],"accuracy":[195],"in":[196,232],"settings.":[198],"While":[199],"baselines":[202],"(facial-only:":[203],"86.87%;":[204],"audio-only:":[205],"97.41%)":[206],"strong":[208],"performance":[209],"individually,":[210],"proposed":[212],"enables":[216],"robust":[221],"representations":[222],"cross-source":[224],"data,":[225],"potential":[228],"detection":[231],"preliminary":[233],"evaluation":[234],"scenarios.":[235]},"counts_by_year":[],"updated_date":"2026-04-06T05:59:17.497350","created_date":"2026-04-02T00:00:00"}
