{"id":"https://openalex.org/W7138106426","doi":"https://doi.org/10.1609/aaai.v40i21.38870","title":"CAT-Net: A Cross-Attention Tone Network for Cross-Subject EEG-EMG Fusion Tone Decoding","display_name":"CAT-Net: A Cross-Attention Tone Network for Cross-Subject EEG-EMG Fusion Tone Decoding","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138106426","doi":"https://doi.org/10.1609/aaai.v40i21.38870"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i21.38870","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i21.38870","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38870/42832","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38870/42832","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043459152","display_name":"Yifan Zhuang","orcid":"https://orcid.org/0000-0003-3732-5215"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yifan Zhuang","raw_affiliation_strings":["Sony Interactive Entertainment"],"affiliations":[{"raw_affiliation_string":"Sony Interactive Entertainment","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038717078","display_name":"Calvin Huang","orcid":"https://orcid.org/0000-0002-5054-4714"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Calvin Huang","raw_affiliation_strings":["Independent researcher"],"affiliations":[{"raw_affiliation_string":"Independent researcher","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129677884","display_name":"Zepeng Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zepeng Yu","raw_affiliation_strings":["Independent researcher"],"affiliations":[{"raw_affiliation_string":"Independent researcher","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035501844","display_name":"Yongjie Zou","orcid":"https://orcid.org/0000-0001-8425-3934"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yongjie Zou","raw_affiliation_strings":["Lingang Laboratory"],"affiliations":[{"raw_affiliation_string":"Lingang Laboratory","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023760937","display_name":"Jiawei Ju","orcid":"https://orcid.org/0000-0002-1310-6803"},"institutions":[{"id":"https://openalex.org/I4210164150","display_name":"Shanghai Center for Brain Science and Brain-Inspired Technology","ror":"https://ror.org/0551a0y31","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210164150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiawei Ju","raw_affiliation_strings":["Shanghai Center for Brain Science and Brain-Inspired Technology\nLingang Laboratory"],"affiliations":[{"raw_affiliation_string":"Shanghai Center for Brain Science and Brain-Inspired Technology\nLingang Laboratory","institution_ids":["https://openalex.org/I4210164150"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5043459152"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.3015873,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"21","first_page":"18090","last_page":"18098"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10429","display_name":"EEG and Brain-Computer Interfaces","score":0.9853000044822693,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10429","display_name":"EEG and Brain-Computer Interfaces","score":0.9853000044822693,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.004800000227987766,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10784","display_name":"Muscle activation and electromyography studies","score":0.0010999999940395355,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.8485000133514404},{"id":"https://openalex.org/keywords/tone","display_name":"Tone (literature)","score":0.5997999906539917},{"id":"https://openalex.org/keywords/electroencephalography","display_name":"Electroencephalography","score":0.5967000126838684},{"id":"https://openalex.org/keywords/mandarin-chinese","display_name":"Mandarin Chinese","score":0.5716000199317932},{"id":"https://openalex.org/keywords/brain\u2013computer-interface","display_name":"Brain\u2013computer interface","score":0.5306000113487244},{"id":"https://openalex.org/keywords/neural-decoding","display_name":"Neural decoding","score":0.5203999876976013},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.37880000472068787},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.37700000405311584}],"concepts":[{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.8485000133514404},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7524999976158142},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7251999974250793},{"id":"https://openalex.org/C2780583480","wikidata":"https://www.wikidata.org/wiki/Q1366327","display_name":"Tone (literature)","level":2,"score":0.5997999906539917},{"id":"https://openalex.org/C522805319","wikidata":"https://www.wikidata.org/wiki/Q179965","display_name":"Electroencephalography","level":2,"score":0.5967000126838684},{"id":"https://openalex.org/C138954614","wikidata":"https://www.wikidata.org/wiki/Q9192","display_name":"Mandarin Chinese","level":2,"score":0.5716000199317932},{"id":"https://openalex.org/C173201364","wikidata":"https://www.wikidata.org/wiki/Q897410","display_name":"Brain\u2013computer interface","level":3,"score":0.5306000113487244},{"id":"https://openalex.org/C40743351","wikidata":"https://www.wikidata.org/wiki/Q7002049","display_name":"Neural decoding","level":3,"score":0.5203999876976013},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41519999504089355},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.37880000472068787},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.37700000405311584},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.37369999289512634},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3644999861717224},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.3458999991416931},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.33160001039505005},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.3089999854564667},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.30219998955726624},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2937000095844269},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.27570000290870667},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.27549999952316284},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.26109999418258667},{"id":"https://openalex.org/C43617652","wikidata":"https://www.wikidata.org/wiki/Q7575399","display_name":"Speech production","level":2,"score":0.2502000033855438}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i21.38870","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i21.38870","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38870/42832","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i21.38870","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i21.38870","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/38870/42832","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7138106426.pdf","grobid_xml":"https://content.openalex.org/works/W7138106426.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Brain-computer":[0],"interface":[1],"(BCI)":[2],"speech":[3,15,81,94,170],"decoding":[4,34,63,98,213],"has":[5],"emerged":[6],"as":[7,42],"a":[8,58,106],"promising":[9],"tool":[10],"for":[11,32,168,173,190],"assisting":[12],"individuals":[13],"with":[14,105,184,214],"impairments.":[16],"In":[17,53,176],"this":[18,54],"context,":[19],"the":[20,85,145,203,227],"integration":[21],"of":[22,88,147,166,186,205,229],"electroencephalography":[23],"(EEG)":[24],"and":[25,68,79,90,129,140,171,188,192,220],"electromyography":[26],"(EMG)":[27],"signals":[28,70],"offers":[29],"strong":[30,182],"potential":[31],"enhancing":[33],"performance.":[35],"Mandarin":[36,74],"tone":[37],"classification":[38,164],"presents":[39],"particular":[40],"challenges,":[41],"tonal":[43],"variations":[44],"convey":[45],"distinct":[46],"meanings":[47],"even":[48],"when":[49],"phonemes":[50],"remain":[51],"identical.":[52],"study,":[55],"we":[56],"propose":[57],"novel":[59],"cross-subject":[60,122,177],"multimodal":[61],"BCI":[62,231],"framework":[64],"that":[65,211],"fuses":[66],"EEG":[67,127,139],"EMG":[69,131,142],"to":[71,120,201,226],"classify":[72],"four":[73],"tones":[75],"under":[76],"both":[77],"audible":[78,169,191],"silent":[80,174,193],"conditions.":[82],"Inspired":[83],"by":[84],"cooperative":[86],"mechanisms":[87],"neural":[89,97],"muscular":[91],"systems":[92],"in":[93],"production,":[95],"our":[96,154],"architecture":[99],"combines":[100],"spatial-temporal":[101],"feature":[102],"extraction":[103],"branches":[104],"cross-attention":[107],"fusion":[108],"mechanism,":[109],"enabling":[110],"informative":[111],"interaction":[112],"between":[113],"modalities.":[114],"We":[115,124,196],"further":[116,197],"incorporate":[117],"domain-adversarial":[118],"training":[119],"improve":[121],"generalization.":[123],"collected":[125],"4,800":[126,130],"trials":[128,132],"from":[133],"10":[134],"participants":[135],"using":[136],"only":[137],"twenty":[138],"five":[141],"channels,":[143],"demonstrating":[144],"feasibility":[146],"minimal-channel":[148],"decoding.":[149],"Despite":[150],"employing":[151],"lightweight":[152],"modules,":[153],"model":[155],"outperforms":[156],"state-of-the-art":[157],"baselines":[158],"across":[159,223],"all":[160],"conditions,":[161],"achieving":[162],"average":[163],"accuracies":[165,185],"87.83\\%":[167],"88.08\\%":[172],"speech.":[175],"evaluations,":[178],"it":[179],"still":[180],"maintains":[181],"performance":[183],"83.27\\%":[187],"85.10\\%":[189],"speech,":[194],"respectively.":[195],"conduct":[198],"ablation":[199],"studies":[200],"validate":[202],"effectiveness":[204],"each":[206],"component.":[207],"Our":[208],"findings":[209],"suggest":[210],"tone-level":[212],"minimal":[215],"EEG-EMG":[216],"channels":[217],"is":[218],"feasible":[219],"potentially":[221],"generalizable":[222],"subjects,":[224],"contributing":[225],"development":[228],"practical":[230],"applications.":[232]},"counts_by_year":[],"updated_date":"2026-03-20T20:47:17.329874","created_date":"2026-03-18T00:00:00"}
