{"id":"https://openalex.org/W4405709883","doi":"https://doi.org/10.1109/iscslp63861.2024.10800104","title":"Enhancing Spatio-Temporal Auditory Attention Decoding with ST-AADNet","display_name":"Enhancing Spatio-Temporal Auditory Attention Decoding with ST-AADNet","publication_year":2024,"publication_date":"2024-11-07","ids":{"openalex":"https://openalex.org/W4405709883","doi":"https://doi.org/10.1109/iscslp63861.2024.10800104"},"language":"en","primary_location":{"id":"doi:10.1109/iscslp63861.2024.10800104","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp63861.2024.10800104","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 14th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038699958","display_name":"Ruofeng Yan","orcid":"https://orcid.org/0000-0001-8347-3097"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Ruofan Yan","raw_affiliation_strings":["Hong Kong Polytechnic University,Department of Computing"],"affiliations":[{"raw_affiliation_string":"Hong Kong Polytechnic University,Department of Computing","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102713928","display_name":"Peng Shu","orcid":"https://orcid.org/0000-0002-5970-9992"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Shu Peng","raw_affiliation_strings":["Hong Kong Polytechnic University,Department of Computing"],"affiliations":[{"raw_affiliation_string":"Hong Kong Polytechnic University,Department of Computing","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020592482","display_name":"Zhige Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Zhige Chen","raw_affiliation_strings":["Hong Kong Polytechnic University,Department of Computing"],"affiliations":[{"raw_affiliation_string":"Hong Kong Polytechnic University,Department of Computing","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083469101","display_name":"Zhi-An Huang","orcid":"https://orcid.org/0000-0001-9974-148X"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Zhi-An Huang","raw_affiliation_strings":["Hong Kong City University (Dong Guan)"],"affiliations":[{"raw_affiliation_string":"Hong Kong City University (Dong Guan)","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100448431","display_name":"Rui Liu","orcid":"https://orcid.org/0000-0002-1408-9443"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Rui Liu","raw_affiliation_strings":["Hong Kong Polytechnic University,Department of Computing"],"affiliations":[{"raw_affiliation_string":"Hong Kong Polytechnic University,Department of Computing","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025285243","display_name":"Kay Chen Tan","orcid":"https://orcid.org/0000-0002-6802-2463"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Kay Chen Tan","raw_affiliation_strings":["Hong Kong Polytechnic University,Department of Data Science and Artificial Intelligence"],"affiliations":[{"raw_affiliation_string":"Hong Kong Polytechnic University,Department of Data Science and Artificial Intelligence","institution_ids":["https://openalex.org/I14243506"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018341980","display_name":"Jibin Wu","orcid":"https://orcid.org/0000-0003-0135-4188"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jibin Wu","raw_affiliation_strings":["Hong Kong Polytechnic University,Department of Computing"],"affiliations":[{"raw_affiliation_string":"Hong Kong Polytechnic University,Department of Computing","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5038699958"],"corresponding_institution_ids":["https://openalex.org/I14243506"],"apc_list":null,"apc_paid":null,"fwci":0.3628,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.60705037,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"334","last_page":"338"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9883000254631042,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9883000254631042,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9747999906539917,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.8148790597915649},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7271546721458435},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5707671046257019},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.16921043395996094}],"concepts":[{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.8148790597915649},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7271546721458435},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5707671046257019},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.16921043395996094}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iscslp63861.2024.10800104","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp63861.2024.10800104","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 14th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1667288554","display_name":null,"funder_award_id":"P0043563,P0046094","funder_id":"https://openalex.org/F4320322598","funder_display_name":"Hong Kong Polytechnic University"},{"id":"https://openalex.org/G5524462834","display_name":null,"funder_award_id":"62306259,U21A20512","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322598","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W1534477342","https://openalex.org/W1991139021","https://openalex.org/W2027250573","https://openalex.org/W2033080056","https://openalex.org/W2082183045","https://openalex.org/W2122111042","https://openalex.org/W2255466643","https://openalex.org/W2322143332","https://openalex.org/W2408166852","https://openalex.org/W2558802391","https://openalex.org/W2767841979","https://openalex.org/W2775454033","https://openalex.org/W2923248388","https://openalex.org/W2948163068","https://openalex.org/W3097777922","https://openalex.org/W3126966983","https://openalex.org/W3159532722","https://openalex.org/W3159696612","https://openalex.org/W4206654584","https://openalex.org/W4211091012","https://openalex.org/W4223920619","https://openalex.org/W4383960611","https://openalex.org/W4385863621","https://openalex.org/W4400762160"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Individuals":[0],"with":[1,27],"hearing":[2],"impairments":[3],"often":[4],"struggle":[5],"to":[6,84,102],"isolate":[7],"and":[8,52,78,113],"focus":[9],"on":[10,110],"a":[11,65,74,79,95],"single":[12],"speaker":[13],"in":[14,47,128],"multi-speaker":[15],"environments.":[16],"Neuroscience":[17],"research":[18],"has":[19],"uncovered":[20],"distinct":[21],"patterns":[22],"of":[23,97,120],"brain":[24],"activity":[25],"associated":[26],"auditory":[28],"attention":[29],"that":[30],"can":[31],"be":[32],"detected":[33],"using":[34],"electroencephalography":[35],"(EEG)":[36],"measurements.":[37],"Existing":[38],"deep":[39],"learning":[40],"methods":[41,100],"developed":[42],"for":[43],"AAD":[44],"encounter":[45],"challenges":[46],"extracting":[48],"effective":[49],"spatial-temporal":[50,87],"features":[51,88],"handling":[53],"the":[54,104,117,121,125],"data":[55,98],"scarcity":[56],"issues.":[57],"To":[58],"address":[59],"these":[60],"issues,":[61],"this":[62],"work":[63],"proposes":[64],"novel":[66],"neural":[67,76],"network":[68,77,83],"architecture":[69],"named":[70],"ST-AADNet,":[71],"which":[72],"integrates":[73],"convolutional":[75],"long":[80],"short-term":[81],"memory":[82],"extract":[85],"useful":[86],"from":[89],"EEG":[90],"signals.":[91],"Furthermore,":[92],"we":[93],"introduce":[94],"series":[96],"augmentation":[99],"tailored":[101],"enhance":[103],"model's":[105],"generalization":[106],"capacity.":[107],"Experimental":[108],"studies":[109],"both":[111],"audio-only":[112],"audio-video":[114],"datasets":[115],"demonstrate":[116],"superior":[118],"performance":[119],"proposed":[122],"methods,":[123],"securing":[124],"second":[126],"position":[127],"The":[129],"First":[130],"Chinese":[131],"Auditory":[132],"Attention":[133],"Decoding":[134],"Challenge.":[135]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
