{"id":"https://openalex.org/W4405709161","doi":"https://doi.org/10.1109/iscslp63861.2024.10800319","title":"Binary-Temporal Convolutional Neural Network for Multi-Class Auditory Spatial Attention Detection","display_name":"Binary-Temporal Convolutional Neural Network for Multi-Class Auditory Spatial Attention Detection","publication_year":2024,"publication_date":"2024-11-07","ids":{"openalex":"https://openalex.org/W4405709161","doi":"https://doi.org/10.1109/iscslp63861.2024.10800319"},"language":"en","primary_location":{"id":"doi:10.1109/iscslp63861.2024.10800319","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp63861.2024.10800319","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 14th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101645107","display_name":"Peng Zhao","orcid":"https://orcid.org/0000-0002-2666-0299"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Peng Zhao","raw_affiliation_strings":["National University of Defense Technology"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012127797","display_name":"Ruicong Wang","orcid":"https://orcid.org/0000-0001-5180-1367"},"institutions":[{"id":"https://openalex.org/I4210099586","display_name":"Shenzhen Research Institute of Big Data","ror":"https://ror.org/00z1gwf89","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210099586"]},{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruicong Wang","raw_affiliation_strings":["School of Data Science, Shenzhen Research Institute of Big Data, The Chinese University of Hong Kong,Shenzhen,Guangdong"],"affiliations":[{"raw_affiliation_string":"School of Data Science, Shenzhen Research Institute of Big Data, The Chinese University of Hong Kong,Shenzhen,Guangdong","institution_ids":["https://openalex.org/I4210116924","https://openalex.org/I4210099586"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103064052","display_name":"Xueyi Zhang","orcid":"https://orcid.org/0009-0008-2394-3518"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xueyi Zhang","raw_affiliation_strings":["National University of Defense Technology"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028043255","display_name":"Mingrui Lao","orcid":"https://orcid.org/0000-0001-8413-7220"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingrui Lao","raw_affiliation_strings":["National University of Defense Technology"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088380372","display_name":"Siqi Cai","orcid":"https://orcid.org/0000-0003-3282-9246"},"institutions":[{"id":"https://openalex.org/I165932596","display_name":"National University of Singapore","ror":"https://ror.org/01tgyzw49","country_code":"SG","type":"education","lineage":["https://openalex.org/I165932596"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Siqi Cai","raw_affiliation_strings":["National University of Singapore"],"affiliations":[{"raw_affiliation_string":"National University of Singapore","institution_ids":["https://openalex.org/I165932596"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101645107"],"corresponding_institution_ids":["https://openalex.org/I170215575"],"apc_list":null,"apc_paid":null,"fwci":0.7117,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.7195238,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9541000127792358,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9541000127792358,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11692","display_name":"Noise Effects and Management","score":0.9409000277519226,"subfield":{"id":"https://openalex.org/subfields/3616","display_name":"Speech and Hearing"},"field":{"id":"https://openalex.org/fields/36","display_name":"Health Professions"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8065483570098877},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6954939365386963},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.5976012349128723},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.5090793967247009},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4971964657306671},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4254499673843384},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4094979763031006},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.0603906512260437}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8065483570098877},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6954939365386963},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.5976012349128723},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.5090793967247009},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4971964657306671},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4254499673843384},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4094979763031006},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0603906512260437},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iscslp63861.2024.10800319","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iscslp63861.2024.10800319","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE 14th International Symposium on Chinese Spoken Language Processing (ISCSLP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10","score":0.6000000238418579}],"awards":[{"id":"https://openalex.org/G2799040894","display_name":null,"funder_award_id":"62271432","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1991139021","https://openalex.org/W2082183045","https://openalex.org/W2300242332","https://openalex.org/W2559463885","https://openalex.org/W2887447938","https://openalex.org/W2981819390","https://openalex.org/W3034297393","https://openalex.org/W3207598347","https://openalex.org/W4206654584","https://openalex.org/W4214888034","https://openalex.org/W4385822975","https://openalex.org/W4385863621","https://openalex.org/W4386452375","https://openalex.org/W4388519991","https://openalex.org/W4392693728","https://openalex.org/W6639703010","https://openalex.org/W6690026940","https://openalex.org/W6693397755","https://openalex.org/W6768287286","https://openalex.org/W6849381436","https://openalex.org/W6852504160","https://openalex.org/W6892601869"],"related_works":["https://openalex.org/W4391621807","https://openalex.org/W4321487865","https://openalex.org/W4313906399","https://openalex.org/W4391621790","https://openalex.org/W4239306820","https://openalex.org/W4391266461","https://openalex.org/W2590798552","https://openalex.org/W2811106690","https://openalex.org/W2947043951","https://openalex.org/W4399188509"],"abstract_inverted_index":{"Humans":[0],"have":[1],"a":[2,14,31,97,101,142,155],"remarkable":[3],"ability":[4],"to":[5,23,35],"focus":[6],"on":[7,37],"one":[8],"of":[9,27,78,90,131],"the":[10,25,28,61,76,88,125],"sound":[11],"sources":[12],"in":[13,44,137],"multi-speaker":[15],"environment.":[16],"Auditory":[17],"spatial":[18],"attention":[19,81],"detection":[20],"(ASAD)":[21],"aims":[22],"identify":[24],"direction":[26],"speech":[29],"source":[30],"person":[32],"is":[33],"attending":[34],"based":[36],"their":[38],"brain":[39],"signals,":[40],"with":[41,133],"potential":[42],"applications":[43],"enhancing":[45],"hearing":[46],"aids,":[47],"improving":[48],"communication":[49],"systems,":[50],"and":[51,118,157],"advancing":[52],"braincomputer":[53],"interface":[54],"(BCI)":[55],"technologies.":[56],"Most":[57],"prior":[58],"studies":[59],"formulated":[60],"problem":[62],"as":[63],"binary":[64,102],"classification,":[65],"however,":[66],"realworld":[67],"scenarios":[68],"are":[69],"much":[70],"more":[71],"complex.":[72],"Our":[73],"study":[74,113],"explores":[75],"feasibility":[77],"detecting":[79],"auditory":[80],"among":[82],"10":[83],"competing":[84],"speakers.":[85],"To":[86],"address":[87],"needs":[89],"low-resource":[91],"computing":[92],"equipment,":[93],"we":[94],"further":[95],"propose":[96],"novel":[98],"approach":[99],"using":[100],"temporal":[103],"convolutional":[104],"neural":[105],"network":[106,148],"(B-TCNN)":[107],"for":[108,141,160],"multiclass":[109],"ASAD":[110,144,162],"tasks.":[111,163],"This":[112],"effectively":[114],"reduces":[115],"memory":[116],"consumption":[117],"accelerates":[119],"inference.":[120],"Experimental":[121],"results":[122],"show":[123],"that":[124],"B-TCNN":[126],"achieves":[127],"an":[128],"average":[129],"accuracy":[130],"93.8%":[132],"only":[134],"33K":[135],"parameters":[136],"1-second":[138],"decision":[139],"windows":[140],"10class":[143],"dataset.":[145],"The":[146],"proposed":[147],"significantly":[149],"outperforms":[150],"other":[151],"competitive":[152],"models,":[153],"offering":[154],"lightweight":[156],"efficient":[158],"solution":[159],"multi-class":[161]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
