{"id":"https://openalex.org/W4392904437","doi":"https://doi.org/10.1109/icassp48485.2024.10448221","title":"TB-ResNet: Bridging the Gap from TDNN to ResNet in Automatic Speaker Verification with Temporal-Bottleneck Enhancement","display_name":"TB-ResNet: Bridging the Gap from TDNN to ResNet in Automatic Speaker Verification with Temporal-Bottleneck Enhancement","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392904437","doi":"https://doi.org/10.1109/icassp48485.2024.10448221"},"language":"en","primary_location":{"id":"doi:10.1109/icassp48485.2024.10448221","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10448221","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007968560","display_name":"Sunmook Choi","orcid":"https://orcid.org/0009-0006-3044-9222"},"institutions":[{"id":"https://openalex.org/I197347611","display_name":"Korea University","ror":"https://ror.org/047dqcg40","country_code":"KR","type":"education","lineage":["https://openalex.org/I197347611"]},{"id":"https://openalex.org/I4210161052","display_name":"Korea University","ror":"https://ror.org/05m1gnk07","country_code":"JP","type":"education","lineage":["https://openalex.org/I4210161052"]}],"countries":["JP","KR"],"is_corresponding":true,"raw_author_name":"Sunmook Choi","raw_affiliation_strings":["Korea University,Department of Mathematics,Republic of Korea","Department of Mathematics, Korea University, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Korea University,Department of Mathematics,Republic of Korea","institution_ids":["https://openalex.org/I4210161052","https://openalex.org/I197347611"]},{"raw_affiliation_string":"Department of Mathematics, Korea University, Republic of Korea","institution_ids":["https://openalex.org/I197347611"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101310939","display_name":"Sanghyeok Chung","orcid":"https://orcid.org/0009-0002-2257-4729"},"institutions":[{"id":"https://openalex.org/I197347611","display_name":"Korea University","ror":"https://ror.org/047dqcg40","country_code":"KR","type":"education","lineage":["https://openalex.org/I197347611"]},{"id":"https://openalex.org/I4210161052","display_name":"Korea University","ror":"https://ror.org/05m1gnk07","country_code":"JP","type":"education","lineage":["https://openalex.org/I4210161052"]}],"countries":["JP","KR"],"is_corresponding":false,"raw_author_name":"Sanghyeok Chung","raw_affiliation_strings":["Korea University,Department of Mathematics,Republic of Korea","Department of Mathematics, Korea University, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Korea University,Department of Mathematics,Republic of Korea","institution_ids":["https://openalex.org/I4210161052","https://openalex.org/I197347611"]},{"raw_affiliation_string":"Department of Mathematics, Korea University, Republic of Korea","institution_ids":["https://openalex.org/I197347611"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109692723","display_name":"Seungeun Lee","orcid":"https://orcid.org/0009-0006-2913-803X"},"institutions":[{"id":"https://openalex.org/I197347611","display_name":"Korea University","ror":"https://ror.org/047dqcg40","country_code":"KR","type":"education","lineage":["https://openalex.org/I197347611"]},{"id":"https://openalex.org/I4210161052","display_name":"Korea University","ror":"https://ror.org/05m1gnk07","country_code":"JP","type":"education","lineage":["https://openalex.org/I4210161052"]}],"countries":["JP","KR"],"is_corresponding":false,"raw_author_name":"Seungeun Lee","raw_affiliation_strings":["Korea University,Department of Mathematics,Republic of Korea","Department of Mathematics, Korea University, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Korea University,Department of Mathematics,Republic of Korea","institution_ids":["https://openalex.org/I4210161052","https://openalex.org/I197347611"]},{"raw_affiliation_string":"Department of Mathematics, Korea University, Republic of Korea","institution_ids":["https://openalex.org/I197347611"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064412814","display_name":"Soyul Han","orcid":"https://orcid.org/0000-0003-0156-250X"},"institutions":[{"id":"https://openalex.org/I67900169","display_name":"Chung-Ang University","ror":"https://ror.org/01r024a98","country_code":"KR","type":"education","lineage":["https://openalex.org/I67900169"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Soyul Han","raw_affiliation_strings":["Chung-Ang University,Department of Statistics and Data Science,Republic of Korea","Department of Statistics and Data Science, Chung-Ang University, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Chung-Ang University,Department of Statistics and Data Science,Republic of Korea","institution_ids":["https://openalex.org/I67900169"]},{"raw_affiliation_string":"Department of Statistics and Data Science, Chung-Ang University, Republic of Korea","institution_ids":["https://openalex.org/I67900169"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102505609","display_name":"Taein Kang","orcid":"https://orcid.org/0009-0007-4978-9101"},"institutions":[{"id":"https://openalex.org/I67900169","display_name":"Chung-Ang University","ror":"https://ror.org/01r024a98","country_code":"KR","type":"education","lineage":["https://openalex.org/I67900169"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Taein Kang","raw_affiliation_strings":["Chung-Ang University,Department of Statistics and Data Science,Republic of Korea","Department of Statistics and Data Science, Chung-Ang University, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Chung-Ang University,Department of Statistics and Data Science,Republic of Korea","institution_ids":["https://openalex.org/I67900169"]},{"raw_affiliation_string":"Department of Statistics and Data Science, Chung-Ang University, Republic of Korea","institution_ids":["https://openalex.org/I67900169"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062505402","display_name":"Jaejin Seo","orcid":"https://orcid.org/0000-0002-7534-9341"},"institutions":[{"id":"https://openalex.org/I67900169","display_name":"Chung-Ang University","ror":"https://ror.org/01r024a98","country_code":"KR","type":"education","lineage":["https://openalex.org/I67900169"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jaejin Seo","raw_affiliation_strings":["Chung-Ang University,Department of Statistics and Data Science,Republic of Korea","Department of Statistics and Data Science, Chung-Ang University, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Chung-Ang University,Department of Statistics and Data Science,Republic of Korea","institution_ids":["https://openalex.org/I67900169"]},{"raw_affiliation_string":"Department of Statistics and Data Science, Chung-Ang University, Republic of Korea","institution_ids":["https://openalex.org/I67900169"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014457836","display_name":"Il\u2010Youp Kwak","orcid":"https://orcid.org/0000-0002-7117-7669"},"institutions":[{"id":"https://openalex.org/I67900169","display_name":"Chung-Ang University","ror":"https://ror.org/01r024a98","country_code":"KR","type":"education","lineage":["https://openalex.org/I67900169"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Il-Youp Kwak","raw_affiliation_strings":["Chung-Ang University,Department of Statistics and Data Science,Republic of Korea","Department of Statistics and Data Science, Chung-Ang University, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Chung-Ang University,Department of Statistics and Data Science,Republic of Korea","institution_ids":["https://openalex.org/I67900169"]},{"raw_affiliation_string":"Department of Statistics and Data Science, Chung-Ang University, Republic of Korea","institution_ids":["https://openalex.org/I67900169"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064077787","display_name":"Seungsang Oh","orcid":"https://orcid.org/0000-0003-4975-9977"},"institutions":[{"id":"https://openalex.org/I4210161052","display_name":"Korea University","ror":"https://ror.org/05m1gnk07","country_code":"JP","type":"education","lineage":["https://openalex.org/I4210161052"]},{"id":"https://openalex.org/I197347611","display_name":"Korea University","ror":"https://ror.org/047dqcg40","country_code":"KR","type":"education","lineage":["https://openalex.org/I197347611"]}],"countries":["JP","KR"],"is_corresponding":false,"raw_author_name":"Seungsang Oh","raw_affiliation_strings":["Korea University,Department of Mathematics,Republic of Korea","Department of Mathematics, Korea University, Republic of Korea"],"affiliations":[{"raw_affiliation_string":"Korea University,Department of Mathematics,Republic of Korea","institution_ids":["https://openalex.org/I4210161052","https://openalex.org/I197347611"]},{"raw_affiliation_string":"Department of Mathematics, Korea University, Republic of Korea","institution_ids":["https://openalex.org/I197347611"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5007968560"],"corresponding_institution_ids":["https://openalex.org/I197347611","https://openalex.org/I4210161052"],"apc_list":null,"apc_paid":null,"fwci":2.1822,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.88499765,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"10291","last_page":"10295"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/residual-neural-network","display_name":"Residual neural network","score":0.836748480796814},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.8349922895431519},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.8077596426010132},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7599836587905884},{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.5237215161323547},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4332996606826782},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42384666204452515},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4166499376296997},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3965902328491211},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3677307367324829},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.14374953508377075},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.10762110352516174}],"concepts":[{"id":"https://openalex.org/C2944601119","wikidata":"https://www.wikidata.org/wiki/Q43744058","display_name":"Residual neural network","level":3,"score":0.836748480796814},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.8349922895431519},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.8077596426010132},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7599836587905884},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.5237215161323547},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4332996606826782},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42384666204452515},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4166499376296997},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3965902328491211},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3677307367324829},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.14374953508377075},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.10762110352516174}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp48485.2024.10448221","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10448221","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4699999988079071,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W2046056978","https://openalex.org/W2194775991","https://openalex.org/W2219249508","https://openalex.org/W2607662938","https://openalex.org/W2696967604","https://openalex.org/W2726515241","https://openalex.org/W2794506738","https://openalex.org/W2808631503","https://openalex.org/W2890964092","https://openalex.org/W2936774411","https://openalex.org/W2938358845","https://openalex.org/W2969985801","https://openalex.org/W2972369255","https://openalex.org/W2972712416","https://openalex.org/W3024869864","https://openalex.org/W4293363567","https://openalex.org/W4296608375","https://openalex.org/W4297165527","https://openalex.org/W4321524405","https://openalex.org/W6637242042","https://openalex.org/W6638667902","https://openalex.org/W6688816777","https://openalex.org/W6842535719","https://openalex.org/W6842909713","https://openalex.org/W6849840340"],"related_works":["https://openalex.org/W2595172197","https://openalex.org/W2084856301","https://openalex.org/W2127970246","https://openalex.org/W2953234277","https://openalex.org/W4401096132","https://openalex.org/W3213976941","https://openalex.org/W2896102333","https://openalex.org/W4289388752","https://openalex.org/W2604192360","https://openalex.org/W4400659363"],"abstract_inverted_index":{"This":[0],"paper":[1],"focuses":[2],"on":[3,125],"the":[4,48,53,65,94,121,133,138],"transition":[5],"of":[6,96,118],"automatic":[7],"speaker":[8],"verification":[9],"systems":[10,21],"from":[11],"time":[12],"delay":[13],"neural":[14],"networks":[15],"(TDNN)":[16],"to":[17,27,46,61],"ResNet-based":[18,39,89],"networks.":[19],"TDNN-based":[20],"use":[22],"a":[23,88,108,128],"statistics":[24,49,78,97],"pooling":[25,50,98],"layer":[26],"aggregate":[28],"temporal":[29,66,71,109],"information":[30,72],"which":[31],"is":[32],"suitable":[33],"for":[34],"two-dimensional":[35],"tensors.":[36],"Even":[37],"though":[38],"models":[40],"produce":[41],"three-dimensional":[42],"tensors,":[43],"they":[44],"continue":[45],"incorporate":[47],"layer.":[51],"However,":[52],"reduction":[54,130],"in":[55,58,112,131],"spatial":[56],"dimensions":[57],"ResNet":[59,86,123],"due":[60],"convolution":[62],"operations,":[63],"including":[64],"axis,":[67],"raises":[68],"concerns":[69],"about":[70],"loss":[73],"and":[74,103,137],"its":[75,113],"compatibility":[76],"with":[77],"pooling.":[79],"To":[80],"address":[81],"this,":[82],"we":[83],"introduce":[84],"Temporal-Bottleneck":[85],"(TB-ResNet),":[87],"system":[90],"that":[91],"can":[92],"utilize":[93],"nature":[95],"more":[99],"effectively":[100],"by":[101],"capturing":[102],"retaining":[104],"frame-level":[105],"contexts":[106],"through":[107],"bottleneck":[110],"configuration":[111],"building":[114],"blocks.":[115],"The":[116],"performance":[117],"TB-ResNets":[119],"outperforms":[120],"original":[122],"counterparts":[124],"VoxCeleb1,":[126],"achieving":[127],"significant":[129],"both":[132],"equal":[134],"error":[135],"rate":[136],"minimum":[139],"detection":[140],"cost":[141],"function.":[142]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
