{"id":"https://openalex.org/W3216283037","doi":"https://doi.org/10.1109/lsp.2021.3129695","title":"Lightweight Speaker Recognition in Poincar\u00e9 Spaces","display_name":"Lightweight Speaker Recognition in Poincar\u00e9 Spaces","publication_year":2021,"publication_date":"2021-11-22","ids":{"openalex":"https://openalex.org/W3216283037","doi":"https://doi.org/10.1109/lsp.2021.3129695","mag":"3216283037"},"language":"en","primary_location":{"id":"doi:10.1109/lsp.2021.3129695","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2021.3129695","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100351737","display_name":"Jieun Lee","orcid":"https://orcid.org/0000-0002-2921-9431"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]},{"id":"https://openalex.org/I2799389823","display_name":"Korea Education and Research Information Service","ror":"https://ror.org/020r4p198","country_code":"KR","type":"government","lineage":["https://openalex.org/I2799389823","https://openalex.org/I2801339556","https://openalex.org/I2801339556","https://openalex.org/I4210114506","https://openalex.org/I4387152098"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Jieun Lee","raw_affiliation_strings":["Department of Electrical Engineering, Pohang University of Science and Technology, Pohang, South Korea","Korea Education and Research Information Service (KERIS), Daegu, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]},{"raw_affiliation_string":"Korea Education and Research Information Service (KERIS), Daegu, South Korea","institution_ids":["https://openalex.org/I2799389823"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103159153","display_name":"Sung-Bin Kim","orcid":"https://orcid.org/0009-0005-8455-3298"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Kim Sung-Bin","raw_affiliation_strings":["Department of Electrical Engineering, Pohang University of Science and Technology, Pohang, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044543389","display_name":"Seokhyeong Kang","orcid":"https://orcid.org/0000-0003-3015-1806"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seokhyeong Kang","raw_affiliation_strings":["Department of Electrical Engineering, Pohang University of Science and Technology, Pohang, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078114111","display_name":"Tae-Hyun Oh","orcid":"https://orcid.org/0000-0003-0468-1571"},"institutions":[{"id":"https://openalex.org/I123900574","display_name":"Pohang University of Science and Technology","ror":"https://ror.org/04xysgw12","country_code":"KR","type":"education","lineage":["https://openalex.org/I123900574"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Tae-Hyun Oh","raw_affiliation_strings":["Department of Electrical Engineering and Graduate School of Artificial Intelligence, Pohang University of Science and Technology, Pohang, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering and Graduate School of Artificial Intelligence, Pohang University of Science and Technology, Pohang, South Korea","institution_ids":["https://openalex.org/I123900574"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100351737"],"corresponding_institution_ids":["https://openalex.org/I123900574","https://openalex.org/I2799389823"],"apc_list":null,"apc_paid":null,"fwci":0.8158,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.78796699,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"29","issue":null,"first_page":"224","last_page":"228"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7342621088027954},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.7090445160865784},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6831296682357788},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.6151368618011475},{"id":"https://openalex.org/keywords/optimal-distinctiveness-theory","display_name":"Optimal distinctiveness theory","score":0.5852340459823608},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5495584607124329},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5455701351165771},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5099138021469116},{"id":"https://openalex.org/keywords/euclidean-distance","display_name":"Euclidean distance","score":0.4950646460056305},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.45086321234703064},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.43895429372787476},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4334031641483307},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41077935695648193},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.24290978908538818}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7342621088027954},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.7090445160865784},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6831296682357788},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.6151368618011475},{"id":"https://openalex.org/C47385372","wikidata":"https://www.wikidata.org/wiki/Q7098943","display_name":"Optimal distinctiveness theory","level":2,"score":0.5852340459823608},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5495584607124329},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5455701351165771},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5099138021469116},{"id":"https://openalex.org/C120174047","wikidata":"https://www.wikidata.org/wiki/Q847073","display_name":"Euclidean distance","level":2,"score":0.4950646460056305},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.45086321234703064},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.43895429372787476},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4334031641483307},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41077935695648193},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.24290978908538818},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C542102704","wikidata":"https://www.wikidata.org/wiki/Q183257","display_name":"Psychotherapist","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lsp.2021.3129695","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lsp.2021.3129695","pdf_url":null,"source":{"id":"https://openalex.org/S120629676","display_name":"IEEE Signal Processing Letters","issn_l":"1070-9908","issn":["1070-9908","1558-2361"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.699999988079071,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320322065","display_name":"National IT Industry Promotion Agency","ror":"https://ror.org/026v53e29"},{"id":"https://openalex.org/F4320328359","display_name":"Ministry of Science and ICT, South Korea","ror":"https://ror.org/01wpjm123"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W2060300932","https://openalex.org/W2091291608","https://openalex.org/W2187089797","https://openalex.org/W2194775991","https://openalex.org/W2461933982","https://openalex.org/W2502312327","https://openalex.org/W2604462068","https://openalex.org/W2612434969","https://openalex.org/W2726515241","https://openalex.org/W2794506738","https://openalex.org/W2797520557","https://openalex.org/W2808631503","https://openalex.org/W2902299888","https://openalex.org/W2916104401","https://openalex.org/W2920853498","https://openalex.org/W2943816678","https://openalex.org/W2962788625","https://openalex.org/W2962918445","https://openalex.org/W2962965870","https://openalex.org/W2963048316","https://openalex.org/W2963163009","https://openalex.org/W2963225922","https://openalex.org/W2963500407","https://openalex.org/W2963674932","https://openalex.org/W2979157532","https://openalex.org/W2982479999","https://openalex.org/W3013020904","https://openalex.org/W3015949486","https://openalex.org/W3034342078","https://openalex.org/W3035102141","https://openalex.org/W3095508601","https://openalex.org/W3127824945","https://openalex.org/W3195437175","https://openalex.org/W4289665794","https://openalex.org/W4295312788","https://openalex.org/W4297775537","https://openalex.org/W4299279015","https://openalex.org/W6638632666","https://openalex.org/W6679667936","https://openalex.org/W6685891324","https://openalex.org/W6724804524","https://openalex.org/W6726275242","https://openalex.org/W6737575990","https://openalex.org/W6737664043","https://openalex.org/W6751693566","https://openalex.org/W6752141533","https://openalex.org/W6755202523","https://openalex.org/W6800946474"],"related_works":["https://openalex.org/W4225552138","https://openalex.org/W2032875729","https://openalex.org/W3046185751","https://openalex.org/W2477273251","https://openalex.org/W2475308993","https://openalex.org/W2790526747","https://openalex.org/W2069575426","https://openalex.org/W3002212064","https://openalex.org/W90767720","https://openalex.org/W3148366653"],"abstract_inverted_index":{"This":[0,84],"letter":[1],"proposes":[2],"a":[3,11,91,105],"lightweight":[4],"model":[5,68,78],"for":[6,47,108,166],"speaker":[7,15,24,109,123,168],"recognition":[8,16,169],"by":[9,27,79,95],"leveraging":[10],"hyperbolic":[12,61,101,106],"space.":[13],"The":[14,55],"performance":[17,161],"heavily":[18],"depends":[19],"on":[20,38,141],"the":[21,39,59,96,100,121,134,142,149,163],"distinctiveness":[22],"of":[23,51,58,90,99,137,153],"embeddings":[25,124],"induced":[26],"metric":[28,41],"learning.":[29],"However,":[30],"most":[31],"state-of-the-art":[32],"embedding":[33],"methods":[34],"are":[35,125],"typically":[36,75],"based":[37],"Euclidean":[40],"space,":[42],"which":[43,72],"does":[44],"not":[45],"account":[46],"inherent":[48],"hierarchical":[49,70],"structures":[50],"speech":[52],"voice":[53],"characteristics.":[54],"recent":[56],"development":[57],"neural":[60,82,154],"geometry":[62,98],"has":[63,159],"demonstrated":[64],"its":[65],"effectiveness":[66],"to":[67,77],"continuous":[69],"structures,":[71],"have":[73],"been":[74],"cumbersome":[76],"standard":[80,164],"deep":[81],"networks.":[83],"facet":[85],"provides":[86],"an":[87],"additional":[88],"by-product":[89],"compact":[92,132],"representation.":[93],"Inspired":[94],"favorable":[97,160],"geometry,":[102],"we":[103],"developed":[104],"ResNet":[107,165],"recognition.":[110],"We":[111],"found":[112],"that":[113],"in":[114,128],"smaller":[115],"dimension":[116],"regimes":[117],"than":[118],"typical":[119],"cases,":[120],"learned":[122],"more":[126,131],"discriminative;":[127],"other":[129],"words,":[130],"at":[133],"same":[135],"level":[136],"performance.":[138],"Our":[139],"experiments":[140],"large-scale":[143],"VoxCeleb":[144],"datasets":[145],"show":[146],"that,":[147],"given":[148],"limited":[150],"channel":[151],"dimensions":[152],"networks,":[155],"our":[156],"method":[157],"consistently":[158],"against":[162],"both":[167],"and":[170],"verification":[171],"tasks.":[172]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
