{"id":"https://openalex.org/W3194417184","doi":"https://doi.org/10.1109/biosig52210.2021.9548296","title":"Curricular SincNet: Towards Robust Deep Speaker Recognition by Emphasizing Hard Samples in Latent Space","display_name":"Curricular SincNet: Towards Robust Deep Speaker Recognition by Emphasizing Hard Samples in Latent Space","publication_year":2021,"publication_date":"2021-09-01","ids":{"openalex":"https://openalex.org/W3194417184","doi":"https://doi.org/10.1109/biosig52210.2021.9548296","mag":"3194417184"},"language":"en","primary_location":{"id":"doi:10.1109/biosig52210.2021.9548296","is_oa":false,"landing_page_url":"https://doi.org/10.1109/biosig52210.2021.9548296","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Conference of the Biometrics Special Interest Group (BIOSIG)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2108.10714","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010392592","display_name":"Labib Chowdhury","orcid":"https://orcid.org/0000-0002-5287-8267"},"institutions":[{"id":"https://openalex.org/I157386601","display_name":"North South University","ror":"https://ror.org/05wdbfp45","country_code":"BD","type":"education","lineage":["https://openalex.org/I157386601"]}],"countries":["BD"],"is_corresponding":true,"raw_author_name":"Labib Chowdhury","raw_affiliation_strings":["North South University, Dhaka, Bangladesh","[North South University]"],"affiliations":[{"raw_affiliation_string":"North South University, Dhaka, Bangladesh","institution_ids":["https://openalex.org/I157386601"]},{"raw_affiliation_string":"[North South University]","institution_ids":["https://openalex.org/I157386601"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048854958","display_name":"Mustafa Kamal","orcid":"https://orcid.org/0000-0002-9783-2924"},"institutions":[{"id":"https://openalex.org/I157386601","display_name":"North South University","ror":"https://ror.org/05wdbfp45","country_code":"BD","type":"education","lineage":["https://openalex.org/I157386601"]}],"countries":["BD"],"is_corresponding":false,"raw_author_name":"Mustafa Kamal","raw_affiliation_strings":["North South University, Dhaka, Bangladesh","[North South University]"],"affiliations":[{"raw_affiliation_string":"North South University, Dhaka, Bangladesh","institution_ids":["https://openalex.org/I157386601"]},{"raw_affiliation_string":"[North South University]","institution_ids":["https://openalex.org/I157386601"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023934543","display_name":"Najia Hasan","orcid":null},"institutions":[{"id":"https://openalex.org/I157386601","display_name":"North South University","ror":"https://ror.org/05wdbfp45","country_code":"BD","type":"education","lineage":["https://openalex.org/I157386601"]}],"countries":["BD"],"is_corresponding":false,"raw_author_name":"Najia Hasan","raw_affiliation_strings":["North South University, Dhaka, Bangladesh","[North South University]"],"affiliations":[{"raw_affiliation_string":"North South University, Dhaka, Bangladesh","institution_ids":["https://openalex.org/I157386601"]},{"raw_affiliation_string":"[North South University]","institution_ids":["https://openalex.org/I157386601"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062072064","display_name":"Nabeel Mohammed","orcid":"https://orcid.org/0000-0002-7661-3570"},"institutions":[{"id":"https://openalex.org/I157386601","display_name":"North South University","ror":"https://ror.org/05wdbfp45","country_code":"BD","type":"education","lineage":["https://openalex.org/I157386601"]}],"countries":["BD"],"is_corresponding":false,"raw_author_name":"Nabeel Mohammed","raw_affiliation_strings":["North South University, Dhaka, Bangladesh","[North South University]"],"affiliations":[{"raw_affiliation_string":"North South University, Dhaka, Bangladesh","institution_ids":["https://openalex.org/I157386601"]},{"raw_affiliation_string":"[North South University]","institution_ids":["https://openalex.org/I157386601"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5010392592"],"corresponding_institution_ids":["https://openalex.org/I157386601"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.11555114,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/softmax-function","display_name":"Softmax function","score":0.8560370206832886},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7945536375045776},{"id":"https://openalex.org/keywords/biometrics","display_name":"Biometrics","score":0.6027331352233887},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5979059934616089},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.558716893196106},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.522579550743103},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5008499622344971},{"id":"https://openalex.org/keywords/facial-recognition-system","display_name":"Facial recognition system","score":0.4960807263851166},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.45951688289642334},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.42095986008644104},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41611596941947937}],"concepts":[{"id":"https://openalex.org/C188441871","wikidata":"https://www.wikidata.org/wiki/Q7554146","display_name":"Softmax function","level":3,"score":0.8560370206832886},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7945536375045776},{"id":"https://openalex.org/C184297639","wikidata":"https://www.wikidata.org/wiki/Q177765","display_name":"Biometrics","level":2,"score":0.6027331352233887},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5979059934616089},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.558716893196106},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.522579550743103},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5008499622344971},{"id":"https://openalex.org/C31510193","wikidata":"https://www.wikidata.org/wiki/Q1192553","display_name":"Facial recognition system","level":3,"score":0.4960807263851166},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.45951688289642334},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.42095986008644104},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41611596941947937}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1109/biosig52210.2021.9548296","is_oa":false,"landing_page_url":"https://doi.org/10.1109/biosig52210.2021.9548296","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Conference of the Biometrics Special Interest Group (BIOSIG)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2108.10714","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2108.10714","pdf_url":"https://arxiv.org/pdf/2108.10714","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"mag:3194417184","is_oa":true,"landing_page_url":"http://arxiv.org/pdf/2108.10714.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"arXiv (Cornell University)","raw_type":null},{"id":"doi:10.48550/arxiv.2108.10714","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2108.10714","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2108.10714","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2108.10714","pdf_url":"https://arxiv.org/pdf/2108.10714","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.8399999737739563,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":17,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W1635512741","https://openalex.org/W1909308924","https://openalex.org/W2046056978","https://openalex.org/W2101261946","https://openalex.org/W2121812409","https://openalex.org/W2150769028","https://openalex.org/W2748488820","https://openalex.org/W2784163702","https://openalex.org/W2915887922","https://openalex.org/W2964052309","https://openalex.org/W2969985801","https://openalex.org/W3035693354","https://openalex.org/W3097523643","https://openalex.org/W3103152812","https://openalex.org/W6639916541","https://openalex.org/W6759004640"],"related_works":["https://openalex.org/W3203902498","https://openalex.org/W3035693354","https://openalex.org/W3162913942","https://openalex.org/W3025075133","https://openalex.org/W3083072141","https://openalex.org/W2890872363","https://openalex.org/W3208068273","https://openalex.org/W2970561365","https://openalex.org/W2907077903","https://openalex.org/W2889565680","https://openalex.org/W3190626620","https://openalex.org/W2995174043","https://openalex.org/W3115774063","https://openalex.org/W2997469299","https://openalex.org/W2982689298","https://openalex.org/W2806138827","https://openalex.org/W3133605945","https://openalex.org/W3086978629","https://openalex.org/W1998752042","https://openalex.org/W3015127654"],"abstract_inverted_index":{"Deep":[0],"learning":[1],"models":[2],"have":[3],"become":[4],"an":[5,132],"increasingly":[6],"preferred":[7],"option":[8],"for":[9,61],"biometric":[10,94],"recognition":[11,27],"systems,":[12],"such":[13,96,103],"as":[14,97,115,117],"speaker":[15,26],"recognition.":[16,99],"SincNet,":[17],"a":[18,104,139,187],"deep":[19],"neural":[20],"network":[21],"architecture,":[22],"gained":[23],"popularity":[24],"in":[25,92],"tasks":[28],"due":[29],"to":[30,38,119,143,194],"its":[31],"parameterized":[32],"sinc":[33],"functions":[34,66],"that":[35,109],"allow":[36],"it":[37,110,180],"work":[39],"directly":[40],"on":[41,153],"the":[42,50,57,145,165,175,182],"speech":[43],"signal.":[44],"The":[45,100,148],"original":[46],"SincNet":[47,134,146,195],"architecture":[48],"uses":[49],"softmax":[51],"loss,":[52],"which":[53],"may":[54],"not":[55,68],"be":[56],"most":[58],"suitable":[59],"choice":[60],"recognition-based":[62],"tasks.":[63],"Such":[64],"loss":[65,141],"do":[67],"impose":[69,112],"inter-class":[70,113],"margins":[71,114],"nor":[72],"differentiate":[73],"between":[74],"easy":[75,121],"and":[76,122,158,196],"hard":[77,123],"training":[78],"samples.":[79,124],"Curriculum":[80],"learning,":[81],"particularly":[82],"those":[83],"leveraging":[84],"angular":[85],"margin-based":[86],"losses,":[87],"has":[88],"proven":[89],"very":[90],"successful":[91],"other":[93,170,197],"applications":[95],"face":[98],"advantage":[101],"of":[102,177,189],"curriculum":[105],"learning-based":[106],"techniques":[107],"is":[108,151],"will":[111],"well":[116],"taking":[118],"account":[120],"In":[125,162,174],"this":[126],"paper,":[127],"we":[128,137],"propose":[129],"Curricular":[130],"SincNet(CL-SincNet),":[131],"improved":[133],"model":[135,150,166],"where":[136],"use":[138],"curricular":[140],"function":[142],"train":[144],"architecture.":[147],"proposed":[149],"evaluated":[152],"multiple":[154],"datasets":[155],"using":[156],"intra-dataset":[157],"inter-dataset":[159,178],"evaluation":[160],"protocols.":[161],"both":[163],"settings,":[164],"performs":[167],"competitively":[168],"with":[169,186],"previously":[171],"published":[172,198],"work.":[173,199],"case":[176],"testing,":[179],"achieves":[181],"best":[183],"overall":[184],"results":[185],"reduction":[188],"4%":[190],"error":[191],"rate":[192],"compare":[193]},"counts_by_year":[],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
