{"id":"https://openalex.org/W3163350809","doi":"https://doi.org/10.1109/kst51265.2021.9415832","title":"Improvement of Text-Independent Speaker Verification Using Gender-like Feature","display_name":"Improvement of Text-Independent Speaker Verification Using Gender-like Feature","publication_year":2021,"publication_date":"2021-01-21","ids":{"openalex":"https://openalex.org/W3163350809","doi":"https://doi.org/10.1109/kst51265.2021.9415832","mag":"3163350809"},"language":"en","primary_location":{"id":"doi:10.1109/kst51265.2021.9415832","is_oa":false,"landing_page_url":"https://doi.org/10.1109/kst51265.2021.9415832","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 13th International Conference on Knowledge and Smart Technology (KST)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5003927462","display_name":"Pornprom Kiawjak","orcid":null},"institutions":[{"id":"https://openalex.org/I91538806","display_name":"King Mongkut's Institute of Technology Ladkrabang","ror":"https://ror.org/055mf0v62","country_code":"TH","type":"education","lineage":["https://openalex.org/I91538806"]}],"countries":["TH"],"is_corresponding":true,"raw_author_name":"Pornprom Kiawjak","raw_affiliation_strings":["Faculty of Information Technology, King Mongkut's Institute of Technology Ladkrabang, Bangkok, Thailand"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, King Mongkut's Institute of Technology Ladkrabang, Bangkok, Thailand","institution_ids":["https://openalex.org/I91538806"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029657798","display_name":"Somkiat Wangsiripitak","orcid":null},"institutions":[{"id":"https://openalex.org/I91538806","display_name":"King Mongkut's Institute of Technology Ladkrabang","ror":"https://ror.org/055mf0v62","country_code":"TH","type":"education","lineage":["https://openalex.org/I91538806"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Somkiat Wangsiripitak","raw_affiliation_strings":["Faculty of Information Technology, King Mongkut's Institute of Technology Ladkrabang, Bangkok, Thailand"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, King Mongkut's Institute of Technology Ladkrabang, Bangkok, Thailand","institution_ids":["https://openalex.org/I91538806"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066462028","display_name":"Kitsuchart Pasupa","orcid":"https://orcid.org/0000-0001-8359-9888"},"institutions":[{"id":"https://openalex.org/I91538806","display_name":"King Mongkut's Institute of Technology Ladkrabang","ror":"https://ror.org/055mf0v62","country_code":"TH","type":"education","lineage":["https://openalex.org/I91538806"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Kitsuchart Pasupa","raw_affiliation_strings":["Faculty of Information Technology, King Mongkut's Institute of Technology Ladkrabang, Bangkok, Thailand"],"affiliations":[{"raw_affiliation_string":"Faculty of Information Technology, King Mongkut's Institute of Technology Ladkrabang, Bangkok, Thailand","institution_ids":["https://openalex.org/I91538806"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5003927462"],"corresponding_institution_ids":["https://openalex.org/I91538806"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.06062844,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"219","last_page":"224"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9905999898910522,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7569518089294434},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6364179849624634},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.6203768253326416},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.615696370601654},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.607918918132782},{"id":"https://openalex.org/keywords/speaker-verification","display_name":"Speaker verification","score":0.5864039659500122},{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.5647873282432556},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.5093370676040649},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48722735047340393},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.4752887487411499},{"id":"https://openalex.org/keywords/residual-neural-network","display_name":"Residual neural network","score":0.46401748061180115},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.4626726806163788},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.42756757140159607},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.4169846773147583},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.07586044073104858}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7569518089294434},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6364179849624634},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.6203768253326416},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.615696370601654},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.607918918132782},{"id":"https://openalex.org/C2982762665","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker verification","level":3,"score":0.5864039659500122},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.5647873282432556},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.5093370676040649},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48722735047340393},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.4752887487411499},{"id":"https://openalex.org/C2944601119","wikidata":"https://www.wikidata.org/wiki/Q43744058","display_name":"Residual neural network","level":3,"score":0.46401748061180115},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.4626726806163788},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.42756757140159607},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.4169846773147583},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.07586044073104858},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/kst51265.2021.9415832","is_oa":false,"landing_page_url":"https://doi.org/10.1109/kst51265.2021.9415832","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 13th International Conference on Knowledge and Smart Technology (KST)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6100000143051147,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W2041823554","https://openalex.org/W2046056978","https://openalex.org/W2096733369","https://openalex.org/W2107638917","https://openalex.org/W2114925438","https://openalex.org/W2121750345","https://openalex.org/W2147147599","https://openalex.org/W2395750323","https://openalex.org/W2402195372","https://openalex.org/W2618530766","https://openalex.org/W2726515241","https://openalex.org/W2808631503","https://openalex.org/W2894176037","https://openalex.org/W2916104401","https://openalex.org/W2963095666","https://openalex.org/W2964307722","https://openalex.org/W3099206234","https://openalex.org/W6713401928","https://openalex.org/W6740167877"],"related_works":["https://openalex.org/W2206035908","https://openalex.org/W2162158162","https://openalex.org/W4235705411","https://openalex.org/W1521299571","https://openalex.org/W4247736853","https://openalex.org/W1493012537","https://openalex.org/W2175373321","https://openalex.org/W2125642021","https://openalex.org/W4310979479","https://openalex.org/W2144470400"],"abstract_inverted_index":{"Text-independent":[0],"speaker":[1,9],"verification":[2,86],"is":[3,37,73,121,148,150,176,200],"a":[4,8,12,42,164,174],"task":[5],"of":[6,14,26,69,87,103,139,145,155,160,171,236],"verifying":[7],"identity":[10,147],"from":[11,59],"characteristic":[13],"voice.":[15],"We":[16],"proposed":[17,91],"the":[18,28,47,55,60,70,77,116,119,123,134,169,206,209,219],"combined":[19,79],"deep":[20,80],"Convolutional":[21],"Neural":[22],"Network":[23],"(CNN)":[24],"consisting":[25],"(i)":[27],"first":[29,192,207],"CNN":[30,49,72,81,92],"trained":[31,50,196],"to":[32,40,62,75,98,190,205],"achieve":[33],"gender":[34,120,144,170],"classification":[35,67],"which":[36,194],"then":[38],"used":[39],"create":[41],"gender-like":[43,56],"embedding":[44],"and":[45,85,186],"(ii)":[46],"last":[48,71],"with":[51,133],"one":[52],"additional":[53],"input,":[54],"feature":[57],"(embedding)":[58],"first,":[61],"classify":[63],"each":[64],"speaker.":[65,89],"The":[66,136],"layer":[68],"removed":[74],"allow":[76],"remaining":[78],"for":[82,184,197,222],"one-shot":[83],"learning":[84],"unobserved":[88],"Our":[90],"could":[93],"obtain":[94],"better":[95],"results":[96,113],"compared":[97,204],"VGGVox":[99,156,232],"(ResNet-50)":[100,157,233],"by":[101,234],"0.40%":[102],"Equal":[104],"Error":[105],"Rate":[106],"(EER)":[107],"on":[108,115,128,158,215],"average.":[109],"Additionally,":[110],"we":[111],"investigated":[112],"based":[114],"scenario":[117],"that":[118,131,142,154,168],"known;":[122],"evaluation":[124],"was":[125,195],"performed":[126,224],"only":[127,143],"utterance":[129],"pairs":[130],"comply":[132],"scenario.":[135],"EER":[137,214],"rate":[138],"such":[140],"case":[141],"claimed":[146],"known":[149],"0.52%":[151],"lower":[152],"than":[153],"average":[159],"two":[161,179,228],"genders.":[162],"In":[163],"more":[165],"specific":[166],"situation":[167],"person":[172],"making":[173],"claim":[175],"also":[177],"known,":[178],"dedicated":[180,221,229],"networks":[181,230],"were":[182],"retrained":[183],"female":[185,210],"male,":[187],"in":[188],"addition":[189],"our":[191,227],"network":[193,211,220],"both.":[198],"It":[199],"interesting":[201],"that,":[202],"when":[203],"network,":[208],"achieved":[212],"less":[213],"female-female":[216],"verification,":[217],"while":[218],"male":[223],"worse.":[225],"Nevertheless,":[226],"outperformed":[231],"0.88%":[235],"EER.":[237]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
