{"id":"https://openalex.org/W2687193347","doi":"https://doi.org/10.1504/ijes.2017.10005717","title":"Prosodic features-based speaker verification using speaker-specific-text for short utterances","display_name":"Prosodic features-based speaker verification using speaker-specific-text for short utterances","publication_year":2017,"publication_date":"2017-01-01","ids":{"openalex":"https://openalex.org/W2687193347","doi":"https://doi.org/10.1504/ijes.2017.10005717","mag":"2687193347"},"language":"en","primary_location":{"id":"doi:10.1504/ijes.2017.10005717","is_oa":false,"landing_page_url":"https://doi.org/10.1504/ijes.2017.10005717","pdf_url":null,"source":{"id":"https://openalex.org/S204369148","display_name":"International Journal of Embedded Systems","issn_l":"1741-1068","issn":["1741-1068","1741-1076"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310317825","host_organization_name":"Inderscience Publishers","host_organization_lineage":["https://openalex.org/P4310317825"],"host_organization_lineage_names":["Inderscience Publishers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Embedded Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017090075","display_name":"Zhendong Wu","orcid":"https://orcid.org/0000-0001-8778-8213"},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhendong Wu","raw_affiliation_strings":["School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, Zhejiang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, Zhejiang, China","institution_ids":["https://openalex.org/I50760025"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084329249","display_name":"Freeha Azmat","orcid":null},"institutions":[{"id":"https://openalex.org/I39555362","display_name":"University of Warwick","ror":"https://ror.org/01a77tt86","country_code":"GB","type":"education","lineage":["https://openalex.org/I39555362"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Freeha Azmat","raw_affiliation_strings":["School of Engineering, University of Warwick, Coventry CV4 7AL, UK"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Engineering, University of Warwick, Coventry CV4 7AL, UK","institution_ids":["https://openalex.org/I39555362"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100435506","display_name":"Ping Li","orcid":"https://orcid.org/0000-0002-3314-943X"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ping Li","raw_affiliation_strings":["School of Mathematics and Computational Science, Sun Yatsen University, Guangzhou, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mathematics and Computational Science, Sun Yatsen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101631859","display_name":"Jianwu Zhang","orcid":"https://orcid.org/0000-0001-8288-8688"},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianwu Zhang","raw_affiliation_strings":["School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, Zhejiang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, Zhejiang, China","institution_ids":["https://openalex.org/I50760025"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013291701","display_name":"Jianchao He","orcid":null},"institutions":[{"id":"https://openalex.org/I50760025","display_name":"Hangzhou Dianzi University","ror":"https://ror.org/0576gt767","country_code":"CN","type":"education","lineage":["https://openalex.org/I50760025"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianchao He","raw_affiliation_strings":["School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, Zhejiang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, Zhejiang, China","institution_ids":["https://openalex.org/I50760025"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0689957,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"9","issue":"3","first_page":"250","last_page":"250"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9818999767303467,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9818999767303467,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/vocal-tract","display_name":"Vocal tract","score":0.8451549410820007},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8042095899581909},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7702387571334839},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.6802499890327454},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.6637674570083618},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.5546407699584961},{"id":"https://openalex.org/keywords/speaker-verification","display_name":"Speaker verification","score":0.5458117723464966},{"id":"https://openalex.org/keywords/formant","display_name":"Formant","score":0.47176554799079895},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.450324684381485},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.44884759187698364},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.42816710472106934},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.38245606422424316},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.24922913312911987},{"id":"https://openalex.org/keywords/vowel","display_name":"Vowel","score":0.06471717357635498}],"concepts":[{"id":"https://openalex.org/C47401133","wikidata":"https://www.wikidata.org/wiki/Q748953","display_name":"Vocal tract","level":2,"score":0.8451549410820007},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8042095899581909},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7702387571334839},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.6802499890327454},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.6637674570083618},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.5546407699584961},{"id":"https://openalex.org/C2982762665","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker verification","level":3,"score":0.5458117723464966},{"id":"https://openalex.org/C158215666","wikidata":"https://www.wikidata.org/wiki/Q1414685","display_name":"Formant","level":3,"score":0.47176554799079895},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.450324684381485},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.44884759187698364},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42816710472106934},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.38245606422424316},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.24922913312911987},{"id":"https://openalex.org/C2779581591","wikidata":"https://www.wikidata.org/wiki/Q36244","display_name":"Vowel","level":2,"score":0.06471717357635498}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1504/ijes.2017.10005717","is_oa":false,"landing_page_url":"https://doi.org/10.1504/ijes.2017.10005717","pdf_url":null,"source":{"id":"https://openalex.org/S204369148","display_name":"International Journal of Embedded Systems","issn_l":"1741-1068","issn":["1741-1068","1741-1076"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310317825","host_organization_name":"Inderscience Publishers","host_organization_lineage":["https://openalex.org/P4310317825"],"host_organization_lineage_names":["Inderscience Publishers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Embedded Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4699999988079071,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2100012411","https://openalex.org/W1482212662","https://openalex.org/W3162157266","https://openalex.org/W2162084437","https://openalex.org/W1997579527","https://openalex.org/W2102353451","https://openalex.org/W3044927199","https://openalex.org/W2018086531","https://openalex.org/W1980297060","https://openalex.org/W2387604097"],"abstract_inverted_index":{"Over":[0],"the":[1,47,50,73,77,97,105,112,150],"past":[2],"several":[3],"years,":[4],"Gaussian":[5],"mixture":[6],"model":[7],"and":[8,17,53,66],"its":[9],"variants":[10],"have":[11],"been":[12],"dominant":[13],"architectures":[14],"in":[15,35,56,128,136],"text-independent":[16],"text-dependent":[18,85],"speaker":[19,88,108,121],"recognition":[20,23,98,153],"field.":[21],"The":[22],"accuracy":[24],"of":[25,49,79,107,114],"above-mentioned":[26],"models":[27],"declines":[28],"when":[29],"experimental":[30],"utterances'":[31],"length":[32],"becomes":[33],"short":[34,86],"practical":[36],"application.":[37],"Presently,":[38],"Mel-frequency":[39],"cepstral":[40],"coefficients":[41],"are":[42,68],"generally":[43,69],"used":[44,135],"to":[45,71,95,103,138],"characterise":[46],"properties":[48],"vocal":[51,140],"tract":[52,141],"widely":[54],"applied":[55],"speech":[57,152],"recognition.":[58],"In":[59,84,101],"addition,":[60],"prosodic":[61,91,126,144],"features,":[62,127],"such":[63],"as":[64],"pitch":[65],"formant,":[67],"considered":[70],"describe":[72],"glottal":[74],"characteristics.":[75],"However,":[76],"efficiency":[78],"those":[80],"approaches":[81],"remains":[82],"unsatisfactory.":[83],"utterance":[87],"verification":[89,109,122],"systems,":[90],"features":[92,142],"can":[93],"assist":[94],"improve":[96],"result":[99],"theoretically.":[100],"order":[102,137],"optimise":[104],"performance":[106],"systems":[110],"under":[111],"framework":[113],"adapted":[115],"GMM-UBM,":[116],"we":[117],"adopt":[118],"a":[119,130,156],"variant":[120],"system":[123,154],"based":[124],"on":[125],"which":[129],"dual":[131],"judgement":[132],"mechanism":[133],"is":[134],"integrate":[139],"with":[143],"features.":[145],"Experimental":[146],"results":[147],"showed":[148],"that":[149],"new":[151],"gives":[155],"better":[157],"consequence.":[158]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
