{"id":"https://openalex.org/W2086547315","doi":"https://doi.org/10.1002/scj.4690190606","title":"Speaker identification based on frequency distribution of vector\u2010quantized spectra","display_name":"Speaker identification based on frequency distribution of vector\u2010quantized spectra","publication_year":1988,"publication_date":"1988-06-01","ids":{"openalex":"https://openalex.org/W2086547315","doi":"https://doi.org/10.1002/scj.4690190606","mag":"2086547315"},"language":"en","primary_location":{"id":"doi:10.1002/scj.4690190606","is_oa":false,"landing_page_url":"https://doi.org/10.1002/scj.4690190606","pdf_url":null,"source":{"id":"https://openalex.org/S58208175","display_name":"Systems and Computers in Japan","issn_l":"0882-1666","issn":["0882-1666","1520-684X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Systems and Computers in Japan","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109058482","display_name":"Katsuhiko Shirai","orcid":null},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Katsuhiko Shirai","raw_affiliation_strings":["Katsuhiko Shirai graduated 1963 Dept. Electrical Eng., School of Sci. & Eng., Waseda Univ. Completed doctoral program 1968 Grad. School. Affiliated with Waseda Univ. since 1965, and presently, Prof. Dept. Electrical Eng. Doctor of Eng. Engaged in research on man-machine systems, such as speech recognition, speech synthesis, natural language processing and cognitive science. Member, Acoust. SOC. Jap.; and I.E.E.E","School of Science and Engineering, Waseda University, Tokyo, Japan 160","I.E.E.E","Katsuhiko Shirai graduated 1963 Dept. Electrical Eng., School of Sci. & Eng., Waseda Univ. Completed doctoral program 1968 Grad. School. Affiliated with Waseda Univ. since 1965, and presently, Prof. Dept. Electrical Eng. Doctor of Eng. Engaged in research on man-machine systems, such as speech recognition, speech synthesis, natural language processing and cognitive science. Member, Acoust. SOC. Jap"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Katsuhiko Shirai graduated 1963 Dept. Electrical Eng., School of Sci. & Eng., Waseda Univ. Completed doctoral program 1968 Grad. School. Affiliated with Waseda Univ. since 1965, and presently, Prof. Dept. Electrical Eng. Doctor of Eng. Engaged in research on man-machine systems, such as speech recognition, speech synthesis, natural language processing and cognitive science. Member, Acoust. SOC. Jap.; and I.E.E.E","institution_ids":["https://openalex.org/I150744194"]},{"raw_affiliation_string":"School of Science and Engineering, Waseda University, Tokyo, Japan 160","institution_ids":["https://openalex.org/I150744194"]},{"raw_affiliation_string":"I.E.E.E","institution_ids":[]},{"raw_affiliation_string":"Katsuhiko Shirai graduated 1963 Dept. Electrical Eng., School of Sci. & Eng., Waseda Univ. Completed doctoral program 1968 Grad. School. Affiliated with Waseda Univ. since 1965, and presently, Prof. Dept. Electrical Eng. Doctor of Eng. Engaged in research on man-machine systems, such as speech recognition, speech synthesis, natural language processing and cognitive science. Member, Acoust. SOC. Jap","institution_ids":["https://openalex.org/I150744194"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082062172","display_name":"Kazunori Mano","orcid":null},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]},{"id":"https://openalex.org/I4210156427","display_name":"ProCure (United States)","ror":"https://ror.org/04cdebn34","country_code":"US","type":"company","lineage":["https://openalex.org/I4210156427"]},{"id":"https://openalex.org/I4588055","display_name":"Tottori University","ror":"https://ror.org/024yc3q36","country_code":"JP","type":"education","lineage":["https://openalex.org/I4588055"]}],"countries":["JP","US"],"is_corresponding":false,"raw_author_name":"Kazunori Mano","raw_affiliation_strings":["Kazunori Mano graduated 1982 Dept. Electrical Eng., School of Sci. & Eng. Completed doctoral program 1987 Grad. School. Doctor of Eng. Assistant 1984-87 Centre for Informatics, Waseda Univ. Since 1987, affiliated with NTT. Engaged in research on speech recognition and speaker recognition. Member, Acoust. SOC. Jap.; and Inf. Proc. SOC. Japan","School of Science and Engineering, Waseda University, Tokyo, Japan 160","Inf. Proc. SOC. Japan","Kazunori Mano graduated 1982 Dept. Electrical Eng., School of Sci. & Eng. Completed doctoral program 1987 Grad. School. Doctor of Eng. Assistant 1984-87 Centre for Informatics, Waseda Univ. Since 1987, affiliated with NTT. Engaged in research on speech recognition and speaker recognition. Member, Acoust. SOC. Jap"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Kazunori Mano graduated 1982 Dept. Electrical Eng., School of Sci. & Eng. Completed doctoral program 1987 Grad. School. Doctor of Eng. Assistant 1984-87 Centre for Informatics, Waseda Univ. Since 1987, affiliated with NTT. Engaged in research on speech recognition and speaker recognition. Member, Acoust. SOC. Jap.; and Inf. Proc. SOC. Japan","institution_ids":["https://openalex.org/I4588055"]},{"raw_affiliation_string":"School of Science and Engineering, Waseda University, Tokyo, Japan 160","institution_ids":["https://openalex.org/I150744194"]},{"raw_affiliation_string":"Inf. Proc. SOC. Japan","institution_ids":["https://openalex.org/I4210156427"]},{"raw_affiliation_string":"Kazunori Mano graduated 1982 Dept. Electrical Eng., School of Sci. & Eng. Completed doctoral program 1987 Grad. School. Doctor of Eng. Assistant 1984-87 Centre for Informatics, Waseda Univ. Since 1987, affiliated with NTT. Engaged in research on speech recognition and speaker recognition. Member, Acoust. SOC. Jap","institution_ids":["https://openalex.org/I4588055"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050645997","display_name":"Shunichi Ishige","orcid":null},"institutions":[{"id":"https://openalex.org/I1304132090","display_name":"Sony (Taiwan)","ror":"https://ror.org/0214y7014","country_code":"TW","type":"company","lineage":["https://openalex.org/I1304132090","https://openalex.org/I4210143797"]},{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP","TW"],"is_corresponding":false,"raw_author_name":"Shunichi Ishige","raw_affiliation_strings":["School of Science and Engineering, Waseda University, Tokyo, Japan 160","Shunichi Ishige graduated 1985 Dept. Electrical Eng., School of Sci. & Eng., Waseda Univ. Completed Master's program 1987 Grad. School. Since 1987, affiliated with Sony Corp. In Grad. School, engaged in research on speaker recognition. Member, Acoust. SOC. Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Science and Engineering, Waseda University, Tokyo, Japan 160","institution_ids":["https://openalex.org/I150744194"]},{"raw_affiliation_string":"Shunichi Ishige graduated 1985 Dept. Electrical Eng., School of Sci. & Eng., Waseda Univ. Completed Master's program 1987 Grad. School. Since 1987, affiliated with Sony Corp. In Grad. School, engaged in research on speaker recognition. Member, Acoust. SOC. Japan","institution_ids":["https://openalex.org/I1304132090"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5109058482"],"corresponding_institution_ids":["https://openalex.org/I150744194"],"apc_list":null,"apc_paid":null,"fwci":0.6629,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.75450045,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"19","issue":"6","first_page":"63","last_page":"72"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/vector-quantization","display_name":"Vector quantization","score":0.8410279750823975},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.7075274586677551},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7014225721359253},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.6937400698661804},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.6888700127601624},{"id":"https://openalex.org/keywords/quantization","display_name":"Quantization (signal processing)","score":0.6417153477668762},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6014150381088257},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5733628273010254},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.5311720967292786},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.5126551985740662},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.45340201258659363},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.35360169410705566},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2750382721424103}],"concepts":[{"id":"https://openalex.org/C199833920","wikidata":"https://www.wikidata.org/wiki/Q612536","display_name":"Vector quantization","level":2,"score":0.8410279750823975},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.7075274586677551},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7014225721359253},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.6937400698661804},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.6888700127601624},{"id":"https://openalex.org/C28855332","wikidata":"https://www.wikidata.org/wiki/Q198099","display_name":"Quantization (signal processing)","level":2,"score":0.6417153477668762},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6014150381088257},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5733628273010254},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.5311720967292786},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.5126551985740662},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45340201258659363},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.35360169410705566},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2750382721424103}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1002/scj.4690190606","is_oa":false,"landing_page_url":"https://doi.org/10.1002/scj.4690190606","pdf_url":null,"source":{"id":"https://openalex.org/S58208175","display_name":"Systems and Computers in Japan","issn_l":"0882-1666","issn":["0882-1666","1520-684X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Systems and Computers in Japan","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W1791154168","https://openalex.org/W1945356021","https://openalex.org/W2069976350","https://openalex.org/W2084781109","https://openalex.org/W2114706887","https://openalex.org/W2125952316","https://openalex.org/W2134383396","https://openalex.org/W2155634954","https://openalex.org/W2158921262","https://openalex.org/W2585529150"],"related_works":["https://openalex.org/W4246349004","https://openalex.org/W2181871477","https://openalex.org/W2061163896","https://openalex.org/W2018086531","https://openalex.org/W1980297060","https://openalex.org/W2387604097","https://openalex.org/W2432604435","https://openalex.org/W2787035864","https://openalex.org/W2373675101","https://openalex.org/W2511460115"],"abstract_inverted_index":{"Abstract":[0],"At":[1],"present,":[2],"one":[3],"of":[4,18,30,62,71,76,128,146,156,165,187,201],"the":[5,16,22,28,34,37,51,56,60,63,68,72,77,98,102,105,109,113,116,120,126,129,135,147,162,175,179,193,209],"most":[6],"important":[7],"problems":[8],"in":[9,101],"speech":[10,23],"recognition":[11,14],"and":[12,36,82,125,196],"speaker":[13,39],"is":[15,48,55,84,94],"extraction":[17,29],"individual":[19,31,69],"information":[20,32,40],"from":[21,174],"waveform.":[24],"This":[25],"paper":[26],"describes":[27],"by":[33,59,86,112,161],"vector\u2010quantization":[35,64],"text\u2010independent":[38],"based":[41],"on":[42],"that":[43],"method.":[44],"A":[45],"feature":[46,78,96,118],"vector":[47,79],"proposed":[49],"for":[50,104,122,150,167,192,206],"first":[52,194],"time":[53],"which":[54,171],"quantized":[57],"distribution":[58,93,99,164],"frequency":[61],"code":[65],"to":[66,133,208],"represent":[67],"features":[70],"speaker.":[73],"The":[74,91,138],"properties":[75],"are":[80,131,141,172],"investigated,":[81],"effectiveness":[83],"verified":[85],"an":[87,153,184],"actual":[88],"speaker\u2010identification":[89],"experiment.":[90],"quantization":[92,136,163],"a":[95,144,197],"representing":[97],"density":[100],"space":[103],"acoustic":[106,117],"features,":[107],"e.g.,":[108],"spectrum":[110],"uttered":[111],"individual.":[114],"As":[115,143],"parameters,":[119],"cepstrum":[121,166],"stationary":[123],"part,":[124],"change":[127],"cepstrum,":[130],"used":[132],"construct":[134],"distribution.":[137],"identification":[139,148,154,185,199],"rates":[140],"compared.":[142],"result":[145],"experiment":[149,180],"10":[151,168],"speakers,":[152,183],"rate":[155,186,200],"100":[157],"percent":[158,189,203],"was":[159,190,204],"achieved":[160,191,205],"input":[169],"words,":[170],"different":[173],"training":[176],"samples.":[177],"In":[178],"using":[181],"200":[182],"88":[188],"candidates,":[195],"cumulative":[198],"95":[202],"up":[207],"second":[210],"candidate.":[211]},"counts_by_year":[],"updated_date":"2026-05-21T06:26:12.895304","created_date":"2025-10-10T00:00:00"}
