{"id":"https://openalex.org/W242215465","doi":"https://doi.org/10.21437/eurospeech.1999-189","title":"A new F0 contour control method based on vector representation of F0 contour","display_name":"A new F0 contour control method based on vector representation of F0 contour","publication_year":1999,"publication_date":"1999-09-05","ids":{"openalex":"https://openalex.org/W242215465","doi":"https://doi.org/10.21437/eurospeech.1999-189","mag":"242215465"},"language":"en","primary_location":{"id":"doi:10.21437/eurospeech.1999-189","is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.1999-189","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"6th European Conference on Speech Communication and Technology","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019776478","display_name":"Mitsuaki Isogai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mitsuaki Isogai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5102842694","display_name":"Hideyuki Mizuno","orcid":"https://orcid.org/0000-0002-2591-7152"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hideyuki Mizuno","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.5207,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.72726757,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"727","last_page":"730"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9801999926567078,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7733244895935059},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.7573531866073608},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.7325092554092407},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6974924206733704},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.688339352607727},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.6118508577346802},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.565680205821991},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.5656185746192932},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5395447611808777},{"id":"https://openalex.org/keywords/image-warping","display_name":"Image warping","score":0.5298808813095093},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.4561544954776764}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7733244895935059},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.7573531866073608},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.7325092554092407},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6974924206733704},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.688339352607727},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.6118508577346802},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.565680205821991},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.5656185746192932},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5395447611808777},{"id":"https://openalex.org/C157202957","wikidata":"https://www.wikidata.org/wiki/Q1659609","display_name":"Image warping","level":2,"score":0.5298808813095093},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.4561544954776764}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/eurospeech.1999-189","is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.1999-189","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"6th European Conference on Speech Communication and Technology","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.75,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W1533051419","https://openalex.org/W1985979081","https://openalex.org/W2050693797","https://openalex.org/W2093450784","https://openalex.org/W2096494729","https://openalex.org/W2116893836","https://openalex.org/W2136859047","https://openalex.org/W2148154194","https://openalex.org/W2167307239"],"related_works":["https://openalex.org/W2990982991","https://openalex.org/W2146591867","https://openalex.org/W2048014685","https://openalex.org/W2370972896","https://openalex.org/W3119288895","https://openalex.org/W3148366653","https://openalex.org/W2185075503","https://openalex.org/W1197719229","https://openalex.org/W2381158726","https://openalex.org/W1992796048"],"abstract_inverted_index":{"This":[0],"paper":[1],"describes":[2],"a":[3,21,30,72],"new":[4],"framework":[5],"for":[6,49],"designing":[7],"speaker":[8,36],"recognition":[9],"systems":[10,100],"based":[11,70],"on":[12,71],"the":[13,26,44,55,60,64,68,82,95,103,112],"discriminative":[14],"feature":[15,27,61],"extraction":[16],"(DFE)":[17],"method.":[18],"We":[19,52],"apply":[20],"mel-cepstral":[22,40],"estimation":[23,41],"technique":[24,42],"to":[25],"extractor":[28,62],"in":[29,109],"Gaussian":[31],"mixture":[32],"model":[33],"(GMM)-based":[34],"text-independent":[35],"identification":[37],"system.":[38],"The":[39],"uses":[43],"second-order":[45],"all-pass":[46],"warping":[47,57],"function":[48],"frequency":[50,56,83],"transformation.":[51],"jointly":[53],"optimize":[54],"parameters":[58,66],"of":[59,67],"and":[63],"GMM":[65],"classifier":[69,113],"minimum":[73],"classification":[74],"error":[75],"(MCE)":[76],"criterion.":[77],"Experimental":[78],"results":[79],"show":[80],"that":[81],"warped":[84],"scale":[85],"after":[86],"optimization":[87],"is":[88,114],"different":[89],"from":[90],"traditional":[91],"linear/mel":[92],"scales;":[93],"moreover,":[94],"proposed":[96],"system":[97],"outperforms":[98],"conventional":[99],"trained":[101],"with":[102],"generalized":[104],"probabilistic":[105],"descent":[106],"(GPD)":[107],"method":[108],"which":[110],"only":[111],"optimized.":[115]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2016-06-24T00:00:00"}
