{"id":"https://openalex.org/W170533338","doi":"https://doi.org/10.21437/eurospeech.2003-723","title":"syncpitch: a pseudo pitch synchronous algorithm for speaker recognition","display_name":"syncpitch: a pseudo pitch synchronous algorithm for speaker recognition","publication_year":2003,"publication_date":"2003-09-01","ids":{"openalex":"https://openalex.org/W170533338","doi":"https://doi.org/10.21437/eurospeech.2003-723","mag":"170533338"},"language":"en","primary_location":{"id":"doi:10.21437/eurospeech.2003-723","is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.2003-723","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"8th European Conference on Speech Communication and Technology (Eurospeech 2003)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050001246","display_name":"Ran D. Zilca","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ran D. Zilca","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039085741","display_name":"Ji\u0159\u00ed Navr\u00e1til","orcid":"https://orcid.org/0000-0001-6348-0812"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiri Navratil","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5111944718","display_name":"Ganesh N. Ramaswamy","orcid":"https://orcid.org/0009-0002-8015-0844"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ganesh N. Ramaswamy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.4065,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.83819385,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"2649","last_page":"2652"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7905595302581787},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7454866766929626},{"id":"https://openalex.org/keywords/pitch-detection-algorithm","display_name":"Pitch detection algorithm","score":0.7083650827407837},{"id":"https://openalex.org/keywords/nist","display_name":"NIST","score":0.6999881267547607},{"id":"https://openalex.org/keywords/cepstrum","display_name":"Cepstrum","score":0.6421142816543579},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.5963661074638367},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.5507614612579346},{"id":"https://openalex.org/keywords/signal","display_name":"SIGNAL (programming language)","score":0.5434392690658569},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.5201566815376282},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.5016145706176758},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.48760882019996643},{"id":"https://openalex.org/keywords/mel-frequency-cepstrum","display_name":"Mel-frequency cepstrum","score":0.46865859627723694},{"id":"https://openalex.org/keywords/signal-processing","display_name":"Signal processing","score":0.41691070795059204},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3761812448501587},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.30152270197868347},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.2774519622325897},{"id":"https://openalex.org/keywords/digital-signal-processing","display_name":"Digital signal processing","score":0.1435869038105011}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7905595302581787},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7454866766929626},{"id":"https://openalex.org/C135622632","wikidata":"https://www.wikidata.org/wiki/Q7198851","display_name":"Pitch detection algorithm","level":3,"score":0.7083650827407837},{"id":"https://openalex.org/C111219384","wikidata":"https://www.wikidata.org/wiki/Q6954384","display_name":"NIST","level":2,"score":0.6999881267547607},{"id":"https://openalex.org/C88485024","wikidata":"https://www.wikidata.org/wiki/Q1054571","display_name":"Cepstrum","level":2,"score":0.6421142816543579},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.5963661074638367},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.5507614612579346},{"id":"https://openalex.org/C2779843651","wikidata":"https://www.wikidata.org/wiki/Q7390335","display_name":"SIGNAL (programming language)","level":2,"score":0.5434392690658569},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5201566815376282},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.5016145706176758},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.48760882019996643},{"id":"https://openalex.org/C151989614","wikidata":"https://www.wikidata.org/wiki/Q440370","display_name":"Mel-frequency cepstrum","level":3,"score":0.46865859627723694},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.41691070795059204},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3761812448501587},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30152270197868347},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2774519622325897},{"id":"https://openalex.org/C84462506","wikidata":"https://www.wikidata.org/wiki/Q173142","display_name":"Digital signal processing","level":2,"score":0.1435869038105011},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/eurospeech.2003-723","is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.2003-723","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"8th European Conference on Speech Communication and Technology (Eurospeech 2003)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.800000011920929,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W86348706","https://openalex.org/W1503442377","https://openalex.org/W1997873121","https://openalex.org/W2014181881","https://openalex.org/W2078953162","https://openalex.org/W2113810833","https://openalex.org/W2139037446","https://openalex.org/W2153408936","https://openalex.org/W2167768673","https://openalex.org/W2397634864"],"related_works":["https://openalex.org/W2018086531","https://openalex.org/W1980297060","https://openalex.org/W2387604097","https://openalex.org/W1963976507","https://openalex.org/W2373675101","https://openalex.org/W3146151004","https://openalex.org/W2141992701","https://openalex.org/W4385672897","https://openalex.org/W106160982","https://openalex.org/W2206035908"],"abstract_inverted_index":{"Pitch":[0],"mismatch":[1],"between":[2],"enrollment":[3],"and":[4,47,83],"testing":[5],"is":[6,15,132],"a":[7,58,85,92,116,129],"common":[8],"problem":[9],"in":[10,29,41,51,139],"speaker":[11,35,136],"recognition":[12],"systems.":[13],"It":[14],"well":[16],"known":[17],"that":[18,64,100],"the":[19,44,71,95,109,121,143],"fine":[20],"spectral":[21],"structure":[22],"related":[23],"to":[24,66,79,134],"fundamental":[25],"frequency":[26],"manifests":[27],"itself":[28],"Mel":[30],"cepstral":[31],"features":[32],"used":[33],"for":[34],"recognition.":[36],"Therefore":[37],"pitch":[38,68,81,87,103,110],"variations":[39],"result":[40],"variation":[42],"of":[43,94,126],"acoustic":[45],"features,":[46],"potentially":[48],"an":[49],"increase":[50],"error":[52],"rate.":[53],"A":[54],"previous":[55],"study":[56],"introduced":[57],"signal":[59,73],"processing":[60,105],"procedure":[61],"termed":[62,98],"depitch":[63,96],"attempts":[65],"remove":[67],"information":[69],"from":[70],"speech":[72,77,122],"by":[74],"forcing":[75],"every":[76],"frame":[78],"be":[80],"synchronous":[82,104],"include":[84],"single":[86],"cycle.":[88],"This":[89],"paper":[90],"presents":[91],"modification":[93],"algorithm,":[97],"syncpitch,":[99],"performs":[101],"pseudo":[102],"while":[106],"still":[107],"preserving":[108],"information.":[111],"The":[112],"new":[113],"algorithm":[114],"has":[115],"relatively":[117],"moderate":[118],"effect":[119],"on":[120,142],"signal.":[123],"System":[124],"combination":[125],"syncpitch":[127],"with":[128],"baseline":[130],"system":[131],"shown":[133],"improve":[135],"verification":[137],"accuracy":[138],"experiments":[140],"conducted":[141],"2002":[144],"NIST":[145],"Speaker":[146],"Recognition":[147],"Evaluation":[148],"data.":[149]},"counts_by_year":[{"year":2014,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
