{"id":"https://openalex.org/W105892654","doi":"https://doi.org/10.21437/interspeech.2004-382","title":"Graphical model approach to pitch tracking","display_name":"Graphical model approach to pitch tracking","publication_year":2004,"publication_date":"2004-10-04","ids":{"openalex":"https://openalex.org/W105892654","doi":"https://doi.org/10.21437/interspeech.2004-382","mag":"105892654"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2004-382","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2004-382","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2004","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102969086","display_name":"Xiao Li","orcid":"https://orcid.org/0000-0003-2425-4577"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Xiao Li","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111946966","display_name":"Jonathan Malkin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jonathan Malkin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5113478221","display_name":"Jeff Bilmes","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jeff Bilmes","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102969086"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.8569,"has_fulltext":false,"cited_by_count":12,"citation_normalized_percentile":{"value":0.90442866,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1101","last_page":"1104"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/graphical-model","display_name":"Graphical model","score":0.8216785192489624},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7159709930419922},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.6978896856307983},{"id":"https://openalex.org/keywords/bittorrent-tracker","display_name":"BitTorrent tracker","score":0.6386638879776001},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4974561035633087},{"id":"https://openalex.org/keywords/voice","display_name":"Voice","score":0.4962649941444397},{"id":"https://openalex.org/keywords/pitch-detection-algorithm","display_name":"Pitch detection algorithm","score":0.44786328077316284},{"id":"https://openalex.org/keywords/dynamic-programming","display_name":"Dynamic programming","score":0.42471417784690857},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.4115750193595886},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3168085813522339},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.2571659982204437},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2422334849834442},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.1492336392402649},{"id":"https://openalex.org/keywords/eye-tracking","display_name":"Eye tracking","score":0.12712082266807556}],"concepts":[{"id":"https://openalex.org/C155846161","wikidata":"https://www.wikidata.org/wiki/Q1143367","display_name":"Graphical model","level":2,"score":0.8216785192489624},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7159709930419922},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.6978896856307983},{"id":"https://openalex.org/C57501372","wikidata":"https://www.wikidata.org/wiki/Q2021268","display_name":"BitTorrent tracker","level":3,"score":0.6386638879776001},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4974561035633087},{"id":"https://openalex.org/C552089266","wikidata":"https://www.wikidata.org/wiki/Q494510","display_name":"Voice","level":2,"score":0.4962649941444397},{"id":"https://openalex.org/C135622632","wikidata":"https://www.wikidata.org/wiki/Q7198851","display_name":"Pitch detection algorithm","level":3,"score":0.44786328077316284},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.42471417784690857},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.4115750193595886},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3168085813522339},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.2571659982204437},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2422334849834442},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.1492336392402649},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.12712082266807556},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2004-382","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2004-382","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2004","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.2.6088","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.2.6088","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://ssli.ee.washington.edu/people/bilmes/mypapers/li_icslp04.ps.gz","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions","score":0.47999998927116394}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W86348706","https://openalex.org/W1496562625","https://openalex.org/W1976611840","https://openalex.org/W1995966271","https://openalex.org/W2084562624","https://openalex.org/W2088632109","https://openalex.org/W2091425152","https://openalex.org/W2122678358","https://openalex.org/W2142040441","https://openalex.org/W2171840027"],"related_works":["https://openalex.org/W2036753972","https://openalex.org/W1996861825","https://openalex.org/W2497205885","https://openalex.org/W2079621619","https://openalex.org/W2117854015","https://openalex.org/W2044564457","https://openalex.org/W1548784694","https://openalex.org/W2111139066","https://openalex.org/W2387387595","https://openalex.org/W284503395"],"abstract_inverted_index":{"Many":[0],"pitch":[1,54,67,103,113],"trackers":[2],"based":[3],"on":[4],"dynamic":[5],"programming":[6],"require":[7],"meticulous":[8],"design":[9,100],"of":[10,19,41,77,101],"local":[11],"cost":[12,15],"and":[13,26,69,80,115],"transition":[14,68],"functions.":[16],"The":[17],"forms":[18],"these":[20],"functions":[21],"are":[22,29,72],"often":[23],"empirically":[24],"determined":[25],"their":[27],"parameters":[28,56],"tuned":[30],"accordingly.":[31],"Parameter":[32],"tuning":[33],"usually":[34],"requires":[35],"great":[36],"effort":[37],"without":[38],"a":[39,47,102],"guarantee":[40],"optimal":[42],"performance.":[43],"This":[44],"work":[45],"presents":[46],"graphical":[48,78],"model":[49],"framework":[50,95],"to":[51],"automatically":[52],"optimize":[53],"tracking":[55],"in":[57],"the":[58,75,86,99],"maximum":[59],"likelihood":[60],"sense.":[61],"Therein,":[62],"probabilistic":[63,81],"dependencies":[64],"between":[65],"pitch,":[66],"acoustical":[70],"observations":[71],"expressed":[73],"using":[74,85],"language":[76],"models,":[79],"inference":[82],"is":[83],"accomplished":[84],"Graphical":[87],"Model":[88],"Toolkit":[89],"(GMTK).":[90],"Experiments":[91],"show":[92],"that":[93],"this":[94],"not":[96],"only":[97],"expedites":[98],"tracker,":[104],"but":[105],"also":[106],"yields":[107],"remarkably":[108],"good":[109],"performance":[110],"for":[111],"both":[112],"estimation":[114],"voicing":[116],"decision.":[117]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
