{"id":"https://openalex.org/W123670871","doi":"https://doi.org/10.21437/eurospeech.1997-179","title":"Voice mimic system using an articulatory codebook for estimation of vocal tract shape","display_name":"Voice mimic system using an articulatory codebook for estimation of vocal tract shape","publication_year":1997,"publication_date":"1997-09-22","ids":{"openalex":"https://openalex.org/W123670871","doi":"https://doi.org/10.21437/eurospeech.1997-179","mag":"123670871"},"language":"en","primary_location":{"id":"doi:10.21437/eurospeech.1997-179","is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.1997-179","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"5th European Conference on Speech Communication and Technology (Eurospeech 1997)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084174219","display_name":"Samir Chennoukh","orcid":null},"institutions":[{"id":"https://openalex.org/I102322142","display_name":"Rutgers, The State University of New Jersey","ror":"https://ror.org/05vt9qd57","country_code":"US","type":"education","lineage":["https://openalex.org/I102322142"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Samir Chennoukh","raw_affiliation_strings":["Rutgers, University"],"affiliations":[{"raw_affiliation_string":"Rutgers, University","institution_ids":["https://openalex.org/I102322142"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108467953","display_name":"Daniel J. Sinder","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Daniel Sinder","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113927018","display_name":"Ga\u00ebl Richard","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gael Richard","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5013430347","display_name":"James L. Flanagan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"James L. Flanagan","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5084174219"],"corresponding_institution_ids":["https://openalex.org/I102322142"],"apc_list":null,"apc_paid":null,"fwci":1.1701,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.8049445,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"429","last_page":"432"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/vocal-tract","display_name":"Vocal tract","score":0.7543686628341675},{"id":"https://openalex.org/keywords/codebook","display_name":"Codebook","score":0.7072970867156982},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6380845904350281},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4767518937587738},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4443526268005371},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2684805989265442},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.07984185218811035}],"concepts":[{"id":"https://openalex.org/C47401133","wikidata":"https://www.wikidata.org/wiki/Q748953","display_name":"Vocal tract","level":2,"score":0.7543686628341675},{"id":"https://openalex.org/C127759330","wikidata":"https://www.wikidata.org/wiki/Q637416","display_name":"Codebook","level":2,"score":0.7072970867156982},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6380845904350281},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4767518937587738},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4443526268005371},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2684805989265442},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.07984185218811035}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/eurospeech.1997-179","is_oa":false,"landing_page_url":"https://doi.org/10.21437/eurospeech.1997-179","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"5th European Conference on Speech Communication and Technology (Eurospeech 1997)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":2,"referenced_works":["https://openalex.org/W1995451491","https://openalex.org/W2006775235"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2293149949","https://openalex.org/W2026099691","https://openalex.org/W4284672201","https://openalex.org/W2377486419","https://openalex.org/W2943202426","https://openalex.org/W2052077049","https://openalex.org/W2067459736","https://openalex.org/W2105635394"],"abstract_inverted_index":{"VOICEMIMICSYSTEMUSINGANARTICULATORYCODEBOOKFORESTIMATIONOFVOCALTRACTSHAPES.":[0],"Chennoukh,":[1],"D.":[2],"Sinder,":[3],"G.":[4],"Richard*":[5],"and":[6,63,74,117,284,433,488,582],"J.L.":[7],"FlanaganCenter":[8],"for":[9,12,443,479,608],"Computer":[10],"Aids":[11],"Industrial":[13],"Pro":[14],"ductivity":[15],"(CAIP),":[16],"Rutgers":[17],"University,Piscataway,":[18],"NJ":[19],"08855-1390,":[20],"USA*Matra-Communication,":[21],"rue":[22],"J.P.":[23],"Timbaud,":[24],"78392":[25],"Bois":[26],"d'Arcy,FranceTel.+1":[27],"908-445-0080,":[28],"FAX:":[29],"+1":[30],"908":[31],"445-4775,":[32],"E-mail:chenoukh@caip.rutgers.eduABSTRACTVoice":[33],"mimic":[34,264,460,505],"systems":[35],"using":[36,223],"articulatory":[37,68,180,247,355,531],"co":[38,69,77,93,252,356,366,439,471,481,493,518,532,552,571],"deb":[39,70,78,94,357,367,420,440,472,482,494,519,533,556,572],"o":[40,71,79,95,358,368,421,441,468,473,483,495,520,534,554,557,573],"oks":[41,422],"re-quireaninitialestimateofthevo":[42],"caltractshap":[43,578],"einthe":[44],"vicinity":[45,328],"of":[46,59,90,132,167,178,201,204,227,246,270,329,349,376,389,396,401,427,430,491,502,516,529,541,550,562,569,589,605],"the":[47,67,76,88,104,195,228,271,327,330,341,346,374,377,417,492,499,503,514,517,523,530,539,542,548,551,560,570,586,590,609,614,623],"global":[48,418],"optimum.For":[49],"this":[50,85,125,457],"purp":[51],"ose,we":[52],"need":[53],"to":[54,142,182,266,278,285,302,318,334,339,372,416,465,508],"gather":[55],"a":[56,151,164,207,224,243,287,311,319,365,397,424,437,466,603,616],"large":[57,205,425,438],"set":[58,426,561],"corresp":[60,276],"onding":[61],"articu-latory":[62,304],"acoustic":[64,101,105,300,390,411,434],"data":[65],"in":[66,119,124,194,463],"ok.Thus,":[72],"searching":[73],"accessing":[75],"ok":[80,96,359,369,442,484,496,521,535],"b":[81,170,191,324,404,453],"ecomesa":[82],"di\u000ecult":[83],"task.In":[84],"pap":[86,126],"er,":[87],"design":[89,528],"an":[91,100,216,268,299,303,410,455,475],"artic-ulatory":[92,470],"is":[97,370,536,544,619],"presented":[98],"where":[99,622],"net-work":[102],"sub-samples":[103],"space":[106,395],"such":[107],"that":[108,275,322,383,409],"vo":[109,133,155,229,272,378,447,591],"caltract":[110],"mo":[111,143,225,248,594],"del":[112,144,226,249,450,595],"shap":[113,136,145,158,381,451,565,596],"es":[114,137,148,452],"are":[115,161,307,625],"ordered":[116],"clustered":[118],"thenetwork":[120],"according":[121],"toacousticparameters.Anotherissue":[122],"addressed":[123],"er":[127,487],"concerns":[128],"estimating":[129],"thetra":[130],"jectory":[131],"cal":[134,156,230,273,379,448,592],"tract":[135,157,231,274,380,432,593],"as":[138],"they":[139],"change":[140],"withtime.Sincetheinversemappingfromacousticpa-rameters":[141],"e":[146,159,325,382,405,597],"do":[147],"not":[149],"have":[150],"unique":[152],"so-lution,":[153],"several":[154],"variations":[160],"p":[162,185,292,445,489,500],"ossi-ble.Therefore,":[163],"dynamic":[165,600],"optimization":[166,174,255,314,342],"tra":[168],"jectorieshas":[169],"een":[171,192],"develop":[172],"ed.This":[173],"uses":[175],"dynamicprop":[176],"erties":[177],"each":[179],"parameter":[181],"estimatethe":[183],"next":[184],"osition.1.INTRODUCTIONThestudyofsp":[186],"eechp":[187],"erceptionandpro":[188],"duc-tion":[189],"has":[190],"enhanced":[193],"last":[196],"two":[197,509],"decades":[198],"by":[199,260],"thedevelopment":[200],"computers":[202],"capable":[203],"amountofcomputation.As":[206],"result,":[208],"Stevens'":[209],"study":[210],"towards":[211],"anarticulatorymo":[212],"delforsp":[213],"eechrecognition-synthesisb":[214],"ecomesmorefeasiblethanitwasintheearlysix-ties([9]).However,":[215],"incomplete":[217],"understanding":[218],"ofsp":[219],"eechpro":[220],"ductionandtheacousticsofpre-ventedusfromachievingStevens'goal.Thegoalwastomimicinputsp":[221],"eechsignalsbyrecognition-synthesis":[222],"area":[232],"func-tionthatcanmimicthesp":[233],"eechsignalswithoutun-derstanding":[234],"their":[235],"structure":[236],"or":[237],"meaning.An":[238],"early":[239],"attempt":[240],"at":[241],"creating":[242],"complete":[244],"computersimulation":[245],"sp":[250,281,398,610],"eech":[251,282,611],"ding":[253],"usingan":[254],"technique":[256],"was":[257],"rep":[258],"orted":[259],"Flanaganetal.([4]).Thesimulationiscalled\\voice":[261],"mimic.The":[262],"voice":[263,504],"attempts":[265],"provide":[267],"articulatorydescription":[269],"onds":[277],"anarbitrary":[279],"natural":[280],"input":[283],"generate":[286],"syn-thetic":[288],"signal":[289,301],"that,":[290],"within":[291,627],"erceptual":[293],"accuracy,":[294],"dupli-catesthenaturalone.Centraltoe":[295],"ortisinverse":[296],"mapping":[297],"from":[298],"description.However,":[305],"acoustic-to-articulatorymappings":[306],"non-unique":[308],"and,":[309],"given":[310,387],"cost":[312],"function,the":[313],"techniques":[315],"converge":[316],"only":[317],"lo":[320],"calextremum":[321],"may":[323,384],"near":[326],"initialparameters.Therefore,":[331],"one":[332,512,628],"needs":[333],"cho":[335],"ose":[336],"accuratestartup":[337],"parameters":[338],"initialize":[340],"pro-cedure.Schro":[343],"eter":[344,581],"andSondhi([8]),whocontinuedalong":[345],"same":[347],"lines":[348],"Flanagan":[350],"et":[351],"al.'s":[352],"study,":[353],"usedan":[354],"prop":[360,584,620],"osed":[361,585,621],"earlier":[362],"byAtal":[363],"etal.([1]).Since":[364],"used":[371],"obtain":[373],"rstestimates":[375],"pro":[385,477,545],"ducea":[386],"combination":[388],"parameters,":[391],"it":[392],"mustbedesignedsuchthatitspansthenatural":[393],"articula-tory":[394],"eaker.Furthermore,":[399],"sampling":[400],"thespace":[402],"must":[403],"ne":[406],"enough":[407],"so":[408],"entryalways":[412],"exists":[413],"very":[414],"close":[415],"optimum.Suchco":[419],"require":[423],"matching":[428],"pairs":[429],"vo-cal":[431],"parameters.The":[435],"complexityofsearching":[436],"all":[444],"ossible":[446],"tractmo":[449],"ecomes":[454],"issue.For":[456],"reason,":[458],"thevoice":[459],"system":[461,506],"needs,":[462],"addition":[464],"go":[467],"d":[469,618],"ok,":[474],"e\u000ecient":[476],"cedure":[478],"accessingthe":[480],"([6],[7]).The":[485],"numb":[486],"osition":[490],"vectorsa":[497],"ect":[498],"erformance":[501],"ac-cording":[507],"compromising":[510],"problems.On":[511],"hand,increasing":[513],"size":[515,568],"increases":[522],"dif-":[524],"cultyoftheaccesstaskand,onotherhand,reductionofthissizecomplicatestheinverseprob-lemsolution.Inthesecond":[525],"sectionofthispap":[526],"er,anew":[527],"presentedfor":[537],"which":[538],"inversion":[540],"articulatory-to-acousticmapping":[543],"cessed":[546],"during":[547],"building":[549],"de-b":[553],"ok.Thisco":[555],"okdesignallowsreal-time":[558],"accessto":[559],"acoustically":[563],"equivalent":[564],"es,":[566],"regardlessthe":[567],"ok.Sincetheinversemappingfromacousticparam-eterstomo":[574],"delshap":[575],"edo":[576],"esnothaveauniquesolu-tion,severalvo":[577],"eariationsarep":[579],"ossi-ble.Schro":[580],"Sondhi([7])":[583],"use":[587],"ofdynamicprogrammingtoestimatetheoptimaltra-jectory":[588],"variation":[598],"path.The":[599],"programming":[601],"requires":[602],"delay":[604],"severaldata":[606],"frames":[607],"output":[612],"([8]).In":[613],"thirdsection,":[615],"metho":[617],"articulatoryparameters":[624],"estimated":[626],"frame.Section":[629]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
