{"id":"https://openalex.org/W3138712295","doi":"https://doi.org/10.1145/3448748.3448796","title":"A Speech-Driven 3-D Tongue Model with Realistic Movement in Mandarin Chinese","display_name":"A Speech-Driven 3-D Tongue Model with Realistic Movement in Mandarin Chinese","publication_year":2021,"publication_date":"2021-01-22","ids":{"openalex":"https://openalex.org/W3138712295","doi":"https://doi.org/10.1145/3448748.3448796","mag":"3138712295"},"language":"en","primary_location":{"id":"doi:10.1145/3448748.3448796","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3448748.3448796","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 International Conference on Bioinformatics and Intelligent Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037483106","display_name":"Changwei Liang","orcid":"https://orcid.org/0009-0006-0226-022X"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Changwei Liang","raw_affiliation_strings":["Department of Chinese Language and Literature, Peking University, Beijing China"],"affiliations":[{"raw_affiliation_string":"Department of Chinese Language and Literature, Peking University, Beijing China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013103032","display_name":"Jiangping Kong","orcid":"https://orcid.org/0000-0001-6941-0882"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiangping Kong","raw_affiliation_strings":["Department of Chinese Language and Literature, Peking University, Beijing China"],"affiliations":[{"raw_affiliation_string":"Department of Chinese Language and Literature, Peking University, Beijing China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5113818761","display_name":"Xiyu Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiyu Wu","raw_affiliation_strings":["Department of Chinese Language and Literature, Peking University, Beijing China and Department of Chinese Language and Literature and Center for Chinese Linguistics, Peking University, Beijing, P.R. China"],"affiliations":[{"raw_affiliation_string":"Department of Chinese Language and Literature, Peking University, Beijing China and Department of Chinese Language and Literature and Center for Chinese Linguistics, Peking University, Beijing, P.R. China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5037483106"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.02701045,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"297","last_page":"302"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10515","display_name":"Cancer-related molecular mechanisms research","score":0.9528999924659729,"subfield":{"id":"https://openalex.org/subfields/1306","display_name":"Cancer Research"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T10515","display_name":"Cancer-related molecular mechanisms research","score":0.9528999924659729,"subfield":{"id":"https://openalex.org/subfields/1306","display_name":"Cancer Research"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9524999856948853,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/tongue","display_name":"Tongue","score":0.8539144992828369},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.64149010181427},{"id":"https://openalex.org/keywords/vocal-tract","display_name":"Vocal tract","score":0.6381178498268127},{"id":"https://openalex.org/keywords/line","display_name":"Line (geometry)","score":0.45221957564353943},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4442588984966278},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.433524489402771},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.35400378704071045},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2527610659599304},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.11823108792304993}],"concepts":[{"id":"https://openalex.org/C2779744641","wikidata":"https://www.wikidata.org/wiki/Q9614","display_name":"Tongue","level":2,"score":0.8539144992828369},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.64149010181427},{"id":"https://openalex.org/C47401133","wikidata":"https://www.wikidata.org/wiki/Q748953","display_name":"Vocal tract","level":2,"score":0.6381178498268127},{"id":"https://openalex.org/C198352243","wikidata":"https://www.wikidata.org/wiki/Q37105","display_name":"Line (geometry)","level":2,"score":0.45221957564353943},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4442588984966278},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.433524489402771},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.35400378704071045},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2527610659599304},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.11823108792304993},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3448748.3448796","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3448748.3448796","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2021 International Conference on Bioinformatics and Intelligent Computing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6100000143051147,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W37655516","https://openalex.org/W198124244","https://openalex.org/W1531956331","https://openalex.org/W1778436208","https://openalex.org/W2055080184","https://openalex.org/W2056387890","https://openalex.org/W2079306716","https://openalex.org/W2111701360","https://openalex.org/W2402610474","https://openalex.org/W2576259985","https://openalex.org/W2891698792"],"related_works":["https://openalex.org/W2079194684","https://openalex.org/W2617269004","https://openalex.org/W35292311","https://openalex.org/W1748856376","https://openalex.org/W2803166627","https://openalex.org/W2046073792","https://openalex.org/W1591384192","https://openalex.org/W2099204336","https://openalex.org/W2067459736","https://openalex.org/W2105635394"],"abstract_inverted_index":{"In":[0,168],"this":[1,169,228],"paper,":[2],"a":[3,87],"new":[4],"speech":[5],"driven":[6],"3-D":[7,15,57,70,166,170],"geometric":[8,142,202],"tongue":[9,16,26,53,71,97,115,171,177,203,210],"model":[10,36],"is":[11,18,37,220],"constructed.":[12],"The":[13],"constructed":[14,35],"shape":[17,146],"controlled":[19],"with":[20,65,141,208,222],"control":[21,92,102,190,197],"points":[22,93,103,191],"on":[23,33,120,153,213],"2-D":[24,43],"midsagittal":[25,52,111,137,155],"curve,":[27],"and":[28,55,82,108,130,144,175,188,200],"speech-driven":[29,218],"inverse":[30],"estimation":[31],"based":[32],"the":[34,51,68,77,91,96,110,114,121,125,136,145,154,159,165,189,198,201,214,217,223],"evaluated":[38,221],"by":[39],"empirical":[40],"data.":[41],"X-Ray":[42],"vocal":[44,58],"tract":[45],"motion":[46,178],"videos":[47,78],"are":[48,63,74,83,104,132,139,150,179,192,206],"tagged":[49],"for":[50,67,194],"motion,":[54],"static":[56],"tracts":[59],"of":[60,95,113,124,147,164],"20":[61],"phonemes":[62],"collected":[64],"MRI":[66],"realistic":[69,176,185,209,224],"shape.":[72,98],"MFCC":[73],"calculated":[75],"from":[76,135],"as":[79],"acoustic":[80,173],"features,":[81],"then":[84,133,151],"used":[85],"in":[86],"LSTM-RNN":[88],"to":[89,106,157,182,196],"predict":[90],"movement":[94],"Three":[99],"geometrically":[100],"intuitive":[101,193],"selected":[105],"represent":[107],"calculate":[109],"line":[112,156],"through":[116],"linear":[117],"regression.":[118],"Cross-sections":[119],"central":[122],"lines":[123],"tongues,":[126],"whose":[127],"height,":[128],"width":[129],"angle":[131],"predicted":[134,161,205],"line,":[138],"reconstructed":[140],"curves,":[143],"each":[148],"cross-section":[149],"placed":[152],"get":[158],"overall":[160],"moving":[162],"grid":[163],"tongue.":[167],"model,":[172,199],"features":[174],"mapped":[180],"directly":[181],"preserve":[183],"more":[184],"articulatory":[186],"details,":[187],"non-experts":[195],"shapes":[204],"comparable":[207],"dynamics.":[211],"Based":[212],"proposed":[215,229],"method,":[216],"prediction":[219],"data,":[225],"which":[226],"proved":[227],"method":[230],"feasible.":[231]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
