{"id":"https://openalex.org/W2394917751","doi":"https://doi.org/10.1109/icassp.2016.7472747","title":"Source modeling for HMM based speech synthesis using integrated LP residual","display_name":"Source modeling for HMM based speech synthesis using integrated LP residual","publication_year":2016,"publication_date":"2016-03-01","ids":{"openalex":"https://openalex.org/W2394917751","doi":"https://doi.org/10.1109/icassp.2016.7472747","mag":"2394917751"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2016.7472747","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2016.7472747","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5015353805","display_name":"Nagaraj Adiga","orcid":"https://orcid.org/0000-0002-3438-567X"},"institutions":[{"id":"https://openalex.org/I1317621060","display_name":"Indian Institute of Technology Guwahati","ror":"https://ror.org/0022nd079","country_code":"IN","type":"education","lineage":["https://openalex.org/I1317621060"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Nagaraj Adiga","raw_affiliation_strings":["Department of Electronics and Electrical Engineering, Indian Institute of Technology Guwahati"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Electrical Engineering, Indian Institute of Technology Guwahati","institution_ids":["https://openalex.org/I1317621060"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052129812","display_name":"S. R. Mahadeva Prasanna","orcid":"https://orcid.org/0000-0002-8135-7938"},"institutions":[{"id":"https://openalex.org/I1317621060","display_name":"Indian Institute of Technology Guwahati","ror":"https://ror.org/0022nd079","country_code":"IN","type":"education","lineage":["https://openalex.org/I1317621060"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"S. R. Mahadeva Prasanna","raw_affiliation_strings":["Department of Electronics and Electrical Engineering, Indian Institute of Technology Guwahati"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Electrical Engineering, Indian Institute of Technology Guwahati","institution_ids":["https://openalex.org/I1317621060"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5015353805"],"corresponding_institution_ids":["https://openalex.org/I1317621060"],"apc_list":null,"apc_paid":null,"fwci":0.8569,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.83200671,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"5590","last_page":"5594"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7202445268630981},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6021267175674438},{"id":"https://openalex.org/keywords/vocal-tract","display_name":"Vocal tract","score":0.5648637413978577},{"id":"https://openalex.org/keywords/spectral-envelope","display_name":"Spectral envelope","score":0.5617771744728088},{"id":"https://openalex.org/keywords/residual","display_name":"Residual","score":0.46955588459968567},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4564518928527832},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.41731858253479004},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.31796127557754517},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2761896252632141}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7202445268630981},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6021267175674438},{"id":"https://openalex.org/C47401133","wikidata":"https://www.wikidata.org/wiki/Q748953","display_name":"Vocal tract","level":2,"score":0.5648637413978577},{"id":"https://openalex.org/C54926389","wikidata":"https://www.wikidata.org/wiki/Q7575188","display_name":"Spectral envelope","level":2,"score":0.5617771744728088},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.46955588459968567},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4564518928527832},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.41731858253479004},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31796127557754517},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2761896252632141},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2016.7472747","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2016.7472747","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.5199999809265137}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W6725010","https://openalex.org/W95152782","https://openalex.org/W1514941256","https://openalex.org/W1963637322","https://openalex.org/W1966264494","https://openalex.org/W2042691334","https://openalex.org/W2049686551","https://openalex.org/W2060171943","https://openalex.org/W2074460168","https://openalex.org/W2074854222","https://openalex.org/W2108662299","https://openalex.org/W2129142580","https://openalex.org/W2150658333","https://openalex.org/W2155359203","https://openalex.org/W2158432602","https://openalex.org/W2163181067","https://openalex.org/W2166823384","https://openalex.org/W2286166914","https://openalex.org/W2408414488","https://openalex.org/W6603838645","https://openalex.org/W6630796692","https://openalex.org/W6696156092","https://openalex.org/W6713575540"],"related_works":["https://openalex.org/W2136763963","https://openalex.org/W2109705048","https://openalex.org/W2940588515","https://openalex.org/W1909151225","https://openalex.org/W1987783679","https://openalex.org/W153239700","https://openalex.org/W2067459736","https://openalex.org/W2160030256","https://openalex.org/W2105635394","https://openalex.org/W4253235840"],"abstract_inverted_index":{"In":[0],"this":[1],"work,":[2],"new":[3],"method":[4],"of":[5,22,63,71,112],"source":[6,147,167],"modeling":[7,148,168],"for":[8],"HMM":[9,123],"based":[10,173],"speech":[11,66,143],"synthesis":[12],"is":[13,44,84,100,176],"proposed":[14,146],"using":[15,86],"integrated":[16],"LP":[17],"residual":[18],"(ILPR).":[19],"The":[20,41,68,115,141],"nature":[21],"ILPR":[23,42,72],"waveform":[24],"resembles":[25],"the":[26,34,47,52,64,75,110,122,145,150,154,159],"glottal":[27],"flow":[28],"derivative":[29],"signal":[30,43],"and":[31,60,117,128,137,152,164,169,182],"may":[32],"keep":[33],"speaker":[35,155],"characteristics":[36],"in":[37,46,179],"a":[38],"better":[39],"way.":[40],"modeled":[45,85,101,120],"frequency":[48,78],"domain":[49],"by":[50,102,109,144],"dividing":[51],"spectrum":[53],"into":[54],"two":[55],"bands":[56],"to":[57,158],"characterize":[58],"harmonic":[59,69],"noise":[61,93,106,163],"components":[62,70],"voice":[65],"segment.":[67],"signals":[73],"below":[74],"maximum":[76],"voiced":[77],"(f":[79],"<sub":[80,97,130],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[81,98,131],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">m</sub>":[82,99],")":[83],"mel-cepstral":[87],"coefficients":[88],"called":[89],"as":[90],"RMCEPs,":[91],"whereas":[92],"component":[94],"above":[95],"f":[96],"pitch":[103],"adaptive":[104],"triangular":[105],"envelope":[107],"weighted":[108],"strength":[111],"excitation":[113,166],"(SoE).":[114],"RMCEPs":[116],"SoE":[118],"are":[119],"on":[121],"framework":[124],"along":[125],"with":[126,171],"MCEPs":[127],"F":[129],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">0</sub>":[132],"representing":[133],"vocal":[134],"tract":[135],"information":[136],"fundamental":[138],"frequency,":[139],"respectively.":[140],"synthesized":[142],"reduces":[149],"buzziness":[151],"improves":[153],"similarity":[156],"compared":[157],"conventional":[160],"impulse":[161],"/":[162],"mixed":[165],"comparable":[170],"STRAIGHT":[172],"excitation.":[174],"This":[175],"further":[177],"reflected":[178],"both":[180],"objective":[181],"subjective":[183],"valuations.":[184]},"counts_by_year":[{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
