{"id":"https://openalex.org/W1509309911","doi":"https://doi.org/10.1109/icassp.1987.1169449","title":"Some experiments on HMM speaker adaptation","display_name":"Some experiments on HMM speaker adaptation","publication_year":2005,"publication_date":"2005-03-24","ids":{"openalex":"https://openalex.org/W1509309911","doi":"https://doi.org/10.1109/icassp.1987.1169449","mag":"1509309911"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.1987.1169449","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.1987.1169449","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP '87. IEEE International Conference on Acoustics, Speech, and Signal Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084878544","display_name":"A. Jarre","orcid":null},"institutions":[{"id":"https://openalex.org/I55143463","display_name":"University of Turin","ror":"https://ror.org/048tbm396","country_code":"IT","type":"education","lineage":["https://openalex.org/I55143463"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"A. Jarre","raw_affiliation_strings":["Institute di Fisica, Universita di Torino, Torino, Italy"],"affiliations":[{"raw_affiliation_string":"Institute di Fisica, Universita di Torino, Torino, Italy","institution_ids":["https://openalex.org/I55143463"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5021021404","display_name":"Roberto Pieraccini","orcid":null},"institutions":[{"id":"https://openalex.org/I1298633626","display_name":"Telecom Italia Lab","ror":"https://ror.org/01rt74q71","country_code":"IT","type":"facility","lineage":["https://openalex.org/I1298633626","https://openalex.org/I137543953"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"R. Pieraccini","raw_affiliation_strings":["CSELT, Torino, Italy"],"affiliations":[{"raw_affiliation_string":"CSELT, Torino, Italy","institution_ids":["https://openalex.org/I1298633626"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5084878544"],"corresponding_institution_ids":["https://openalex.org/I55143463"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.05258164,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"12","issue":null,"first_page":"1273","last_page":"1276"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10901","display_name":"Advanced Data Compression Techniques","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9876000285148621,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.8562912940979004},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.8011199235916138},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.7922555208206177},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.7913056015968323},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7760337591171265},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.6819003224372864},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.5463008880615234},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.47673285007476807},{"id":"https://openalex.org/keywords/interpolation","display_name":"Interpolation (computer graphics)","score":0.4606836140155792},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4185592830181122},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4013509154319763},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.15934088826179504},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10616672039031982}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.8562912940979004},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.8011199235916138},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.7922555208206177},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.7913056015968323},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7760337591171265},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.6819003224372864},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.5463008880615234},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.47673285007476807},{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.4606836140155792},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4185592830181122},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4013509154319763},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.15934088826179504},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10616672039031982},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.1987.1169449","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.1987.1169449","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP '87. IEEE International Conference on Acoustics, Speech, and Signal Processing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.75}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W1529589667","https://openalex.org/W1599327554","https://openalex.org/W1896748021","https://openalex.org/W1900266864","https://openalex.org/W1936596287","https://openalex.org/W2086699924","https://openalex.org/W2137199074","https://openalex.org/W7065084554"],"related_works":["https://openalex.org/W2206035908","https://openalex.org/W1493012537","https://openalex.org/W2150890698","https://openalex.org/W2162158162","https://openalex.org/W4247736853","https://openalex.org/W2175373321","https://openalex.org/W2125642021","https://openalex.org/W4310979479","https://openalex.org/W2401394187","https://openalex.org/W4245698648"],"abstract_inverted_index":{"The":[0],"main":[1],"problems":[2],"with":[3,67,94],"HMMs":[4,93,169],"of":[5,12,23,40,58,70,78,145,173],"sub-word":[6],"units":[7],"are":[8,63],"the":[9,21,24,44,47,68,71,75,92,100,105,116,122,134,146,150,153,168,171,180],"large":[10],"amount":[11],"training":[13,59,91,176],"data":[14],"and":[15,81,143,152],"computer":[16],"time":[17],"needed":[18],"for":[19,50,65],"estimating":[20],"parameters":[22],"models.":[25],"In":[26],"some":[27,56],"applications":[28],"it":[29],"is":[30,88,160],"not":[31],"proposable":[32],"that":[33,110,131],"a":[34,51,112,127],"new":[35,151,181],"speaker":[36,72,79,83,102,108,128,155],"utters":[37],"many":[38],"hundreds":[39],"words":[41,97,177],"to":[42,115,162],"train":[43],"system,":[45],"hence":[46],"interest":[48],"arises":[49],"quick":[52],"adaptation":[53,138],"based":[54],"on":[55,170],"tens":[57],"utterances.":[60],"Two":[61],"bounds":[62],"given":[64],"comparison":[66],"results":[69],"adaptation,":[73],"namely":[74],"recognition":[76,87,165],"rates":[77,166],"dependent":[80,86],"cross":[82],"recognition.":[84],"Speaker":[85],"achieved":[89],"by":[90,99,126,179],"nearly":[95],"1000":[96],"uttered":[98,133,178],"same":[101],"used":[103],"in":[104,120],"tests.":[106],"Cross":[107],"recognition,":[109],"gives":[111],"lower":[113],"bound":[114],"performance,":[117],"concerns":[118],"experiments":[119],"which":[121],"models":[123,156],"were":[124],"trained":[125],"different":[129],"from":[130],"who":[132],"test":[135],"sentences.":[136],"An":[137],"algorithm":[139],"using":[140],"Parzen":[141],"estimation":[142],"interpolation":[144],"emission":[147],"densities":[148],"between":[149],"old":[154],"was":[157],"investigated.":[158],"It":[159],"able":[161],"give":[163],"satisfactory":[164],"adapting":[167],"basis":[172],"only":[174],"40":[175],"speaker.":[182]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
