{"id":"https://openalex.org/W2121681768","doi":"https://doi.org/10.1109/89.294355","title":"The metamorphic algorithm: a speaker mapping approach to data augmentation","display_name":"The metamorphic algorithm: a speaker mapping approach to data augmentation","publication_year":1994,"publication_date":"1994-07-01","ids":{"openalex":"https://openalex.org/W2121681768","doi":"https://doi.org/10.1109/89.294355","mag":"2121681768"},"language":"en","primary_location":{"id":"doi:10.1109/89.294355","is_oa":false,"landing_page_url":"https://doi.org/10.1109/89.294355","pdf_url":null,"source":{"id":"https://openalex.org/S202446260","display_name":"IEEE Transactions on Speech and Audio Processing","issn_l":"1063-6676","issn":["1063-6676","1558-2353"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Speech and Audio Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112352288","display_name":"J.R. Bellegarda","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]},{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"J.R. Bellegarda","raw_affiliation_strings":["T. J. Watson Research Center, IBM Research, Yorktown Heights, NY, USA","[IBM Thomas J. Watson Research Center, Yorktown Heights, NY , USA]"],"affiliations":[{"raw_affiliation_string":"T. J. Watson Research Center, IBM Research, Yorktown Heights, NY, USA","institution_ids":["https://openalex.org/I4210114115"]},{"raw_affiliation_string":"[IBM Thomas J. Watson Research Center, Yorktown Heights, NY , USA]","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002418228","display_name":"P.V. de Souza","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]},{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"P.V. de Souza","raw_affiliation_strings":["T. J. Watson Research Center, IBM Research, Yorktown Heights, NY, USA","[IBM Thomas J. Watson Research Center, Yorktown Heights, NY , USA]"],"affiliations":[{"raw_affiliation_string":"T. J. Watson Research Center, IBM Research, Yorktown Heights, NY, USA","institution_ids":["https://openalex.org/I4210114115"]},{"raw_affiliation_string":"[IBM Thomas J. Watson Research Center, Yorktown Heights, NY , USA]","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063150637","display_name":"Arthur N\u00e1das","orcid":"https://orcid.org/0000-0002-6893-6759"},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]},{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"A. Nadas","raw_affiliation_strings":["T. J. Watson Research Center, IBM Research, Yorktown Heights, NY, USA","[IBM Thomas J. Watson Research Center, Yorktown Heights, NY , USA]"],"affiliations":[{"raw_affiliation_string":"T. J. Watson Research Center, IBM Research, Yorktown Heights, NY, USA","institution_ids":["https://openalex.org/I4210114115"]},{"raw_affiliation_string":"[IBM Thomas J. Watson Research Center, Yorktown Heights, NY , USA]","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007586881","display_name":"D. Nahamoo","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]},{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"D. Nahamoo","raw_affiliation_strings":["T. J. Watson Research Center, IBM Research, Yorktown Heights, NY, USA","[IBM Thomas J. Watson Research Center, Yorktown Heights, NY , USA]"],"affiliations":[{"raw_affiliation_string":"T. J. Watson Research Center, IBM Research, Yorktown Heights, NY, USA","institution_ids":["https://openalex.org/I4210114115"]},{"raw_affiliation_string":"[IBM Thomas J. Watson Research Center, Yorktown Heights, NY , USA]","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034529775","display_name":"Michael Picheny","orcid":null},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]},{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"M.A. Picheny","raw_affiliation_strings":["T. J. Watson Research Center, IBM Research, Yorktown Heights, NY, USA","[IBM Thomas J. Watson Research Center, Yorktown Heights, NY , USA]"],"affiliations":[{"raw_affiliation_string":"T. J. Watson Research Center, IBM Research, Yorktown Heights, NY, USA","institution_ids":["https://openalex.org/I4210114115"]},{"raw_affiliation_string":"[IBM Thomas J. Watson Research Center, Yorktown Heights, NY , USA]","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112811561","display_name":"L.R. Bahl","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114115","display_name":"IBM Research - Thomas J. Watson Research Center","ror":"https://ror.org/0265w5591","country_code":"US","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"]},{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"L.R. Bahl","raw_affiliation_strings":["T. J. Watson Research Center, IBM Research, Yorktown Heights, NY, USA","[IBM Thomas J. Watson Research Center, Yorktown Heights, NY , USA]"],"affiliations":[{"raw_affiliation_string":"T. J. Watson Research Center, IBM Research, Yorktown Heights, NY, USA","institution_ids":["https://openalex.org/I4210114115"]},{"raw_affiliation_string":"[IBM Thomas J. Watson Research Center, Yorktown Heights, NY , USA]","institution_ids":["https://openalex.org/I1341412227"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5112352288"],"corresponding_institution_ids":["https://openalex.org/I1341412227","https://openalex.org/I4210114115"],"apc_list":null,"apc_paid":null,"fwci":2.1805,"has_fulltext":false,"cited_by_count":24,"citation_normalized_percentile":{"value":0.89410098,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"2","issue":"3","first_page":"413","last_page":"420"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.749542236328125},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7462161183357239},{"id":"https://openalex.org/keywords/utterance","display_name":"Utterance","score":0.588604211807251},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.5848689079284668},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.5411121249198914},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5365749597549438},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.4576377868652344},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37678009271621704},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36379629373550415}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.749542236328125},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7462161183357239},{"id":"https://openalex.org/C2775852435","wikidata":"https://www.wikidata.org/wiki/Q258403","display_name":"Utterance","level":2,"score":0.588604211807251},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.5848689079284668},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.5411121249198914},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5365749597549438},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.4576377868652344},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37678009271621704},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36379629373550415},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/89.294355","is_oa":false,"landing_page_url":"https://doi.org/10.1109/89.294355","pdf_url":null,"source":{"id":"https://openalex.org/S202446260","display_name":"IEEE Transactions on Speech and Audio Processing","issn_l":"1063-6676","issn":["1063-6676","1558-2353"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Speech and Audio Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7099999785423279,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1497807607","https://openalex.org/W1560114291","https://openalex.org/W1611176049","https://openalex.org/W1966812932","https://openalex.org/W2006309149","https://openalex.org/W2019351418","https://openalex.org/W2049894045","https://openalex.org/W2055324606","https://openalex.org/W2096510939","https://openalex.org/W2104687512","https://openalex.org/W2110007337","https://openalex.org/W2112173325","https://openalex.org/W2117671523","https://openalex.org/W2123076331","https://openalex.org/W2125082162","https://openalex.org/W2130322773","https://openalex.org/W2139353158","https://openalex.org/W2146795714","https://openalex.org/W2150583827","https://openalex.org/W2154226865","https://openalex.org/W2169325501","https://openalex.org/W4230880351","https://openalex.org/W4300694379"],"related_works":["https://openalex.org/W2206035908","https://openalex.org/W2162158162","https://openalex.org/W4247736853","https://openalex.org/W1493012537","https://openalex.org/W1999004162","https://openalex.org/W2175373321","https://openalex.org/W2125642021","https://openalex.org/W4310979479","https://openalex.org/W1521049138","https://openalex.org/W1556857061"],"abstract_inverted_index":{"Large":[0],"vocabulary":[1,129],"speaker-dependent":[2],"speech":[3,57,124],"recognition":[4,125],"systems":[5],"adjust":[6],"to":[7,51,91,159,165],"the":[8,25,32,35,39,73,93,98,102,105,111,115,136,142,179],"acoustic":[9,37],"peculiarities":[10],"of":[11,27,34,54,76,82,97,104,110,130,151,162,173],"each":[12],"new":[13,78,106,180],"speaker":[14,79,100,202],"based":[15,66],"on":[16,67,120],"some":[17],"enrolment":[18,40,152,174],"data":[19,28,63,96,153,175],"provided":[20],"by":[21],"this":[22],"speaker.":[23,85,107,181],"As":[24],"amount":[26,150,172],"required":[29,177],"increases":[30],"with":[31,127],"sophistication":[33],"underlying":[36],"models,":[38],"may":[41],"get":[42],"lengthy.":[43],"To":[44],"streamline":[45],"it,":[46],"it":[47,157,184],"is":[48,89,118,154,176],"therefore":[49],"desirable":[50],"make":[52],"use":[53],"previously":[55,94],"acquired":[56,95],"data.":[58],"The":[59,108],"authors":[60],"describe":[61],"a":[62,68,77,83,128,148,160,169,197],"augmentation":[64],"strategy":[65],"piecewise":[69],"linear":[70],"mapping":[71,88],"between":[72],"feature":[74],"space":[75,103],"and":[80],"that":[81,135,166],"reference":[84,99],"This":[86],"speaker-normalizing":[87],"used":[90,188],"transform":[92],"onto":[101],"performance":[109,163],"resulting":[112],"procedure,":[113],"dubbed":[114],"metamorphic":[116,137],"algorithm,":[117],"illustrated":[119],"an":[121],"isolated":[122],"utterance":[123],"task":[126],"20000":[131],"words.":[132],"Results":[133],"show":[134],"algorithm":[138],"can":[139,185],"substantially":[140],"reduce":[141],"word":[143],"error":[144],"rate":[145],"when":[146,168],"only":[147],"limited":[149],"available.":[155],"Alternatively,":[156],"leads":[158],"level":[161],"comparable":[164],"obtained":[167],"much":[170],"greater":[171],"from":[178],"In":[182],"addition,":[183],"also":[186],"be":[187],"for":[189,200],"tracking":[190],"spectral":[191],"evolution":[192],"over":[193],"time,":[194],"thus":[195],"providing":[196],"possible":[198],"means":[199],"robust":[201],"self-adaptation.<":[203],"<ETX":[204],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[205],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">&gt;</ETX>":[206]},"counts_by_year":[{"year":2022,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
