{"id":"https://openalex.org/W47839664","doi":"https://doi.org/10.21437/interspeech.2004-108","title":"Improved performance of Aurora 4 using HTK and unsupervised MLLR adaptation","display_name":"Improved performance of Aurora 4 using HTK and unsupervised MLLR adaptation","publication_year":2004,"publication_date":"2004-10-04","ids":{"openalex":"https://openalex.org/W47839664","doi":"https://doi.org/10.21437/interspeech.2004-108","mag":"47839664"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2004-108","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2004-108","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2004","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045211387","display_name":"Siu-Kei Au Yeung","orcid":"https://orcid.org/0000-0001-6523-9547"},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Siu-Kei Au Yeung","raw_affiliation_strings":["Hong Kong University of Science & Technology"],"affiliations":[{"raw_affiliation_string":"Hong Kong University of Science & Technology","institution_ids":["https://openalex.org/I200769079"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067041166","display_name":"Man-Hung Siu","orcid":null},"institutions":[{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Man-Hung Siu","raw_affiliation_strings":["Hong Kong University of Science & Technology"],"affiliations":[{"raw_affiliation_string":"Hong Kong University of Science & Technology","institution_ids":["https://openalex.org/I200769079"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5045211387"],"corresponding_institution_ids":["https://openalex.org/I200769079"],"apc_list":null,"apc_paid":null,"fwci":1.7988,"has_fulltext":false,"cited_by_count":33,"citation_normalized_percentile":{"value":0.86294701,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"161","last_page":"164"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.69341641664505},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6240740418434143},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3358997106552124},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.09097972512245178},{"id":"https://openalex.org/keywords/optics","display_name":"Optics","score":0.07297390699386597}],"concepts":[{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.69341641664505},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6240740418434143},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3358997106552124},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.09097972512245178},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.07297390699386597}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2004-108","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2004-108","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2004","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":4,"referenced_works":["https://openalex.org/W61263365","https://openalex.org/W96504731","https://openalex.org/W2146871184","https://openalex.org/W2151484683"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2350741829","https://openalex.org/W2130043461","https://openalex.org/W2530322880"],"abstract_inverted_index":{"The":[0,126],"introduction":[1],"of":[2,16,61,117,132,144,151,161],"Aurora":[3,26,55],"4":[4,27,56],"tasks":[5,28,57,75],"provides":[6],"a":[7,77],"standard":[8],"database":[9],"and":[10,52,84,107],"methodology":[11],"for":[12],"comparing":[13],"the":[14,30,49,59,71,95,100,115,133,141,146,149,158],"effectiveness":[15],"different":[17,36],"robust":[18],"algorithms":[19],"on":[20,25,54,70,88,121],"LVCSR.":[21],"One":[22],"important":[23],"issue":[24],"is":[29,68,155],"computation":[31,105],"time":[32,79,83,86,106],"involved":[33],"in":[34,81],"evaluating":[35],"test":[37],"conditions.":[38],"In":[39],"this":[40],"paper":[41],"we":[42,91],"show":[43,129],"that":[44,93,130],"by":[45],"employing":[46],"HTK":[47],"as":[48],"recognition":[50,101],"frontend":[51],"backend":[53],"with":[58,114],"use":[60,116,150],"cepstral":[62],"mean":[63],"subtraction,":[64],"14%":[65],"relative":[66],"improvement":[67],"achieved":[69],"baseline":[72,159],"clean":[73],"train":[74],"at":[76],"82.5%":[78],"reduction":[80,87],"training":[82],"40%":[85],"decoding.":[89],"Furthermore,":[90],"found":[92],"optimizing":[94],"model":[96],"complexity":[97],"can":[98,110],"increase":[99],"performance":[102],"(in":[103],"both":[104],"accuracy).":[108],"Accuracy":[109],"be":[111],"further":[112],"improved":[113],"unsupervised":[118],"MLLR":[119],"adaptation":[120,127,136],"one":[122],"or":[123],"multiple":[124],"sentences.":[125],"results":[128],"most":[131],"gain":[134],"from":[135,138,157],"comes":[137],"adapting":[139],"to":[140,145,163],"environment":[142],"instead":[143],"speaker.":[147],"With":[148],"adaptation,the":[152],"error":[153],"rate":[154],"reduced":[156],"result":[160],"69.6%":[162],"40%.":[164]},"counts_by_year":[{"year":2023,"cited_by_count":3},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":5},{"year":2013,"cited_by_count":4},{"year":2012,"cited_by_count":2}],"updated_date":"2026-02-25T08:12:03.925757","created_date":"2025-10-10T00:00:00"}
