{"id":"https://openalex.org/W3008363190","doi":"https://doi.org/10.1109/asru46091.2019.9003943","title":"Semi-Supervised Training and Data Augmentation for Adaptation of Automatic Broadcast News Captioning Systems","display_name":"Semi-Supervised Training and Data Augmentation for Adaptation of Automatic Broadcast News Captioning Systems","publication_year":2019,"publication_date":"2019-12-01","ids":{"openalex":"https://openalex.org/W3008363190","doi":"https://doi.org/10.1109/asru46091.2019.9003943","mag":"3008363190"},"language":"en","primary_location":{"id":"doi:10.1109/asru46091.2019.9003943","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru46091.2019.9003943","pdf_url":null,"source":{"id":"https://openalex.org/S4306498489","display_name":"2019 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101673889","display_name":"Yinghui Huang","orcid":"https://orcid.org/0000-0003-0607-1507"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yinghui Huang","raw_affiliation_strings":["IBM Research AI, Yorktown Heights, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research AI, Yorktown Heights, USA","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101787514","display_name":"Samuel Thomas","orcid":"https://orcid.org/0000-0001-7573-0620"},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Samuel Thomas","raw_affiliation_strings":["IBM Research AI, Yorktown Heights, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research AI, Yorktown Heights, USA","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028421346","display_name":"Masayuki Suzuki","orcid":"https://orcid.org/0000-0002-0436-1490"},"institutions":[{"id":"https://openalex.org/I4210145865","display_name":"IBM Research - Tokyo","ror":"https://ror.org/04915qk43","country_code":"JP","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210145865"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Masayuki Suzuki","raw_affiliation_strings":["IBM Research AI, Tokyo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research AI, Tokyo, Japan","institution_ids":["https://openalex.org/I4210145865"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047353872","display_name":"Zolt\u00e1n T\u00fcske","orcid":null},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zoltan Tuske","raw_affiliation_strings":["IBM Research AI, Yorktown Heights, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research AI, Yorktown Heights, USA","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063657297","display_name":"Larry Sansone","orcid":null},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Larry Sansone","raw_affiliation_strings":["IBM Research AI, Yorktown Heights, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research AI, Yorktown Heights, USA","institution_ids":["https://openalex.org/I1341412227"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034529775","display_name":"Michael Picheny","orcid":null},"institutions":[{"id":"https://openalex.org/I1341412227","display_name":"IBM (United States)","ror":"https://ror.org/05hh8d621","country_code":"US","type":"company","lineage":["https://openalex.org/I1341412227"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Michael Picheny","raw_affiliation_strings":["IBM Research AI, Yorktown Heights, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"IBM Research AI, Yorktown Heights, USA","institution_ids":["https://openalex.org/I1341412227"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4068,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.67436661,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"4","issue":null,"first_page":"867","last_page":"874"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13310","display_name":"Subtitles and Audiovisual Media","score":0.9926999807357788,"subfield":{"id":"https://openalex.org/subfields/1203","display_name":"Language and Linguistics"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.9598710536956787},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8276939392089844},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.7541059255599976},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.6770095825195312},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4668444097042084},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4177151620388031},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4027891755104065},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.36180219054222107},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.34113478660583496}],"concepts":[{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.9598710536956787},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8276939392089844},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.7541059255599976},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.6770095825195312},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4668444097042084},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4177151620388031},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4027891755104065},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.36180219054222107},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.34113478660583496},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/asru46091.2019.9003943","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru46091.2019.9003943","pdf_url":null,"source":{"id":"https://openalex.org/S4306498489","display_name":"2019 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.47999998927116394,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":60,"referenced_works":["https://openalex.org/W8870360","https://openalex.org/W29464808","https://openalex.org/W100415715","https://openalex.org/W103244930","https://openalex.org/W265531733","https://openalex.org/W648786980","https://openalex.org/W854541894","https://openalex.org/W1463944445","https://openalex.org/W1594833364","https://openalex.org/W1654858490","https://openalex.org/W1665214252","https://openalex.org/W1915251500","https://openalex.org/W1978394996","https://openalex.org/W2010362084","https://openalex.org/W2056786202","https://openalex.org/W2057589672","https://openalex.org/W2097560587","https://openalex.org/W2098318492","https://openalex.org/W2099424804","https://openalex.org/W2101234009","https://openalex.org/W2105830342","https://openalex.org/W2117278770","https://openalex.org/W2117590177","https://openalex.org/W2128014038","https://openalex.org/W2144211451","https://openalex.org/W2158195707","https://openalex.org/W2161513525","https://openalex.org/W2163426739","https://openalex.org/W2164666834","https://openalex.org/W2288371874","https://openalex.org/W2327501763","https://openalex.org/W2507680812","https://openalex.org/W2671240430","https://openalex.org/W2746475861","https://openalex.org/W2747909401","https://openalex.org/W2890144771","https://openalex.org/W2896457183","https://openalex.org/W2936995161","https://openalex.org/W2937657912","https://openalex.org/W2939021222","https://openalex.org/W2962784628","https://openalex.org/W2963266252","https://openalex.org/W2963341956","https://openalex.org/W2963499843","https://openalex.org/W2972837679","https://openalex.org/W3148201686","https://openalex.org/W4285719527","https://openalex.org/W6600367688","https://openalex.org/W6601248468","https://openalex.org/W6604108467","https://openalex.org/W6604228424","https://openalex.org/W6609831787","https://openalex.org/W6621543089","https://openalex.org/W6623517193","https://openalex.org/W6637242042","https://openalex.org/W6675354045","https://openalex.org/W6677328538","https://openalex.org/W6677717300","https://openalex.org/W6680395727","https://openalex.org/W6761030284"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W3088136942","https://openalex.org/W2949362007","https://openalex.org/W2775506363","https://openalex.org/W4290852288","https://openalex.org/W4388893791","https://openalex.org/W4283207562","https://openalex.org/W2963177403","https://openalex.org/W2330246314","https://openalex.org/W2551249631"],"abstract_inverted_index":{"In":[0],"this":[1],"paper":[2],"we":[3,135],"present":[4],"a":[5],"comprehensive":[6],"study":[7,98],"on":[8,51,117],"building":[9,30],"and":[10,62,75],"adapting":[11],"deep":[12],"neural":[13],"network":[14],"based":[15,66],"speech":[16,33],"recognition":[17,34],"systems":[18,27,36,141],"for":[19,146],"automatic":[20,32,147],"closed":[21,148],"captioning.":[22,149],"We":[23,70,86,106],"develop":[24],"the":[25,82,100,114,125,137],"proposed":[26,115],"by":[28],"first":[29],"base":[31,84,101],"(ASR)":[35],"that":[37],"are":[38,49],"not":[39],"specific":[40],"to":[41,79,97,109],"any":[42],"particular":[43],"show":[44],"or":[45],"station.":[46],"These":[47],"models":[48,102],"trained":[50,83],"nearly":[52],"6000":[53],"hours":[54,89],"of":[55,90,124],"broadcast":[56],"news":[57],"data":[58,76,91],"using":[59,113],"conventional":[60],"hybrid":[61],"more":[63],"recent":[64],"attention":[65],"end-to-end":[67],"acoustic":[68],"models.":[69,85],"then":[71],"employ":[72],"various":[73],"adaptation":[74,126],"augmentation":[77],"strategies":[78],"further":[80],"improve":[81],"use":[87],"535":[88],"from":[92],"two":[93],"independent":[94,123],"BN":[95,139],"sources":[96],"how":[99],"can":[103,142],"be":[104,143],"customized.":[105],"observe":[107],"up":[108],"32%":[110],"relative":[111],"improvement":[112],"techniques":[116],"test":[118],"sets":[119],"related":[120],"to,":[121],"but":[122],"data.":[127],"At":[128],"these":[129],"low":[130],"word":[131],"error":[132],"rates":[133],"(WERs),":[134],"believe":[136],"customized":[138],"ASR":[140],"used":[144],"effectively":[145]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
