{"id":"https://openalex.org/W4391021675","doi":"https://doi.org/10.1109/asru57964.2023.10389676","title":"Reproducing Whisper-Style Training Using An Open-Source Toolkit And Publicly Available Data","display_name":"Reproducing Whisper-Style Training Using An Open-Source Toolkit And Publicly Available Data","publication_year":2023,"publication_date":"2023-12-16","ids":{"openalex":"https://openalex.org/W4391021675","doi":"https://doi.org/10.1109/asru57964.2023.10389676"},"language":"en","primary_location":{"id":"doi:10.1109/asru57964.2023.10389676","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru57964.2023.10389676","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033862822","display_name":"Yifan Peng","orcid":"https://orcid.org/0000-0002-8581-8674"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yifan Peng","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068192693","display_name":"Jinchuan Tian","orcid":"https://orcid.org/0000-0002-2129-471X"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jinchuan Tian","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103125256","display_name":"Brian Yan","orcid":"https://orcid.org/0000-0002-4160-6282"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Brian Yan","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024324721","display_name":"Dan Berrebbi","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dan Berrebbi","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050058892","display_name":"Xuankai Chang","orcid":"https://orcid.org/0000-0002-5221-5412"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xuankai Chang","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100660610","display_name":"Xinjian Li","orcid":"https://orcid.org/0000-0003-4585-159X"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xinjian Li","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008336983","display_name":"Jiatong Shi","orcid":"https://orcid.org/0000-0002-9050-8304"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiatong Shi","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047892839","display_name":"Siddhant Arora","orcid":"https://orcid.org/0000-0003-0375-496X"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Siddhant Arora","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101779022","display_name":"William Chen","orcid":"https://orcid.org/0000-0002-3251-3084"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"William Chen","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058649002","display_name":"Roshan Sharma","orcid":"https://orcid.org/0000-0003-3760-9955"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Roshan Sharma","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071937621","display_name":"Wangyou Zhang","orcid":"https://orcid.org/0000-0003-4500-3515"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]},{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN","US"],"is_corresponding":false,"raw_author_name":"Wangyou Zhang","raw_affiliation_strings":["Carnegie Mellon University,USA","Shanghai Jiao Tong University, China","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Shanghai Jiao Tong University, China","institution_ids":["https://openalex.org/I183067930"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091425252","display_name":"Yui Sudo","orcid":"https://orcid.org/0000-0003-2094-6701"},"institutions":[{"id":"https://openalex.org/I1283473643","display_name":"Honda (Japan)","ror":"https://ror.org/03jzay846","country_code":"JP","type":"company","lineage":["https://openalex.org/I1283473643"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yui Sudo","raw_affiliation_strings":["Honda Research Institute Japan,Japan","Honda Research Institute Japan, Japan"],"affiliations":[{"raw_affiliation_string":"Honda Research Institute Japan,Japan","institution_ids":["https://openalex.org/I1283473643"]},{"raw_affiliation_string":"Honda Research Institute Japan, Japan","institution_ids":["https://openalex.org/I1283473643"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012020904","display_name":"Muhammad Shakeel","orcid":"https://orcid.org/0000-0002-8515-0053"},"institutions":[{"id":"https://openalex.org/I1283473643","display_name":"Honda (Japan)","ror":"https://ror.org/03jzay846","country_code":"JP","type":"company","lineage":["https://openalex.org/I1283473643"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Muhammad Shakeel","raw_affiliation_strings":["Honda Research Institute Japan,Japan","Honda Research Institute Japan, Japan"],"affiliations":[{"raw_affiliation_string":"Honda Research Institute Japan,Japan","institution_ids":["https://openalex.org/I1283473643"]},{"raw_affiliation_string":"Honda Research Institute Japan, Japan","institution_ids":["https://openalex.org/I1283473643"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091834525","display_name":"Jee-weon Jung","orcid":"https://orcid.org/0000-0003-0505-2988"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jee-Weon Jung","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010858961","display_name":"Soumi Maiti","orcid":"https://orcid.org/0000-0001-6940-0115"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Soumi Maiti","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001291873","display_name":"Shinji Watanabe","orcid":"https://orcid.org/0000-0002-5970-8631"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shinji Watanabe","raw_affiliation_strings":["Carnegie Mellon University,USA","Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":16,"corresponding_author_ids":["https://openalex.org/A5033862822"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":5.7352,"has_fulltext":false,"cited_by_count":33,"citation_normalized_percentile":{"value":0.96943571,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8293046951293945},{"id":"https://openalex.org/keywords/scripting-language","display_name":"Scripting language","score":0.6272662878036499},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5927241444587708},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.579486608505249},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5418243408203125},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5173015594482422},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.4823962450027466},{"id":"https://openalex.org/keywords/open-source","display_name":"Open source","score":0.4772717356681824},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4068658947944641},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.202769935131073},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.18794625997543335}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8293046951293945},{"id":"https://openalex.org/C61423126","wikidata":"https://www.wikidata.org/wiki/Q187432","display_name":"Scripting language","level":2,"score":0.6272662878036499},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5927241444587708},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.579486608505249},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5418243408203125},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5173015594482422},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.4823962450027466},{"id":"https://openalex.org/C3018397939","wikidata":"https://www.wikidata.org/wiki/Q3644502","display_name":"Open source","level":3,"score":0.4772717356681824},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4068658947944641},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.202769935131073},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.18794625997543335},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/asru57964.2023.10389676","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru57964.2023.10389676","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2023 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4099999964237213,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320307110","display_name":"Delta","ror":"https://ror.org/03g9c1e75"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":73,"referenced_works":["https://openalex.org/W1494198834","https://openalex.org/W2024490156","https://openalex.org/W2083751884","https://openalex.org/W2166637769","https://openalex.org/W2526425061","https://openalex.org/W2739883972","https://openalex.org/W2788388592","https://openalex.org/W2799473636","https://openalex.org/W2936774411","https://openalex.org/W2962780374","https://openalex.org/W2963242190","https://openalex.org/W2963250244","https://openalex.org/W3012492057","https://openalex.org/W3030437843","https://openalex.org/W3091427154","https://openalex.org/W3092085609","https://openalex.org/W3095410713","https://openalex.org/W3097777922","https://openalex.org/W3101648800","https://openalex.org/W3119308075","https://openalex.org/W3139918052","https://openalex.org/W3166440012","https://openalex.org/W3196509775","https://openalex.org/W3197580070","https://openalex.org/W3198587774","https://openalex.org/W3198694222","https://openalex.org/W3203140070","https://openalex.org/W3203407300","https://openalex.org/W3204647170","https://openalex.org/W3207558756","https://openalex.org/W3209059054","https://openalex.org/W3213029956","https://openalex.org/W4210463634","https://openalex.org/W4224308101","https://openalex.org/W4229005866","https://openalex.org/W4281492411","https://openalex.org/W4292779060","https://openalex.org/W4295108597","https://openalex.org/W4295312788","https://openalex.org/W4297841547","https://openalex.org/W4311000453","https://openalex.org/W4319862255","https://openalex.org/W4319862410","https://openalex.org/W4319862635","https://openalex.org/W4321854923","https://openalex.org/W4322718191","https://openalex.org/W4323066695","https://openalex.org/W4360836968","https://openalex.org/W4372260519","https://openalex.org/W4372262650","https://openalex.org/W4375869065","https://openalex.org/W4385822685","https://openalex.org/W4385823111","https://openalex.org/W4385823140","https://openalex.org/W4385823182","https://openalex.org/W6739901393","https://openalex.org/W6766978945","https://openalex.org/W6771467084","https://openalex.org/W6775053297","https://openalex.org/W6778883912","https://openalex.org/W6780218876","https://openalex.org/W6791904447","https://openalex.org/W6796715840","https://openalex.org/W6810081322","https://openalex.org/W6811340617","https://openalex.org/W6838276489","https://openalex.org/W6839026989","https://openalex.org/W6842738431","https://openalex.org/W6847363464","https://openalex.org/W6850068309","https://openalex.org/W6850218400","https://openalex.org/W6850625674","https://openalex.org/W6850936240"],"related_works":["https://openalex.org/W2046765700","https://openalex.org/W262455470","https://openalex.org/W4242899858","https://openalex.org/W4384345686","https://openalex.org/W2145834781","https://openalex.org/W2357937784","https://openalex.org/W2547618384","https://openalex.org/W2577782152","https://openalex.org/W4240746485","https://openalex.org/W2006708147"],"abstract_inverted_index":{"Pre-training":[0],"speech":[1,25,32],"models":[2,49,133],"on":[3,20],"large":[4],"volumes":[5],"of":[6,23],"data":[7,51,123],"has":[8],"achieved":[9],"remarkable":[10],"success.":[11],"OpenAI":[12],"Whisper":[13],"is":[14,55],"a":[15,39],"multilingual":[16],"multitask":[17],"model":[18],"trained":[19],"680k":[21],"hours":[22],"supervised":[24],"data.":[26,101],"It":[27],"generalizes":[28],"well":[29,130],"to":[30,53,65,113,137],"various":[31],"recognition":[33],"and":[34,70,79,98,108,127,134],"translation":[35,106],"benchmarks":[36],"even":[37,103],"in":[38],"zero-shot":[40],"setup.":[41],"However,":[42],"the":[43],"full":[44],"pipeline":[45],"for":[46,63,122],"developing":[47],"such":[48,74],"(from":[50],"collection":[52],"training)":[54],"not":[56],"publicly":[57,99,117],"accessible,":[58],"which":[59,90],"makes":[60],"it":[61],"difficult":[62],"researchers":[64],"further":[66],"improve":[67],"its":[68],"performance":[69],"address":[71],"training-related":[72],"issues":[73],"as":[75,129,131],"efficiency,":[76],"robustness,":[77],"fairness,":[78],"bias.":[80],"This":[81],"work":[82],"presents":[83],"an":[84,95],"Open":[85],"Whisper-style":[86],"Speech":[87],"Model":[88],"(OWSM),":[89],"reproduces":[91],"Whisperstyle":[92],"training":[93,135],"using":[94],"open-source":[96],"toolkit":[97],"available":[100],"OWSM":[102],"supports":[104],"more":[105,111],"directions":[107],"can":[109],"be":[110],"efficient":[112],"train.":[114],"We":[115],"will":[116],"release":[118],"all":[119],"scripts":[120],"used":[121],"preparation,":[124],"training,":[125],"inference,":[126],"scoring":[128],"pretrained":[132],"logs":[136],"promote":[138],"open":[139],"science.":[140],"<sup":[141,144],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[142,145],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">1</sup>":[143,146],"https://github.com/espnet/espnet":[147]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":20},{"year":2024,"cited_by_count":10}],"updated_date":"2026-04-03T22:45:19.894376","created_date":"2025-10-10T00:00:00"}
