{"id":"https://openalex.org/W7148256791","doi":"https://doi.org/10.1109/asru65441.2025.11434638","title":"Less is More: Data Curation Matters in Scaling Speech Enhancement","display_name":"Less is More: Data Curation Matters in Scaling Speech Enhancement","publication_year":2025,"publication_date":"2025-12-06","ids":{"openalex":"https://openalex.org/W7148256791","doi":"https://doi.org/10.1109/asru65441.2025.11434638"},"language":null,"primary_location":{"id":"doi:10.1109/asru65441.2025.11434638","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru65441.2025.11434638","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007581833","display_name":"Chang Li","orcid":"https://orcid.org/0000-0002-3267-1859"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chenda Li","raw_affiliation_strings":["Shanghai Jiao Tong University,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071937621","display_name":"Wangyou Zhang","orcid":"https://orcid.org/0000-0003-4500-3515"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wangyou Zhang","raw_affiliation_strings":["Shanghai Jiao Tong University,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100391700","display_name":"Wei Wang","orcid":"https://orcid.org/0000-0001-6853-7785"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Wang","raw_affiliation_strings":["Shanghai Jiao Tong University,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020401831","display_name":"Robin Scheibler","orcid":"https://orcid.org/0000-0002-5205-8365"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Robin Scheibler","raw_affiliation_strings":["Google DeepMind,Japan"],"affiliations":[{"raw_affiliation_string":"Google DeepMind,Japan","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132828128","display_name":"Kohei Saijo","orcid":null},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kohei Saijo","raw_affiliation_strings":["Waseda University,Japan"],"affiliations":[{"raw_affiliation_string":"Waseda University,Japan","institution_ids":["https://openalex.org/I150744194"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047682990","display_name":"Samuele Cornell","orcid":"https://orcid.org/0000-0002-5358-1844"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Samuele Cornell","raw_affiliation_strings":["Carnegie Mellon University,USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010250251","display_name":"Yihui Fu","orcid":null},"institutions":[{"id":"https://openalex.org/I94509681","display_name":"Technische Universit\u00e4t Braunschweig","ror":"https://ror.org/010nsgg66","country_code":"DE","type":"education","lineage":["https://openalex.org/I94509681"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Yihui Fu","raw_affiliation_strings":["Technische Universit&#x00E4;t,Braunschweig,Germany"],"affiliations":[{"raw_affiliation_string":"Technische Universit&#x00E4;t,Braunschweig,Germany","institution_ids":["https://openalex.org/I94509681"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110895535","display_name":"Marvin Sach","orcid":null},"institutions":[{"id":"https://openalex.org/I94509681","display_name":"Technische Universit\u00e4t Braunschweig","ror":"https://ror.org/010nsgg66","country_code":"DE","type":"education","lineage":["https://openalex.org/I94509681"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Marvin Sach","raw_affiliation_strings":["Technische Universit&#x00E4;t,Braunschweig,Germany"],"affiliations":[{"raw_affiliation_string":"Technische Universit&#x00E4;t,Braunschweig,Germany","institution_ids":["https://openalex.org/I94509681"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132816482","display_name":"Zhaoheng Ni","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhaoheng Ni","raw_affiliation_strings":["Meta,USA"],"affiliations":[{"raw_affiliation_string":"Meta,USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Anurag Kumar","orcid":null},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anurag Kumar","raw_affiliation_strings":["Google DeepMind,Japan"],"affiliations":[{"raw_affiliation_string":"Google DeepMind,Japan","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002593702","display_name":"Tim Fingscheidt","orcid":"https://orcid.org/0000-0002-8895-5041"},"institutions":[{"id":"https://openalex.org/I94509681","display_name":"Technische Universit\u00e4t Braunschweig","ror":"https://ror.org/010nsgg66","country_code":"DE","type":"education","lineage":["https://openalex.org/I94509681"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Tim Fingscheidt","raw_affiliation_strings":["Technische Universit&#x00E4;t,Braunschweig,Germany"],"affiliations":[{"raw_affiliation_string":"Technische Universit&#x00E4;t,Braunschweig,Germany","institution_ids":["https://openalex.org/I94509681"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132789061","display_name":"Shinji Watanabe","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shinji Watanabe","raw_affiliation_strings":["Carnegie Mellon University,USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5129685555","display_name":"Yanmin Qian","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanmin Qian","raw_affiliation_strings":["Shanghai Jiao Tong University,China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University,China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5007581833"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":5.1131,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.95823096,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9179999828338623,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9179999828338623,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.0272000003606081,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.01269999984651804,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.5759000182151794},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5612000226974487},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.5364999771118164},{"id":"https://openalex.org/keywords/data-curation","display_name":"Data curation","score":0.46779999136924744},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.43389999866485596},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.42989999055862427},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4034999907016754}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6944000124931335},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.5759000182151794},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5612000226974487},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.5364999771118164},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48089998960494995},{"id":"https://openalex.org/C91632574","wikidata":"https://www.wikidata.org/wiki/Q15088675","display_name":"Data curation","level":2,"score":0.46779999136924744},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.43389999866485596},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.42989999055862427},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4034999907016754},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40220001339912415},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.399399995803833},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.3634999990463257},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.34630000591278076},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3345000147819519},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.325300008058548},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.3149999976158142},{"id":"https://openalex.org/C148220186","wikidata":"https://www.wikidata.org/wiki/Q7111912","display_name":"Outcome (game theory)","level":2,"score":0.29910001158714294},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.29789999127388},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.257099986076355},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.2508000135421753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/asru65441.2025.11434638","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru65441.2025.11434638","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320337504","display_name":"Research and Development","ror":"https://ror.org/027s68j25"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W1552314771","https://openalex.org/W1597121597","https://openalex.org/W1989337816","https://openalex.org/W2044893557","https://openalex.org/W2094721231","https://openalex.org/W2127851351","https://openalex.org/W2141998673","https://openalex.org/W2514828952","https://openalex.org/W2952218014","https://openalex.org/W2962866211","https://openalex.org/W2964058413","https://openalex.org/W2972359262","https://openalex.org/W3095410713","https://openalex.org/W3096408984","https://openalex.org/W3151851237","https://openalex.org/W3161480375","https://openalex.org/W3196475561","https://openalex.org/W4221144097","https://openalex.org/W4224936432","https://openalex.org/W4225310539","https://openalex.org/W4225956675","https://openalex.org/W4245919820","https://openalex.org/W4372260337","https://openalex.org/W4372260557","https://openalex.org/W4372271367","https://openalex.org/W4375928773","https://openalex.org/W4380434618","https://openalex.org/W4392903232","https://openalex.org/W4392908343","https://openalex.org/W4399554121","https://openalex.org/W4402111568","https://openalex.org/W4402112079","https://openalex.org/W4402112435","https://openalex.org/W4402112521","https://openalex.org/W4406137543","https://openalex.org/W4406461432","https://openalex.org/W4408353433","https://openalex.org/W4408353835","https://openalex.org/W4415433170","https://openalex.org/W4415433286","https://openalex.org/W4415433380"],"related_works":[],"abstract_inverted_index":{"The":[0],"vast":[1],"majority":[2],"of":[3,97,116],"modern":[4],"speech":[5,42,121],"enhancement":[6,43,122],"systems":[7,123],"rely":[8],"on":[9,47,92,104],"data-driven":[10],"neural":[11],"network":[12],"models.":[13],"Conventionally,":[14],"larger":[15],"datasets":[16],"are":[17],"presumed":[18],"to":[19],"yield":[20],"superior":[21],"model":[22],"performance,":[23],"an":[24],"observation":[25],"empirically":[26],"validated":[27],"across":[28],"numerous":[29],"tasks":[30],"in":[31,54,119],"other":[32],"domains.":[33],"However,":[34],"recent":[35],"studies":[36],"reveal":[37],"diminishing":[38],"returns":[39],"when":[40],"scaling":[41,120],"data.":[44],"We":[45],"focus":[46],"a":[48,93],"critical":[49],"factor:":[50],"prevalent":[51],"quality":[52],"issues":[53],"\u201cclean\u201d":[55],"training":[56,71,75],"labels":[57],"within":[58,69],"large-scale":[59,70],"datasets.":[60],"This":[61,110],"work":[62],"re-examines":[63],"this":[64],"phenomenon":[65],"and":[66],"demonstrates":[67],"that,":[68],"sets,":[72],"prioritizing":[73],"high-quality":[74],"data":[76,84,117],"is":[77],"more":[78],"important":[79],"than":[80],"merely":[81],"expanding":[82],"the":[83,105,113],"volume.":[85],"Experimental":[86],"findings":[87],"suggest":[88],"that":[89],"models":[90,102],"trained":[91,103],"carefully":[94],"curated":[95],"subset":[96],"700":[98],"hours":[99],"can":[100],"outperform":[101],"2,500":[106],"-hour":[107],"full":[108],"dataset.":[109],"outcome":[111],"highlights":[112],"crucial":[114],"role":[115],"curation":[118],"effectively.":[124]},"counts_by_year":[{"year":2026,"cited_by_count":4}],"updated_date":"2026-04-23T09:07:50.710637","created_date":"2026-04-03T00:00:00"}
