{"id":"https://openalex.org/W4406462022","doi":"https://doi.org/10.1109/slt61566.2024.10832171","title":"Enhancing Unified Streaming and Non-Streaming ASR Through Curriculum Learning With Easy-To-Hard Tasks","display_name":"Enhancing Unified Streaming and Non-Streaming ASR Through Curriculum Learning With Easy-To-Hard Tasks","publication_year":2024,"publication_date":"2024-12-02","ids":{"openalex":"https://openalex.org/W4406462022","doi":"https://doi.org/10.1109/slt61566.2024.10832171"},"language":"en","primary_location":{"id":"doi:10.1109/slt61566.2024.10832171","is_oa":false,"landing_page_url":"https://doi.org/10.1109/slt61566.2024.10832171","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Spoken Language Technology Workshop (SLT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100605320","display_name":"Yuting Yang","orcid":"https://orcid.org/0009-0001-9316-4332"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuting Yang","raw_affiliation_strings":["NetEase Yidun AI Lab,Hangzhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NetEase Yidun AI Lab,Hangzhou,China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100697204","display_name":"Yuke Li","orcid":"https://orcid.org/0009-0000-7282-8964"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuke Li","raw_affiliation_strings":["NetEase Yidun AI Lab,Hangzhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NetEase Yidun AI Lab,Hangzhou,China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049844296","display_name":"Lifeng Zhou","orcid":"https://orcid.org/0000-0001-5479-3681"},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lifeng Zhou","raw_affiliation_strings":["NetEase Yidun AI Lab,Hangzhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NetEase Yidun AI Lab,Hangzhou,China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001063248","display_name":"Binbin Du","orcid":null},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Binbin Du","raw_affiliation_strings":["NetEase Yidun AI Lab,Hangzhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NetEase Yidun AI Lab,Hangzhou,China","institution_ids":["https://openalex.org/I4210091137"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5012539121","display_name":"Haoqi Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210091137","display_name":"NetEase (China)","ror":"https://ror.org/00fp6fj05","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210091137"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoqi Zhu","raw_affiliation_strings":["NetEase Yidun AI Lab,Hangzhou,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"NetEase Yidun AI Lab,Hangzhou,China","institution_ids":["https://openalex.org/I4210091137"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4210091137"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.22027886,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"232","last_page":"239"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9873999953269958,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9873999953269958,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.968500018119812,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.777459442615509},{"id":"https://openalex.org/keywords/streaming-current","display_name":"Streaming current","score":0.7399929165840149},{"id":"https://openalex.org/keywords/live-streaming","display_name":"Live streaming","score":0.5363873839378357},{"id":"https://openalex.org/keywords/streaming-data","display_name":"Streaming data","score":0.4794287085533142},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.4763113260269165},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.10685494542121887}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.777459442615509},{"id":"https://openalex.org/C30311675","wikidata":"https://www.wikidata.org/wiki/Q7622689","display_name":"Streaming current","level":3,"score":0.7399929165840149},{"id":"https://openalex.org/C2776741261","wikidata":"https://www.wikidata.org/wiki/Q3027665","display_name":"Live streaming","level":2,"score":0.5363873839378357},{"id":"https://openalex.org/C2777611316","wikidata":"https://www.wikidata.org/wiki/Q39045282","display_name":"Streaming data","level":2,"score":0.4794287085533142},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.4763113260269165},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.10685494542121887},{"id":"https://openalex.org/C27703432","wikidata":"https://www.wikidata.org/wiki/Q2778467","display_name":"Electrokinetic phenomena","level":2,"score":0.0},{"id":"https://openalex.org/C147789679","wikidata":"https://www.wikidata.org/wiki/Q11372","display_name":"Physical chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/slt61566.2024.10832171","is_oa":false,"landing_page_url":"https://doi.org/10.1109/slt61566.2024.10832171","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE Spoken Language Technology Workshop (SLT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6800000071525574,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1710082047","https://openalex.org/W2095705004","https://openalex.org/W2296073425","https://openalex.org/W2407080277","https://openalex.org/W2517617019","https://openalex.org/W2519091744","https://openalex.org/W2739759330","https://openalex.org/W2766219058","https://openalex.org/W2889048668","https://openalex.org/W2913718171","https://openalex.org/W2923622379","https://openalex.org/W2936774411","https://openalex.org/W2948210185","https://openalex.org/W2963242190","https://openalex.org/W3007433671","https://openalex.org/W3015974384","https://openalex.org/W3034623328","https://openalex.org/W3034938700","https://openalex.org/W3036601975","https://openalex.org/W3092122846","https://openalex.org/W3092970820","https://openalex.org/W3095687747","https://openalex.org/W3097777922","https://openalex.org/W3101281919","https://openalex.org/W3111562797","https://openalex.org/W3125815078","https://openalex.org/W3160628828","https://openalex.org/W3163203022","https://openalex.org/W3170405627","https://openalex.org/W3196784225","https://openalex.org/W3197478142","https://openalex.org/W4296069140","https://openalex.org/W4375869292","https://openalex.org/W4375869369","https://openalex.org/W4385245566","https://openalex.org/W4385822686","https://openalex.org/W4385823175","https://openalex.org/W4385823308","https://openalex.org/W4391021732","https://openalex.org/W6631190155","https://openalex.org/W6674330103","https://openalex.org/W6754473786","https://openalex.org/W6780218876","https://openalex.org/W6784400248","https://openalex.org/W6784721964","https://openalex.org/W6787040858","https://openalex.org/W6790121257","https://openalex.org/W6797037654"],"related_works":["https://openalex.org/W2384129116","https://openalex.org/W4328029402","https://openalex.org/W4235833544","https://openalex.org/W4390321210","https://openalex.org/W4361215424","https://openalex.org/W4386953780","https://openalex.org/W2383812552","https://openalex.org/W2082106666","https://openalex.org/W2392424562","https://openalex.org/W3134683720"],"abstract_inverted_index":{"We":[0],"expect":[1],"a":[2,17,55,74,81,93],"unified":[3,64,105],"ASR":[4,30,65,106],"model":[5],"to":[6,50,59,97,115],"deliver":[7],"high":[8],"performance":[9,34],"in":[10,28,73,110,138],"both":[11],"streaming":[12,29],"and":[13,108,129],"non-streaming":[14,38,94],"modes.":[15,140],"However,":[16],"core":[18],"challenge":[19],"is":[20],"that":[21,84,132],"the":[22,37,43,61],"lack":[23],"of":[24,63],"global":[25],"contextual":[26],"information":[27],"inherently":[31],"hinders":[32],"its":[33],"from":[35,42,47],"matching":[36],"counterpart.":[39],"Drawing":[40],"inspiration":[41],"human":[44],"learning":[45,57],"manner":[46],"easy":[48],"concepts":[49],"difficult":[51],"ones,":[52],"we":[53,79],"introduce":[54],"curriculum":[56,83],"framework":[58,68],"enhance":[60],"training":[62,92,102],"models.":[66],"This":[67],"strategically":[69],"increases":[70],"task":[71],"complexity":[72],"graduated,":[75],"easy-to-hard":[76],"order.":[77],"Specifically,":[78],"develop":[80],"structured":[82],"begins":[85],"with":[86],"an":[87,98,103,111],"elementary":[88],"course":[89,100,113],"focused":[90],"on":[91,127],"model,":[95,107],"progresses":[96],"intermediate":[99],"for":[101],"initial":[104],"culminates":[109],"advanced":[112],"designed":[114],"mutual":[116],"promotion":[117],"between":[118],"these":[119],"two":[120,139],"modes":[121],"via":[122],"contrastive":[123],"training.":[124],"Experimental":[125],"results":[126],"AISHELL-1":[128],"AISHELL-2":[130],"show":[131],"our":[133],"method":[134],"achieves":[135],"significant":[136],"improvements":[137]},"counts_by_year":[],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
