{"id":"https://openalex.org/W2951388445","doi":"https://doi.org/10.1109/ncc.2019.8732237","title":"Data-pooling and multi-task learning for enhanced performance of speech recognition systems in multiple low resourced languages","display_name":"Data-pooling and multi-task learning for enhanced performance of speech recognition systems in multiple low resourced languages","publication_year":2019,"publication_date":"2019-02-01","ids":{"openalex":"https://openalex.org/W2951388445","doi":"https://doi.org/10.1109/ncc.2019.8732237","mag":"2951388445"},"language":"en","primary_location":{"id":"doi:10.1109/ncc.2019.8732237","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ncc.2019.8732237","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 National Conference on Communications (NCC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085635571","display_name":"A. Madhavaraj","orcid":null},"institutions":[{"id":"https://openalex.org/I59270414","display_name":"Indian Institute of Science Bangalore","ror":"https://ror.org/04dese585","country_code":"IN","type":"education","lineage":["https://openalex.org/I59270414"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"A Madhavaraj","raw_affiliation_strings":["Electrical Engineering, Indian Institute of Science, Bangalore"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering, Indian Institute of Science, Bangalore","institution_ids":["https://openalex.org/I59270414"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069802599","display_name":"A. G. Ramakrishnan","orcid":"https://orcid.org/0000-0002-3646-1955"},"institutions":[{"id":"https://openalex.org/I59270414","display_name":"Indian Institute of Science Bangalore","ror":"https://ror.org/04dese585","country_code":"IN","type":"education","lineage":["https://openalex.org/I59270414"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"A G Ramakrishnan","raw_affiliation_strings":["Electrical Engineering, Indian Institute of Science, Bangalore"],"affiliations":[{"raw_affiliation_string":"Electrical Engineering, Indian Institute of Science, Bangalore","institution_ids":["https://openalex.org/I59270414"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5085635571"],"corresponding_institution_ids":["https://openalex.org/I59270414"],"apc_list":null,"apc_paid":null,"fwci":0.2886,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.65777171,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/telugu","display_name":"Telugu","score":0.9674450159072876},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7720764875411987},{"id":"https://openalex.org/keywords/gujarati","display_name":"Gujarati","score":0.7704360485076904},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.7002109885215759},{"id":"https://openalex.org/keywords/tamil","display_name":"Tamil","score":0.6755472421646118},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5989276766777039},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5950139760971069},{"id":"https://openalex.org/keywords/phone","display_name":"Phone","score":0.581262469291687},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5571093559265137},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.534462571144104},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5263679623603821},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.513813316822052},{"id":"https://openalex.org/keywords/feature-vector","display_name":"Feature vector","score":0.48019206523895264},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4784127175807953},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.0821692943572998},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.07491973042488098}],"concepts":[{"id":"https://openalex.org/C2778756302","wikidata":"https://www.wikidata.org/wiki/Q8097","display_name":"Telugu","level":2,"score":0.9674450159072876},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7720764875411987},{"id":"https://openalex.org/C2779296024","wikidata":"https://www.wikidata.org/wiki/Q5137","display_name":"Gujarati","level":2,"score":0.7704360485076904},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.7002109885215759},{"id":"https://openalex.org/C140688305","wikidata":"https://www.wikidata.org/wiki/Q5885","display_name":"Tamil","level":2,"score":0.6755472421646118},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5989276766777039},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5950139760971069},{"id":"https://openalex.org/C2778707766","wikidata":"https://www.wikidata.org/wiki/Q202064","display_name":"Phone","level":2,"score":0.581262469291687},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5571093559265137},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.534462571144104},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5263679623603821},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.513813316822052},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.48019206523895264},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4784127175807953},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0821692943572998},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.07491973042488098},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/ncc.2019.8732237","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ncc.2019.8732237","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 National Conference on Communications (NCC)","raw_type":"proceedings-article"},{"id":"pmh:oai::78063","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306401429","display_name":"ePrints@IISc (Indian Institute of Science)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I59270414","host_organization_name":"Indian Institute of Science Bangalore","host_organization_lineage":["https://openalex.org/I59270414"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"","raw_type":"Conference Paper"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.800000011920929}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W100737242","https://openalex.org/W1524333225","https://openalex.org/W1565000507","https://openalex.org/W1565737905","https://openalex.org/W1978660892","https://openalex.org/W1991180839","https://openalex.org/W2021775343","https://openalex.org/W2025198378","https://openalex.org/W2033436836","https://openalex.org/W2044048901","https://openalex.org/W2069631319","https://openalex.org/W2079508481","https://openalex.org/W2089917322","https://openalex.org/W2583161050","https://openalex.org/W2770107007","https://openalex.org/W2889367800","https://openalex.org/W2893616871","https://openalex.org/W2897396694","https://openalex.org/W6631362777","https://openalex.org/W6903697578","https://openalex.org/W7060890437"],"related_works":["https://openalex.org/W4323529320","https://openalex.org/W2142137786","https://openalex.org/W2336525283","https://openalex.org/W582524164","https://openalex.org/W2270825477","https://openalex.org/W1514154358","https://openalex.org/W4244044226","https://openalex.org/W3203494007","https://openalex.org/W4388184082","https://openalex.org/W3124581537"],"abstract_inverted_index":{"We":[0],"present":[1],"two":[2],"approaches":[3],"to":[4,36,57,64,192],"improve":[5],"the":[6,20,38,41,47,59,62,65,71,86,93,96,123,128,142,154,159,164,180,188],"performance":[7],"of":[8,70,111,156,158,163,182,203],"automatic":[9],"speech":[10],"recognition":[11],"(ASR)":[12],"systems":[13],"for":[14,40,85,113,116,120,178,208],"Gujarati,":[15,114,209],"Tamil":[16,117,210],"and":[17,50,81,95,118,144,206,211],"Telugu.":[18],"In":[19,127],"first":[21],"approach":[22,102,130,197],"using":[23,77,91,131],"data-pooling":[24],"with":[25,148],"phone":[26,79],"mapping":[27,80],"(DP-PM),":[28],"a":[29,146,183],"deep":[30],"neural":[31],"network":[32],"(DNN)":[33],"is":[34,89],"trained":[35,90],"predict":[37],"senones":[39,155,181],"target":[42,66,87,94],"language;":[43],"then":[44,75],"we":[45,136],"use":[46,137],"feature":[48,138,189],"vectors":[49,139],"their":[51],"alignments":[52],"from":[53,61,140],"other":[54],"source":[55,63,72,98],"languages":[56,73,143],"map":[58],"phones":[60],"language.":[67,194],"The":[68],"lexicons":[69],"are":[74,167,185],"modified":[76,97,168],"this":[78],"an":[82],"ASR":[83],"system":[84],"language":[88,184],"both":[92],"data.":[99],"This":[100,195],"DP-PM":[101],"gives":[103],"relative":[104,199],"improvements":[105,200],"in":[106,201],"word":[107],"error":[108],"rates":[109],"(WER)":[110],"5.1%":[112],"3.1%":[115],"3.4%":[119],"Telugu,":[121,212],"over":[122],"corresponding":[124],"baseline":[125],"figures.":[126],"second":[129],"multi-task":[132],"DNN":[133,147,175],"(MT-DNN)":[134],"modeling,":[135],"all":[141],"train":[145],"three":[149],"output":[150,165],"layers,":[151],"each":[152],"predicting":[153,179],"one":[157],"languages.":[160],"Objective":[161],"functions":[162],"layers":[166,176],"such":[169],"that":[170,193],"during":[171],"training,":[172],"only":[173],"those":[174],"responsible":[177],"updated,":[186],"if":[187],"vector":[190],"belongs":[191],"MT-DNN":[196],"achieves":[198],"WER":[202],"5.7%,":[204],"3.3%":[205],"5.2%":[207],"respectively.":[213]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":3},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
