{"id":"https://openalex.org/W4408353885","doi":"https://doi.org/10.1109/icassp49660.2025.10888018","title":"Towards Bringing Parity in Pretraining Datasets for Low-resource Indian Languages","display_name":"Towards Bringing Parity in Pretraining Datasets for Low-resource Indian Languages","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408353885","doi":"https://doi.org/10.1109/icassp49660.2025.10888018"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10888018","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10888018","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049369768","display_name":"Kaushal Santosh Bhogale","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kaushal Santosh Bhogale","raw_affiliation_strings":["AI4Bharat"],"affiliations":[{"raw_affiliation_string":"AI4Bharat","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5094077182","display_name":"Deovrat Mehendale","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Deovrat Mehendale","raw_affiliation_strings":["AI4Bharat"],"affiliations":[{"raw_affiliation_string":"AI4Bharat","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113690063","display_name":"Tahir Javed","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tahir Javed","raw_affiliation_strings":["AI4Bharat"],"affiliations":[{"raw_affiliation_string":"AI4Bharat","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116594461","display_name":"Devbrat Anuragi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Devbrat Anuragi","raw_affiliation_strings":["AI4Bharat"],"affiliations":[{"raw_affiliation_string":"AI4Bharat","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109774115","display_name":"Sakshi Joshi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sakshi Joshi","raw_affiliation_strings":["AI4Bharat"],"affiliations":[{"raw_affiliation_string":"AI4Bharat","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055545634","display_name":"Sai Sundaresan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sai Sundaresan","raw_affiliation_strings":["AI4Bharat"],"affiliations":[{"raw_affiliation_string":"AI4Bharat","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065276549","display_name":"Aparna Ananthanarayanan","orcid":"https://orcid.org/0000-0003-4776-9952"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aparna Ananthanarayanan","raw_affiliation_strings":["AI4Bharat"],"affiliations":[{"raw_affiliation_string":"AI4Bharat","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058454760","display_name":"Sharmistha Dey","orcid":"https://orcid.org/0000-0003-4122-7415"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sharmistha Dey","raw_affiliation_strings":["AI4Bharat"],"affiliations":[{"raw_affiliation_string":"AI4Bharat","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111235628","display_name":"S. G.","orcid":null},"institutions":[{"id":"https://openalex.org/I24676775","display_name":"Indian Institute of Technology Madras","ror":"https://ror.org/03v0r5n49","country_code":"IN","type":"facility","lineage":["https://openalex.org/I24676775"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Sathish Kumar Reddy G","raw_affiliation_strings":["IIT Madras"],"affiliations":[{"raw_affiliation_string":"IIT Madras","institution_ids":["https://openalex.org/I24676775"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Anusha Srinivasan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Anusha Srinivasan","raw_affiliation_strings":["AI4Bharat"],"affiliations":[{"raw_affiliation_string":"AI4Bharat","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035174004","display_name":"Abhigyan Raman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abhigyan Raman","raw_affiliation_strings":["Sarvam AI"],"affiliations":[{"raw_affiliation_string":"Sarvam AI","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101614265","display_name":"Pratyush Kumar","orcid":"https://orcid.org/0000-0002-7446-0363"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pratyush Kumar","raw_affiliation_strings":["Sarvam AI"],"affiliations":[{"raw_affiliation_string":"Sarvam AI","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050036814","display_name":"Mitesh M. Khapra","orcid":"https://orcid.org/0009-0008-3687-9922"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mitesh M. Khapra","raw_affiliation_strings":["AI4Bharat"],"affiliations":[{"raw_affiliation_string":"AI4Bharat","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5049369768"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.0180192,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9675999879837036,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9526000022888184,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6563528776168823},{"id":"https://openalex.org/keywords/parity","display_name":"Parity (physics)","score":0.6286249160766602},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35097038745880127},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.07833355665206909},{"id":"https://openalex.org/keywords/particle-physics","display_name":"Particle physics","score":0.05819252133369446}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6563528776168823},{"id":"https://openalex.org/C2777151079","wikidata":"https://www.wikidata.org/wiki/Q141160","display_name":"Parity (physics)","level":2,"score":0.6286249160766602},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35097038745880127},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.07833355665206909},{"id":"https://openalex.org/C109214941","wikidata":"https://www.wikidata.org/wiki/Q18334","display_name":"Particle physics","level":1,"score":0.05819252133369446}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10888018","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10888018","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1574170747","https://openalex.org/W2127141656","https://openalex.org/W2962784628","https://openalex.org/W2964309797","https://openalex.org/W3097777922","https://openalex.org/W3119308075","https://openalex.org/W3139878283","https://openalex.org/W3195874849","https://openalex.org/W3213029956","https://openalex.org/W4226033575","https://openalex.org/W4391021698","https://openalex.org/W4392902568","https://openalex.org/W4392903564","https://openalex.org/W4402670026","https://openalex.org/W6638749077","https://openalex.org/W6755207826","https://openalex.org/W6804060842","https://openalex.org/W6847363464","https://openalex.org/W6850218400","https://openalex.org/W6852909395"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Lack":[0],"of":[1,60,71,103,113,128],"large-scale":[2],"pretraining":[3],"data":[4],"for":[5,39,116],"low":[6],"resource":[7],"languages":[8,42],"from":[9],"the":[10,69,91,101,111,122,126,144],"Indian":[11,65],"sub-continent,":[12],"leads":[13],"to":[14,33,84,142],"their":[15],"underrepresentation":[16],"in":[17,131],"existing":[18],"massively":[19],"multilingual":[20,87],"models.":[21],"In":[22],"this":[23,27,50],"work,":[24],"we":[25,52,73,99],"address":[26],"gap":[28],"by":[29,43],"proposing":[30],"a":[31,55,75,86,95],"framework":[32],"create":[34],"large":[35],"raw":[36,61],"audio":[37,47,62],"datasets":[38],"such":[40],"under-represented":[41],"collating":[44],"publicly":[45],"accessible":[46],"content.":[48],"Leveraging":[49],"framework,":[51,138],"present":[53],"MahaDhwani,":[54,72],"corpus":[56],"comprising":[57],"279K":[58],"hours":[59],"across":[63],"22":[64,92],"languages.":[66,93],"To":[67],"test":[68],"utility":[70],"pretrain":[74],"conformer":[76],"style":[77],"model,":[78],"and":[79,110,140],"then":[80],"further":[81],"finetune":[82],"it":[83],"build":[85],"ASR":[88],"model":[89],"supporting":[90],"Using":[94],"hybrid":[96],"multi-softmax":[97],"decoder,":[98],"balance":[100],"benefit":[102,112],"shared":[104],"parameters":[105],"which":[106],"enable":[107],"crosslingual":[108],"transfer,":[109],"dedicated":[114],"capacity":[115],"each":[117],"language.":[118],"Our":[119],"evaluations":[120],"on":[121],"IndicVoices":[123],"benchmark":[124],"show":[125],"benefits":[127],"pre-training,":[129],"particularly":[130],"low-resource":[132],"settings.":[133],"We":[134],"will":[135],"open-source":[136],"our":[137],"code":[139],"scripts":[141],"reproduce":[143],"dataset.":[145]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
