{"id":"https://openalex.org/W4416530194","doi":"https://doi.org/10.48550/arxiv.2504.06011","title":"Llama-3-Nanda-10B-Chat: An Open Generative Large Language Model for Hindi","display_name":"Llama-3-Nanda-10B-Chat: An Open Generative Large Language Model for Hindi","publication_year":2025,"publication_date":"2025-04-08","ids":{"openalex":"https://openalex.org/W4416530194","doi":"https://doi.org/10.48550/arxiv.2504.06011"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2504.06011","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.06011","pdf_url":"https://arxiv.org/pdf/2504.06011","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2504.06011","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008944385","display_name":"Monojit Choudhury","orcid":"https://orcid.org/0000-0001-7473-7839"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Choudhury, Monojit","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101148056","display_name":"Shivam Chauhan","orcid":"https://orcid.org/0000-0003-0584-3384"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chauhan, Shivam","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056125162","display_name":"Rocktim Jyoti Das","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Das, Rocktim Jyoti","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037725984","display_name":"Dhruv Sahnan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sahnan, Dhruv","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058574573","display_name":"Xudong Han","orcid":"https://orcid.org/0000-0001-7961-5179"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Xudong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025855575","display_name":"Haonan Li","orcid":"https://orcid.org/0000-0001-6623-5089"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Haonan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103156822","display_name":"A. J. Singh","orcid":"https://orcid.org/0009-0001-9185-6407"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Singh, Aaryamonvikram","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Jadhav, Alok Anil","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jadhav, Alok Anil","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038219269","display_name":"Utkarsh Agarwal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Agarwal, Utkarsh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069473673","display_name":"Mukund Choudhary","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Choudhary, Mukund","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089296560","display_name":"Debopriyo Banerjee","orcid":"https://orcid.org/0000-0001-9773-776X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Banerjee, Debopriyo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065822589","display_name":"Fajri Koto","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Koto, Fajri","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044984870","display_name":"Junaid Hamid Bhat","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhat, Junaid","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102787524","display_name":"A. D. Shukla","orcid":"https://orcid.org/0000-0002-4969-0204"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shukla, Awantika","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008093186","display_name":"Samujjwal Ghosh","orcid":"https://orcid.org/0000-0003-2859-7358"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ghosh, Samujjwal","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004502117","display_name":"Samta Kamboj","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kamboj, Samta","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019706515","display_name":"Onkar Pandit","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pandit, Onkar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024823903","display_name":"Lalit Pradhan","orcid":"https://orcid.org/0000-0001-9532-7628"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pradhan, Lalit","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101516062","display_name":"Rahul Pal","orcid":"https://orcid.org/0009-0005-6119-8297"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pal, Rahul","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101857471","display_name":"Sunil Kumar Sahu","orcid":"https://orcid.org/0000-0001-6860-9208"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sahu, Sunil","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111291495","display_name":"Soundar Doraiswamy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Doraiswamy, Soundar","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106508350","display_name":"Parvez Mullah","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mullah, Parvez","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025649064","display_name":"Ali El Filali","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Filali, Ali El","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060274099","display_name":"Neha Sengupta","orcid":"https://orcid.org/0000-0002-0162-374X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sengupta, Neha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113335335","display_name":"Gokul Ramakrishnan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ramakrishnan, Gokul","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108970056","display_name":"Rituraj Joshi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Joshi, Rituraj","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072933457","display_name":"Gurpreet Gosal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gosal, Gurpreet","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106508351","display_name":"Avraham Sheinin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sheinin, Avraham","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066061534","display_name":"Natalia Vassilieva","orcid":"https://orcid.org/0000-0003-3410-9277"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vassilieva, Natalia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5012055259","display_name":"Preslav Nakov","orcid":"https://orcid.org/0000-0002-3600-1510"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nakov, Preslav","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":30,"corresponding_author_ids":["https://openalex.org/A5008944385"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.20679999887943268,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.20679999887943268,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.20419999957084656,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.04729999974370003,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hindi","display_name":"Hindi","score":0.9199000000953674},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.5630000233650208},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.43380001187324524},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4074999988079071},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.352400004863739}],"concepts":[{"id":"https://openalex.org/C519982507","wikidata":"https://www.wikidata.org/wiki/Q1568","display_name":"Hindi","level":2,"score":0.9199000000953674},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7225000262260437},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.633400022983551},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.5630000233650208},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.536300003528595},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.43380001187324524},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.4327999949455261},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4074999988079071},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.352400004863739},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.31029999256134033},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.27889999747276306}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2504.06011","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.06011","pdf_url":"https://arxiv.org/pdf/2504.06011","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2504.06011","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2504.06011","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2504.06011","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2504.06011","pdf_url":"https://arxiv.org/pdf/2504.06011","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4416530194.pdf","grobid_xml":"https://content.openalex.org/works/W4416530194.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Developing":[0],"high-quality":[1,67],"large":[2],"language":[3,41],"models":[4,106],"(LLMs)":[5],"for":[6,25],"moderately":[7],"resourced":[8],"languages":[9],"presents":[10],"unique":[11],"challenges":[12],"in":[13,150],"data":[14,76],"availability,":[15],"model":[16],"adaptation,":[17],"and":[18,79,85,104,129,153,164],"evaluation.":[19],"We":[20,117],"introduce":[21],"Llama-3-Nanda-10B-Chat,":[22],"or":[23],"Nanda":[24,46,97,137],"short,":[26],"a":[27,155],"state-of-the-art":[28,140],"Hindi-centric":[29],"instruction-tuned":[30],"generative":[31],"LLM,":[32],"designed":[33],"to":[34,88,138,147],"push":[35],"the":[36,55,63,100],"boundaries":[37],"of":[38,66,107,122,158],"open-source":[39,102],"Hindi":[40,68,84,103,151],"models.":[42,116],"Built":[43],"upon":[44],"Llama-3-8B,":[45],"incorporates":[47],"continuous":[48],"pre-training":[49],"with":[50],"expanded":[51],"transformer":[52],"blocks,":[53],"leveraging":[54],"Llama":[56],"Pro":[57],"methodology.":[58],"A":[59],"key":[60],"challenge":[61],"was":[62],"limited":[64],"availability":[65],"text":[69],"data;":[70],"we":[71,145],"addressed":[72],"this":[73],"through":[74],"rigorous":[75],"curation,":[77],"augmentation,":[78],"strategic":[80],"bilingual":[81],"training,":[82],"balancing":[83],"English":[86],"corpora":[87],"optimize":[89],"cross-linguistic":[90],"knowledge":[91],"transfer.":[92],"With":[93],"10":[94],"billion":[95],"parameters,":[96],"stands":[98],"among":[99],"top-performing":[101],"multilingual":[105],"similar":[108],"scale,":[109],"demonstrating":[110,132],"significant":[111],"advantages":[112],"over":[113],"many":[114],"existing":[115],"provide":[118],"an":[119],"in-depth":[120],"discussion":[121],"training":[123],"strategies,":[124],"fine-tuning":[125],"techniques,":[126],"safety":[127],"alignment,":[128],"evaluation":[130],"metrics,":[131],"how":[133],"these":[134],"approaches":[135],"enabled":[136],"achieve":[139],"results.":[141],"By":[142],"open-sourcing":[143],"Nanda,":[144],"aim":[146],"advance":[148],"research":[149],"LLMs":[152],"support":[154],"wide":[156],"range":[157],"real-world":[159],"applications":[160],"across":[161],"academia,":[162],"industry,":[163],"public":[165],"services.":[166]},"counts_by_year":[],"updated_date":"2026-04-17T18:11:37.981687","created_date":"2025-10-10T00:00:00"}
