{"id":"https://openalex.org/W4416243792","doi":"https://doi.org/10.48550/arxiv.2508.08665","title":"Aryabhata: An exam-focused language model for JEE Math","display_name":"Aryabhata: An exam-focused language model for JEE Math","publication_year":2025,"publication_date":"2025-08-12","ids":{"openalex":"https://openalex.org/W4416243792","doi":"https://doi.org/10.48550/arxiv.2508.08665"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2508.08665","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.08665","pdf_url":"https://arxiv.org/pdf/2508.08665","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2508.08665","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5111810032","display_name":"R. Rastogi","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Rastogi, Ritvik","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120402770","display_name":"Sachin Dharashivkar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dharashivkar, Sachin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5032451828","display_name":"Sandeep Varma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Varma, Sandeep","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5111810032"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.6568999886512756,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.6568999886512756,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11122","display_name":"Online Learning and Analytics","score":0.04340000078082085,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.03750000149011612,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.6395000219345093},{"id":"https://openalex.org/keywords/verifiable-secret-sharing","display_name":"Verifiable secret sharing","score":0.545799970626831},{"id":"https://openalex.org/keywords/curriculum","display_name":"Curriculum","score":0.5253999829292297},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.45829999446868896},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.45399999618530273},{"id":"https://openalex.org/keywords/language-acquisition","display_name":"Language acquisition","score":0.36149999499320984},{"id":"https://openalex.org/keywords/constructed-language","display_name":"Constructed language","score":0.3506999909877777}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6589999794960022},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.6395000219345093},{"id":"https://openalex.org/C85847156","wikidata":"https://www.wikidata.org/wiki/Q59015987","display_name":"Verifiable secret sharing","level":3,"score":0.545799970626831},{"id":"https://openalex.org/C47177190","wikidata":"https://www.wikidata.org/wiki/Q207137","display_name":"Curriculum","level":2,"score":0.5253999829292297},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5005000233650208},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.45829999446868896},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.45399999618530273},{"id":"https://openalex.org/C74672266","wikidata":"https://www.wikidata.org/wiki/Q815859","display_name":"Language acquisition","level":2,"score":0.36149999499320984},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.35740000009536743},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3517000079154968},{"id":"https://openalex.org/C94922259","wikidata":"https://www.wikidata.org/wiki/Q33215","display_name":"Constructed language","level":2,"score":0.3506999909877777},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.3447999954223633},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.30709999799728394},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.30649998784065247},{"id":"https://openalex.org/C2779313563","wikidata":"https://www.wikidata.org/wiki/Q17072565","display_name":"On Language","level":2,"score":0.2818000018596649},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.2615000009536743},{"id":"https://openalex.org/C112758219","wikidata":"https://www.wikidata.org/wiki/Q16038819","display_name":"Duration (music)","level":2,"score":0.2612000107765198},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.2533999979496002},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.25270000100135803}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2508.08665","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.08665","pdf_url":"https://arxiv.org/pdf/2508.08665","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2508.08665","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2508.08665","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2508.08665","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2508.08665","pdf_url":"https://arxiv.org/pdf/2508.08665","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,124],"present":[1],"Aryabhata":[2,38,110,126],"1.0,":[3],"a":[4,128],"compact":[5],"7B":[6],"parameter":[7],"math":[8],"reasoning":[9,46],"model":[10,130],"optimized":[11],"for":[12,35,144,159],"the":[13,17],"Indian":[14],"academic":[15],"exam,":[16],"Joint":[18],"Entrance":[19],"Examination":[20],"(JEE).":[21],"Despite":[22],"rapid":[23],"progress":[24],"in":[25,114],"large":[26],"language":[27,136],"models":[28,31,113,153],"(LLMs),":[29],"current":[30],"often":[32],"remain":[33],"unsuitable":[34],"educational":[36],"use.":[37],"1.0":[39],"is":[40,149],"built":[41],"by":[42,49],"merging":[43],"strong":[44],"open-weight":[45],"models,":[47],"followed":[48],"supervised":[50],"fine-tuning":[51],"(SFT)":[52],"with":[53,74,81,86],"curriculum":[54],"learning":[55,73,157],"on":[56,99],"verified":[57],"chain-of-thought":[58],"(CoT)":[59],"traces":[60],"curated":[61],"through":[62],"best-of-$n$":[63],"rejection":[64],"sampling.":[65],"To":[66],"further":[67,155],"boost":[68],"performance,":[69],"we":[70],"apply":[71],"reinforcement":[72],"verifiable":[75],"rewards":[76],"(RLVR)":[77],"using":[78],"A2C":[79],"objective":[80],"group-relative":[82],"advantage":[83],"estimation":[84],"along":[85],"novel":[87],"exploration":[88],"strategies":[89],"such":[90],"as":[91,127],"Adaptive":[92],"Group":[93],"Resizing":[94],"and":[95,105,116],"Temperature":[96],"Scaling.":[97],"Evaluated":[98],"both":[100],"in-distribution":[101],"(JEE":[102],"Main":[103],"2025)":[104],"out-of-distribution":[106],"(MATH,":[107],"GSM8K)":[108],"benchmarks,":[109],"outperforms":[111],"existing":[112],"accuracy":[115],"efficiency,":[117],"while":[118],"offering":[119],"pedagogically":[120],"useful":[121],"step-by-step":[122],"reasoning.":[123],"release":[125,143],"foundation":[129],"to":[131,154],"advance":[132],"exam-centric,":[133],"open-source":[134],"small":[135],"models.":[137],"This":[138],"marks":[139],"our":[140],"first":[141],"open":[142],"community":[145],"feedback":[146],"(https://huggingface.co/PhysicsWallahAI/Aryabhata-1.0);":[147],"PW":[148],"actively":[150],"training":[151],"future":[152],"improve":[156],"outcomes":[158],"students.":[160]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
