{"id":"https://openalex.org/W7135039912","doi":"https://doi.org/10.48550/arxiv.2603.10767","title":"mAceReason-Math: A Dataset of High-Quality Multilingual Math Problems Ready For RLVR","display_name":"mAceReason-Math: A Dataset of High-Quality Multilingual Math Problems Ready For RLVR","publication_year":2026,"publication_date":"2026-03-11","ids":{"openalex":"https://openalex.org/W7135039912","doi":"https://doi.org/10.48550/arxiv.2603.10767"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.10767","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.10767","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.10767","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128827923","display_name":"Konstantin Dobler","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Dobler, Konstantin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128837449","display_name":"Simon Lehnerer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lehnerer, Simon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072963991","display_name":"Federico Scozzafava","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Scozzafava, Federico","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128869831","display_name":"Jonathan Janke","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Janke, Jonathan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128826683","display_name":"Mohamed Ali","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ali, Mohamed","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5128827923"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.22859999537467957,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.22859999537467957,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.1875,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.06459999829530716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7177000045776367},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.5080000162124634},{"id":"https://openalex.org/keywords/verifiable-secret-sharing","display_name":"Verifiable secret sharing","score":0.4523000121116638},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.4059000015258789},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.33250001072883606},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.30140000581741333}],"concepts":[{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7177000045776367},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6880999803543091},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5210999846458435},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.5080000162124634},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.45419999957084656},{"id":"https://openalex.org/C85847156","wikidata":"https://www.wikidata.org/wiki/Q59015987","display_name":"Verifiable secret sharing","level":3,"score":0.4523000121116638},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.4059000015258789},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.366100013256073},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.33250001072883606},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.30140000581741333},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.29829999804496765},{"id":"https://openalex.org/C148043351","wikidata":"https://www.wikidata.org/wiki/Q4456944","display_name":"Current (fluid)","level":2,"score":0.2955000102519989},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.2768999934196472},{"id":"https://openalex.org/C74672266","wikidata":"https://www.wikidata.org/wiki/Q815859","display_name":"Language acquisition","level":2,"score":0.26269999146461487},{"id":"https://openalex.org/C2780035574","wikidata":"https://www.wikidata.org/wiki/Q30081","display_name":"Multilingualism","level":2,"score":0.26109999418258667},{"id":"https://openalex.org/C2781020372","wikidata":"https://www.wikidata.org/wiki/Q533093","display_name":"On the fly","level":2,"score":0.25679999589920044},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.2529999911785126}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.10767","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.10767","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.10767","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.10767","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8261984586715698}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Reinforcement":[0],"Learning":[1],"with":[2,53,121],"Verifiable":[3],"Rewards":[4],"(RLVR)":[5],"has":[6],"been":[7,44],"successfully":[8],"applied":[9],"to":[10,70,108,132],"significantly":[11],"boost":[12],"the":[13,22,47,130,140],"capabilities":[14],"of":[15,64,87,90,118],"pretrained":[16],"large":[17],"language":[18],"models,":[19],"especially":[20],"in":[21,46,59,115,139],"math":[23,92],"and":[24,31,41,55,61,110,137],"logic":[25],"problem":[26],"domains.":[27],"However,":[28],"current":[29,56,76],"research":[30,136,141],"available":[32],"training":[33,39,73],"datasets":[34],"remain":[35],"English-centric.":[36],"While":[37],"multilingual":[38,134],"data":[40],"benchmarks":[42],"have":[43],"created":[45,52],"past,":[48],"they":[49],"were":[50],"not":[51],"RLVR":[54,101,135],"model":[57],"capability":[58],"mind,":[60],"their":[62],"level":[63],"difficulty":[65],"is":[66],"often":[67],"too":[68],"low":[69],"provide":[71,83],"appropriate":[72],"signals":[74],"for":[75,100],"models.":[77],"To":[78],"address":[79],"this":[80],"gap,":[81],"we":[82],"mAceReason-Math,":[84],"a":[85,96,116],"dataset":[86,131],"high-quality":[88],"translations":[89],"challenging":[91],"problems":[93],"sourced":[94],"from":[95],"corpus":[97],"specifically":[98],"curated":[99],"(AceReason-Math).":[102],"We":[103,128],"further":[104],"take":[105],"specific":[106],"care":[107],"clean":[109],"improve":[111],"our":[112],"translations,":[113],"resulting":[114],"coverage":[117],"14":[119],"languages":[120],"more":[122],"than":[123],"10,000":[124],"samples":[125],"per":[126],"language.":[127],"release":[129],"facilitate":[133],"benchmarking":[138],"community.":[142]},"counts_by_year":[],"updated_date":"2026-03-17T06:59:57.516163","created_date":"2026-03-13T00:00:00"}
