{"id":"https://openalex.org/W7151931035","doi":"https://doi.org/10.48550/arxiv.2604.05160","title":"A Multi-Agent Approach to Validate and Refine LLM-Generated Personalized Math Problems","display_name":"A Multi-Agent Approach to Validate and Refine LLM-Generated Personalized Math Problems","publication_year":2026,"publication_date":"2026-04-06","ids":{"openalex":"https://openalex.org/W7151931035","doi":"https://doi.org/10.48550/arxiv.2604.05160"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.05160","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05160","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.05160","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5119181665","display_name":"Fareya Ikram","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ikram, Fareya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133198333","display_name":"Nischal Ashok Kumar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kumar, Nischal Ashok","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133197461","display_name":"Junyang Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Junyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069001617","display_name":"Hunter McNichols","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"McNichols, Hunter","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061100603","display_name":"Candace Walkington","orcid":"https://orcid.org/0000-0002-2338-8760"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Walkington, Candace","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078998782","display_name":"Neil T. Heffernan","orcid":"https://orcid.org/0000-0002-3280-288X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Heffernan, Neil","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133169427","display_name":"Andrew S. Lan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lan, Andrew S.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5119181665"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.31450000405311584,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.31450000405311584,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10636","display_name":"Innovative Teaching and Learning Methods","score":0.07750000059604645,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10130","display_name":"Mathematics Education and Teaching Techniques","score":0.07590000331401825,"subfield":{"id":"https://openalex.org/subfields/3304","display_name":"Education"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/validator","display_name":"Validator","score":0.9358999729156494},{"id":"https://openalex.org/keywords/personalization","display_name":"Personalization","score":0.7929999828338623},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.6057999730110168},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.58160001039505},{"id":"https://openalex.org/keywords/iterative-refinement","display_name":"Iterative refinement","score":0.49399998784065247}],"concepts":[{"id":"https://openalex.org/C35292069","wikidata":"https://www.wikidata.org/wiki/Q1575458","display_name":"Validator","level":2,"score":0.9358999729156494},{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.7929999828338623},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6930999755859375},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.6057999730110168},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.58160001039505},{"id":"https://openalex.org/C2779982483","wikidata":"https://www.wikidata.org/wiki/Q6094420","display_name":"Iterative refinement","level":2,"score":0.49399998784065247},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.41530001163482666},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3357999920845032},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2903999984264374},{"id":"https://openalex.org/C159694833","wikidata":"https://www.wikidata.org/wiki/Q2321565","display_name":"Iterative method","level":2,"score":0.2797999978065491}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.05160","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05160","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.05160","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.05160","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5981224775314331}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Students":[0],"benefit":[1],"from":[2,88],"math":[3],"problems":[4,23,27,86],"contextualized":[5],"to":[6,40,99],"their":[7],"interests.":[8],"Large":[9],"language":[10],"models":[11],"(LLMs)":[12],"offer":[13],"promise":[14],"for":[15,185],"efficient":[16],"personalization":[17,58],"at":[18],"scale.":[19],"However,":[20],"LLM-generated":[21],"personalized":[22],"may":[24],"often":[25],"have":[26,156],"such":[28],"as":[29,59],"unrealistic":[30],"quantities":[31],"and":[32,43,77,127,178,192],"contexts,":[33],"poor":[34],"readability,":[35,76],"limited":[36],"authenticity":[37,126],"with":[38],"respect":[39],"students'":[41,193],"experiences,":[42],"occasional":[44],"mathematical":[45],"inconsistencies.":[46],"To":[47],"alleviate":[48],"these":[49,147],"problems,":[50,138],"we":[51,64],"propose":[52],"a":[53,89,100,141],"multi-agent":[54],"framework":[55,83],"that":[56,113,125,140,152,172,189],"formalizes":[57],"an":[60],"iterative":[61],"generate--validate--revise":[62],"process;":[63],"use":[65],"four":[66],"specialized":[67],"validator":[68,165],"agents":[69],"targeting":[70],"the":[71,130,183],"criteria":[72],"of":[73,103],"solvability,":[74],"realism,":[75],"authenticity,":[78,181],"respectively.":[79],"We":[80,108,149,162],"evaluate":[81],"our":[82],"on":[84,159,176,180],"600":[85],"drawn":[87],"popular":[90],"online":[91],"mathematics":[92],"homework":[93],"platform,":[94],"ASSISTments,":[95],"personalizing":[96],"each":[97],"problem":[98],"fixed":[101],"set":[102],"20":[104],"student":[105],"interest":[106],"topics.":[107],"compare":[109],"three":[110],"refinement":[111,143,154],"strategies":[112,155],"differ":[114],"in":[115,135],"how":[116],"validation":[117],"feedback":[118],"is":[119,174],"coordinated":[120],"into":[121],"revisions.":[122],"Results":[123,170],"show":[124,171],"realism":[128,177],"are":[129],"most":[131],"frequent":[132],"failure":[133],"modes":[134],"initial":[136],"LLM-personalized":[137],"but":[139],"single":[142],"iteration":[144],"substantially":[145],"reduces":[146],"failures.":[148],"further":[150],"find":[151],"different":[153,157,160],"strengths":[158],"criteria.":[161],"also":[163],"assess":[164],"reliability":[166,173],"via":[167],"human":[168],"evaluation.":[169],"highest":[175],"lowest":[179],"highlighting":[182],"need":[184],"better":[186],"evaluation":[187],"protocols":[188],"consider":[190],"teachers'":[191],"personal":[194],"characteristics.":[195]},"counts_by_year":[],"updated_date":"2026-04-09T06:13:59.934233","created_date":"2026-04-09T00:00:00"}
