{"id":"https://openalex.org/W7163018776","doi":"https://doi.org/10.48550/arxiv.2605.31212","title":"Benchmarking and Enhancing Text-to-Image Models for Generating Visual Representations in Early Arithmetic Education","display_name":"Benchmarking and Enhancing Text-to-Image Models for Generating Visual Representations in Early Arithmetic Education","publication_year":2026,"publication_date":"2026-05-29","ids":{"openalex":"https://openalex.org/W7163018776","doi":"https://doi.org/10.48550/arxiv.2605.31212"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.31212","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.31212","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.31212","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137604025","display_name":"Junling Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Junling","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137553886","display_name":"Boqi Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Boqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137572332","display_name":"Heejin Do","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Do, Heejin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137614378","display_name":"Mubashara Akhtar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Akhtar, Mubashara","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046673805","display_name":"April Yi Wang","orcid":"https://orcid.org/0000-0001-8724-4662"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, April Yi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5002316432","display_name":"Mrinmaya Sachan","orcid":"https://orcid.org/0000-0001-8787-8681"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sachan, Mrinmaya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10130","display_name":"Mathematics Education and Teaching Techniques","score":0.2793999910354614,"subfield":{"id":"https://openalex.org/subfields/3304","display_name":"Education"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10130","display_name":"Mathematics Education and Teaching Techniques","score":0.2793999910354614,"subfield":{"id":"https://openalex.org/subfields/3304","display_name":"Education"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10533","display_name":"Teaching and Learning Programming","score":0.07540000230073929,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.06729999929666519,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.6287000179290771},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.6189000010490417},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6164000034332275},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5458999872207642},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5203999876976013},{"id":"https://openalex.org/keywords/comprehension","display_name":"Comprehension","score":0.4359999895095825},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.4002000093460083},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.37709999084472656}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6776999831199646},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.6287000179290771},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.6189000010490417},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6164000034332275},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5458999872207642},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5203999876976013},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4690999984741211},{"id":"https://openalex.org/C511192102","wikidata":"https://www.wikidata.org/wiki/Q5156948","display_name":"Comprehension","level":2,"score":0.4359999895095825},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4018999934196472},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.4002000093460083},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.37709999084472656},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.35370001196861267},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.33379998803138733},{"id":"https://openalex.org/C177877439","wikidata":"https://www.wikidata.org/wiki/Q7604413","display_name":"Statistical relational learning","level":3,"score":0.3269999921321869},{"id":"https://openalex.org/C12426560","wikidata":"https://www.wikidata.org/wiki/Q189569","display_name":"Basis (linear algebra)","level":2,"score":0.30880001187324524},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.3005000054836273},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.2915000021457672},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.2858999967575073},{"id":"https://openalex.org/C40976572","wikidata":"https://www.wikidata.org/wiki/Q2330873","display_name":"Gauge (firearms)","level":2,"score":0.2720000147819519},{"id":"https://openalex.org/C48164120","wikidata":"https://www.wikidata.org/wiki/Q4491893","display_name":"Concept learning","level":2,"score":0.2694999873638153},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.26669999957084656},{"id":"https://openalex.org/C156325361","wikidata":"https://www.wikidata.org/wiki/Q1152864","display_name":"Grounded theory","level":3,"score":0.26089999079704285},{"id":"https://openalex.org/C22304111","wikidata":"https://www.wikidata.org/wiki/Q1417978","display_name":"Object permanence","level":4,"score":0.25839999318122864},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.2578999996185303}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.31212","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.31212","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.31212","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.31212","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.882332980632782}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"AI":[0],"systems":[1],"are":[2,26],"increasingly":[3],"used":[4],"to":[5,28,40],"support":[6],"educational":[7,69],"content":[8],"creation,":[9],"yet":[10],"it":[11],"remains":[12],"unclear":[13],"whether":[14],"they":[15,25],"can":[16],"generate":[17],"outputs":[18],"that":[19,93],"faithfully":[20],"represent":[21],"the":[22,128],"pedagogical":[23],"concepts":[24],"intended":[27],"teach.":[29],"Thus,":[30],"we":[31,71,117],"introduce":[32],"equation-to-visual":[33],"generation,":[34,43],"a":[35,74],"task":[36],"that,":[37],"in":[38,138],"contrast":[39],"conventional":[41],"image":[42],"requires":[44],"producing":[45],"pedagogically":[46,78],"meaningful":[47],"visuals":[48],"from":[49],"arithmetic":[50],"equations":[51],"while":[52,127],"precisely":[53],"preserving":[54],"their":[55],"numerical":[56,134],"and":[57,65,110,135],"relational":[58,112,136],"structure.":[59,113],"Informed":[60],"by":[61,106],"interviews":[62],"with":[63,83,103],"teachers":[64],"an":[66],"analysis":[67],"of":[68],"materials,":[70],"construct":[72],"E2V-Bench,":[73],"benchmark":[75],"spanning":[76],"four":[77],"grounded":[79],"visual":[80,88],"types,":[81],"along":[82],"automatic":[84],"metrics":[85],"for":[86,132],"evaluating":[87],"correctness.":[89],"Our":[90],"evaluation":[91],"reveals":[92],"recent":[94],"text-to-image":[95],"(T2I)":[96],"models":[97],"frequently":[98],"fail":[99],"on":[100,115],"this":[101],"task,":[102],"errors":[104],"dominated":[105],"incorrect":[107],"object":[108],"counts":[109],"broken":[111],"Building":[114],"this,":[116],"explore":[118],"benchmark-guided":[119],"enhancement":[120],"strategies.":[121],"These":[122],"strategies":[123],"improve":[124],"representative":[125],"models,":[126],"remaining":[129],"gap":[130],"calls":[131],"stronger":[133],"grounding":[137],"future":[139],"T2I":[140],"models.":[141]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-06-02T00:00:00"}
