{"id":"https://openalex.org/W7138229259","doi":"https://doi.org/10.1609/aaai.v40i39.40578","title":"From Solver to Tutor: Evaluating the Pedagogical Intelligence of LLMs with KMP-Bench","display_name":"From Solver to Tutor: Evaluating the Pedagogical Intelligence of LLMs with KMP-Bench","publication_year":2026,"publication_date":"2026-03-14","ids":{"openalex":"https://openalex.org/W7138229259","doi":"https://doi.org/10.1609/aaai.v40i39.40578"},"language":null,"primary_location":{"id":"doi:10.1609/aaai.v40i39.40578","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i39.40578","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1609/aaai.v40i39.40578","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5061386830","display_name":"Weikang Shi","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Weikang Shi","raw_affiliation_strings":["Multimedia Laboratory (MMLab), The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"Multimedia Laboratory (MMLab), The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085999236","display_name":"Houxing Ren","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Houxing Ren","raw_affiliation_strings":["Multimedia Laboratory (MMLab), The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"Multimedia Laboratory (MMLab), The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129692302","display_name":"Junting Pan","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Junting Pan","raw_affiliation_strings":["Multimedia Laboratory (MMLab), The Chinese University of Hong Kong\nCPII under InnoHK"],"affiliations":[{"raw_affiliation_string":"Multimedia Laboratory (MMLab), The Chinese University of Hong Kong\nCPII under InnoHK","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129707116","display_name":"Aojun Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Aojun Zhou","raw_affiliation_strings":["Multimedia Laboratory (MMLab), The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"Multimedia Laboratory (MMLab), The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129727326","display_name":"Ke Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Ke Wang","raw_affiliation_strings":["Multimedia Laboratory (MMLab), The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"Multimedia Laboratory (MMLab), The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129643603","display_name":"Zimu Lu","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Zimu Lu","raw_affiliation_strings":["Multimedia Laboratory (MMLab), The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"Multimedia Laboratory (MMLab), The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129751033","display_name":"Yunqiao Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Yunqiao Yang","raw_affiliation_strings":["Multimedia Laboratory (MMLab), The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"Multimedia Laboratory (MMLab), The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128058340","display_name":"Yuxuan Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Yuxuan Hu","raw_affiliation_strings":["Multimedia Laboratory (MMLab), The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"Multimedia Laboratory (MMLab), The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101253342","display_name":"Linda Wei","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Linda Wei","raw_affiliation_strings":["Multimedia Laboratory (MMLab), The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"Multimedia Laboratory (MMLab), The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129685846","display_name":"Mingjie Zhan","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Mingjie Zhan","raw_affiliation_strings":["Multimedia Laboratory (MMLab), The Chinese University of Hong Kong"],"affiliations":[{"raw_affiliation_string":"Multimedia Laboratory (MMLab), The Chinese University of Hong Kong","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100732453","display_name":"Hongsheng Li","orcid":"https://orcid.org/0000-0002-9929-4023"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]},{"id":"https://openalex.org/I4210164862","display_name":"Artificial Intelligence in Medicine (Canada)","ror":"https://ror.org/05p590m36","country_code":"CA","type":"company","lineage":["https://openalex.org/I4210164862"]}],"countries":["CA","HK"],"is_corresponding":false,"raw_author_name":"Hongsheng Li","raw_affiliation_strings":["Multimedia Laboratory (MMLab), The Chinese University of Hong Kong\nShanghai Artificial Intelligence Laboratory\nCPII under InnoHK"],"affiliations":[{"raw_affiliation_string":"Multimedia Laboratory (MMLab), The Chinese University of Hong Kong\nShanghai Artificial Intelligence Laboratory\nCPII under InnoHK","institution_ids":["https://openalex.org/I177725633","https://openalex.org/I4210164862"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5061386830"],"corresponding_institution_ids":["https://openalex.org/I177725633"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.43950749,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"40","issue":"39","first_page":"32965","last_page":"32973"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.8177000284194946,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.8177000284194946,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10636","display_name":"Innovative Teaching and Learning Methods","score":0.023499999195337296,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10130","display_name":"Mathematics Education and Teaching Techniques","score":0.013000000268220901,"subfield":{"id":"https://openalex.org/subfields/3304","display_name":"Education"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5997999906539917},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5616999864578247},{"id":"https://openalex.org/keywords/core","display_name":"Core (optical fiber)","score":0.5076000094413757},{"id":"https://openalex.org/keywords/weaving","display_name":"Weaving","score":0.39719998836517334},{"id":"https://openalex.org/keywords/verifiable-secret-sharing","display_name":"Verifiable secret sharing","score":0.3959999978542328},{"id":"https://openalex.org/keywords/solver","display_name":"Solver","score":0.3677000105381012}],"concepts":[{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5997999906539917},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.59170001745224},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5616999864578247},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.5076000094413757},{"id":"https://openalex.org/C145420912","wikidata":"https://www.wikidata.org/wiki/Q853077","display_name":"Mathematics education","level":1,"score":0.451200008392334},{"id":"https://openalex.org/C54525549","wikidata":"https://www.wikidata.org/wiki/Q2553445","display_name":"Weaving","level":2,"score":0.39719998836517334},{"id":"https://openalex.org/C85847156","wikidata":"https://www.wikidata.org/wiki/Q59015987","display_name":"Verifiable secret sharing","level":3,"score":0.3959999978542328},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38359999656677246},{"id":"https://openalex.org/C2778770139","wikidata":"https://www.wikidata.org/wiki/Q1966904","display_name":"Solver","level":2,"score":0.3677000105381012},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.3596999943256378},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3488999903202057},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.3361999988555908},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.2754000127315521},{"id":"https://openalex.org/C3019612716","wikidata":"https://www.wikidata.org/wiki/Q730920","display_name":"Problem solver","level":2,"score":0.27300000190734863},{"id":"https://openalex.org/C132758656","wikidata":"https://www.wikidata.org/wiki/Q5307365","display_name":"Dreyfus model of skill acquisition","level":2,"score":0.2639000117778778},{"id":"https://openalex.org/C188231857","wikidata":"https://www.wikidata.org/wiki/Q2585724","display_name":"Educational assessment","level":2,"score":0.2606000006198883},{"id":"https://openalex.org/C55587333","wikidata":"https://www.wikidata.org/wiki/Q1133029","display_name":"Engineering ethics","level":1,"score":0.258899986743927},{"id":"https://openalex.org/C88610354","wikidata":"https://www.wikidata.org/wiki/Q1813494","display_name":"Teaching method","level":2,"score":0.257099986076355}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v40i39.40578","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i39.40578","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v40i39.40578","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v40i39.40578","pdf_url":null,"source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8164643049240112}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Language":[1],"Models":[2,136],"(LLMs)":[3],"show":[4,140],"significant":[5],"potential":[6],"in":[7],"AI":[8,156],"mathematical":[9],"tutoring,":[10],"yet":[11],"current":[12],"evaluations":[13,102],"often":[14],"rely":[15],"on":[16,103,138,143],"simplistic":[17],"metrics":[18],"or":[19],"narrow":[20],"pedagogical":[21,56,77,125],"scenarios,":[22],"failing":[23],"to":[24,43],"assess":[25,44],"comprehensive,":[26],"multi-turn":[27,69,92],"teaching":[28],"effectiveness.":[29],"In":[30],"this":[31],"paper,":[32],"we":[33,128],"introduce":[34],"KMP-Bench,":[35,144],"a":[36,67,84,106,131],"comprehensive":[37],"K-8":[38],"Mathematical":[39],"Pedagogical":[40],"Benchmark":[41],"designed":[42],"LLMs":[45,111],"from":[46],"two":[47],"complementary":[48],"perspectives.":[49],"The":[50,79],"first":[51],"module,":[52,81],"KMP-Dialogue,":[53],"evaluates":[54],"holistic":[55],"capabilities":[57],"against":[58],"six":[59],"core":[60],"principles":[61],"(e.g.,":[62],"Challenge,":[63],"Explanation,":[64],"Feedback),":[65],"leveraging":[66],"novel":[68],"dialogue":[70,134],"dataset":[71],"constructed":[72],"by":[73],"weaving":[74],"together":[75],"diverse":[76],"components.":[78],"second":[80],"KMP-Skills,":[82],"provides":[83],"granular":[85],"assessment":[86],"of":[87,124,148],"foundational":[88],"tutoring":[89],"abilities,":[90],"including":[91],"problem-solving,":[93],"error":[94],"detection":[95],"and":[96,98],"correction,":[97],"problem":[99],"generation.":[100],"Our":[101],"KMP-Bench":[104],"reveal":[105],"key":[107],"disparity:":[108],"while":[109],"leading":[110],"excel":[112],"at":[113],"tasks":[114],"with":[115,120],"verifiable":[116],"solutions,":[117],"they":[118],"struggle":[119],"the":[121,146],"nuanced":[122],"application":[123],"principles.":[126],"Additionally,":[127],"present":[129],"KMP-Pile,":[130],"large-scale":[132],"(150K)":[133],"dataset.":[135],"fine-tuned":[137],"KMP-Pile":[139],"substantial":[141],"improvement":[142],"underscoring":[145],"value":[147],"pedagogically-rich":[149],"training":[150],"data":[151],"for":[152],"developing":[153],"more":[154],"effective":[155],"math":[157],"tutors.":[158]},"counts_by_year":[],"updated_date":"2026-03-20T20:47:17.329874","created_date":"2026-03-18T00:00:00"}
