{"id":"https://openalex.org/W7133341422","doi":"https://doi.org/10.48550/arxiv.2603.00056","title":"How effective are VLMs in assisting humans in inferring the quality of mental models from Multimodal short answers?","display_name":"How effective are VLMs in assisting humans in inferring the quality of mental models from Multimodal short answers?","publication_year":2026,"publication_date":"2026-02-10","ids":{"openalex":"https://openalex.org/W7133341422","doi":"https://doi.org/10.48550/arxiv.2603.00056"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.00056","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00056","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.00056","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5029549986","display_name":"Pritam Sil","orcid":"https://orcid.org/0000-0002-0992-6892"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sil, Pritam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006357925","display_name":"DurgaPrasad Karnam","orcid":"https://orcid.org/0000-0002-7620-0223"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Karnam, Durgaprasad","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127945088","display_name":"Vinay Reddy Venumuddala","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Venumuddala, Vinay Reddy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128020117","display_name":"Pushpak Bhattacharyya","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bhattacharyya, Pushpak","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10072","display_name":"Science Education and Pedagogy","score":0.6341000199317932,"subfield":{"id":"https://openalex.org/subfields/3304","display_name":"Education"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10072","display_name":"Science Education and Pedagogy","score":0.6341000199317932,"subfield":{"id":"https://openalex.org/subfields/3304","display_name":"Education"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11902","display_name":"Intelligent Tutoring Systems and Adaptive Learning","score":0.11490000039339066,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10636","display_name":"Innovative Teaching and Learning Methods","score":0.03830000013113022,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.6898000240325928},{"id":"https://openalex.org/keywords/mental-model","display_name":"Mental model","score":0.605400025844574},{"id":"https://openalex.org/keywords/computational-model","display_name":"Computational model","score":0.3041999936103821},{"id":"https://openalex.org/keywords/mental-health","display_name":"Mental health","score":0.2870999872684479},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.2770000100135803},{"id":"https://openalex.org/keywords/conceptual-model","display_name":"Conceptual model","score":0.27410000562667847}],"concepts":[{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.6898000240325928},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6642000079154968},{"id":"https://openalex.org/C2982912361","wikidata":"https://www.wikidata.org/wiki/Q1851867","display_name":"Mental model","level":2,"score":0.605400025844574},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.492900013923645},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.43779999017715454},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4320000112056732},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3091000020503998},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.3041999936103821},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2881999909877777},{"id":"https://openalex.org/C134362201","wikidata":"https://www.wikidata.org/wiki/Q317309","display_name":"Mental health","level":2,"score":0.2870999872684479},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.2770000100135803},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.2754000127315521},{"id":"https://openalex.org/C13606891","wikidata":"https://www.wikidata.org/wiki/Q2623243","display_name":"Conceptual model","level":2,"score":0.27410000562667847},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2651999890804291},{"id":"https://openalex.org/C3020001037","wikidata":"https://www.wikidata.org/wiki/Q836575","display_name":"Quality assessment","level":3,"score":0.2630999982357025},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.25699999928474426}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.00056","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00056","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.00056","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00056","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8869808316230774,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"STEM":[0],"Mental":[1],"models":[2,65,89,114,162],"can":[3,31,151],"play":[4],"a":[5,14,131,138],"critical":[6,45],"role":[7],"in":[8,158],"assessing":[9],"students'":[10,42,87],"conceptual":[11],"understanding":[12,52],"of":[13,47,50,86,117,128,134,163],"topic.":[15],"They":[16],"not":[17,54],"only":[18,124],"offer":[19],"insights":[20],"into":[21,27],"what":[22],"students":[23,191],"know":[24],"but":[25],"also":[26],"how":[28],"effectively":[29,179],"they":[30,123],"apply,":[32],"relate":[33],"to,":[34],"and":[35,53,137,173,185],"integrate":[36],"concepts":[37],"across":[38],"various":[39],"contexts.":[40],"Thus,":[41],"responses":[43,93],"are":[44],"markers":[46],"the":[48,84,112,160],"quality":[49,85],"their":[51,91,164,176],"entities":[55],"that":[56,82,111,187],"should":[57],"be":[58,152],"merely":[59],"graded.":[60],"However,":[61],"inferring":[62,159],"these":[63,150],"mental":[64,88,161],"from":[66,90],"student":[67],"answers":[68],"is":[69,121],"challenging":[70],"as":[71,97],"it":[72],"requires":[73],"deep":[74],"reasoning":[75],"skills.":[76],"We":[77],"propose":[78],"MMGrader,":[79],"an":[80,98,126],"approach":[81],"infers":[83],"multimodal":[92],"using":[94],"concept":[95],"graphs":[96],"analytical":[99],"framework.":[100],"In":[101],"our":[102],"evaluation":[103],"with":[104,143],"9":[105],"openly":[106],"available":[107],"models,":[108],"we":[109],"found":[110],"best-performing":[113],"fall":[115],"short":[116],"human-level":[118],"performance.":[119],"This":[120],"because":[122],"achieved":[125],"accuracy":[127],"approximately":[129],"40%,":[130],"prediction":[132],"error":[133],"1.1":[135],"units,":[136],"scoring":[139,145],"distribution":[140],"fairly":[141],"aligned":[142],"human":[144],"patterns.":[146],"With":[147],"improved":[148],"accuracy,":[149],"highly":[153],"effective":[154],"assistants":[155],"to":[156,169],"teachers":[157],"entire":[165],"classrooms,":[166],"enabling":[167],"them":[168],"do":[170],"so":[171],"efficiently":[172],"help":[174,183],"improve":[175],"pedagogies":[177],"more":[178],"by":[180],"designing":[181],"targeted":[182],"sessions":[184],"lectures":[186],"strengthen":[188],"areas":[189],"where":[190],"collectively":[192],"demonstrate":[193],"lower":[194],"proficiency.":[195]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-04T00:00:00"}
