{"id":"https://openalex.org/W7125788709","doi":"https://doi.org/10.48550/arxiv.2601.18085","title":"\"Crash Test Dummies\" for AI-Enabled Clinical Assessment: Validating Virtual Patient Scenarios with Virtual Learners","display_name":"\"Crash Test Dummies\" for AI-Enabled Clinical Assessment: Validating Virtual Patient Scenarios with Virtual Learners","publication_year":2026,"publication_date":"2026-01-26","ids":{"openalex":"https://openalex.org/W7125788709","doi":"https://doi.org/10.48550/arxiv.2601.18085"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.18085","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.18085","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.18085","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5124012691","display_name":"Brian Gin","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Gin, Brian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124015613","display_name":"Ahreum Lim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lim, Ahreum","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124015767","display_name":"Fl\u00e1via Silva e Oliveira","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oliveira, Fl\u00e1via Silva e","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123902453","display_name":"Kuan Xing","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xing, Kuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124001972","display_name":"Xiaomei Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Xiaomei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124030598","display_name":"Gayana Amiyangoda","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Amiyangoda, Gayana","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123932348","display_name":"Thilanka Seneviratne","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Seneviratne, Thilanka","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123895857","display_name":"Alison F. Doubleday","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Doubleday, Alison F.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124038749","display_name":"Ananya Gangopadhyaya","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gangopadhyaya, Ananya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123984098","display_name":"Bob Kiser","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kiser, Bob","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123957471","display_name":"Lukas Shum-Tim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shum-Tim, Lukas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124044501","display_name":"Dhruva Patel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Patel, Dhruva","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124018728","display_name":"Kosala Marambe","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Marambe, Kosala","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123974508","display_name":"Lauren Maggio","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Maggio, Lauren","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5124028980","display_name":"Ara Tekian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tekian, Ara","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5123963625","display_name":"Yoon Soo Park","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Yoon Soo","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":16,"corresponding_author_ids":["https://openalex.org/A5124012691"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.4392000138759613,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.4392000138759613,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11238","display_name":"Simulation-Based Education in Healthcare","score":0.3747999966144562,"subfield":{"id":"https://openalex.org/subfields/2737","display_name":"Physiology"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12574","display_name":"Clinical Reasoning and Diagnostic Skills","score":0.09070000052452087,"subfield":{"id":"https://openalex.org/subfields/2714","display_name":"Family Practice"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/virtual-patient","display_name":"Virtual patient","score":0.6089000105857849},{"id":"https://openalex.org/keywords/inter-rater-reliability","display_name":"Inter-rater reliability","score":0.5310999751091003},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.4880000054836273},{"id":"https://openalex.org/keywords/competence","display_name":"Competence (human resources)","score":0.4787999987602234},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.45350000262260437},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.4449000060558319},{"id":"https://openalex.org/keywords/educational-measurement","display_name":"Educational measurement","score":0.4374000132083893},{"id":"https://openalex.org/keywords/item-response-theory","display_name":"Item response theory","score":0.4081999957561493},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.364300012588501}],"concepts":[{"id":"https://openalex.org/C2778533338","wikidata":"https://www.wikidata.org/wiki/Q7935148","display_name":"Virtual patient","level":2,"score":0.6089000105857849},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6083999872207642},{"id":"https://openalex.org/C61863361","wikidata":"https://www.wikidata.org/wiki/Q470749","display_name":"Inter-rater reliability","level":3,"score":0.5310999751091003},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4925999939441681},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.4880000054836273},{"id":"https://openalex.org/C100521375","wikidata":"https://www.wikidata.org/wiki/Q2015382","display_name":"Competence (human resources)","level":2,"score":0.4787999987602234},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4668000042438507},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.45350000262260437},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.4449000060558319},{"id":"https://openalex.org/C22156102","wikidata":"https://www.wikidata.org/wiki/Q5341294","display_name":"Educational measurement","level":3,"score":0.4374000132083893},{"id":"https://openalex.org/C19875794","wikidata":"https://www.wikidata.org/wiki/Q1207340","display_name":"Item response theory","level":3,"score":0.4081999957561493},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3801000118255615},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.364300012588501},{"id":"https://openalex.org/C178823583","wikidata":"https://www.wikidata.org/wiki/Q3269883","display_name":"Online assessment","level":3,"score":0.3443000018596649},{"id":"https://openalex.org/C171606756","wikidata":"https://www.wikidata.org/wiki/Q506132","display_name":"Psychometrics","level":2,"score":0.33239999413490295},{"id":"https://openalex.org/C33724603","wikidata":"https://www.wikidata.org/wiki/Q812540","display_name":"Bayesian network","level":2,"score":0.3163999915122986},{"id":"https://openalex.org/C80059220","wikidata":"https://www.wikidata.org/wiki/Q7521302","display_name":"Simulated patient","level":2,"score":0.3059000074863434},{"id":"https://openalex.org/C194969405","wikidata":"https://www.wikidata.org/wiki/Q170519","display_name":"Virtual reality","level":2,"score":0.2915000021457672},{"id":"https://openalex.org/C75630572","wikidata":"https://www.wikidata.org/wiki/Q538904","display_name":"Applied psychology","level":1,"score":0.28700000047683716},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.2833999991416931},{"id":"https://openalex.org/C156639949","wikidata":"https://www.wikidata.org/wiki/Q13362737","display_name":"Item bank","level":4,"score":0.2777999937534332},{"id":"https://openalex.org/C25344961","wikidata":"https://www.wikidata.org/wiki/Q192726","display_name":"Virtual machine","level":2,"score":0.27489998936653137},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.27239999175071716},{"id":"https://openalex.org/C83849319","wikidata":"https://www.wikidata.org/wiki/Q7295720","display_name":"Rating scale","level":2,"score":0.26759999990463257},{"id":"https://openalex.org/C150303390","wikidata":"https://www.wikidata.org/wiki/Q1983852","display_name":"Virtual actor","level":3,"score":0.26600000262260437},{"id":"https://openalex.org/C3019813237","wikidata":"https://www.wikidata.org/wiki/Q65089264","display_name":"Model validation","level":2,"score":0.2574999928474426},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.2558000087738037},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.2526000142097473}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.18085","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.18085","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.18085","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.18085","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7780169248580933,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Background:":[0],"In":[1],"medical":[2],"and":[3,29,38,47,66,82,91,109,135,141,177,183,232],"health":[4],"professions":[5],"education":[6],"(HPE),":[7],"AI":[8,61,78,112,188,205],"is":[9],"increasingly":[10],"used":[11],"to":[12,51,64,159,210,239],"assess":[13],"clinical":[14],"competencies,":[15,155],"including":[16],"via":[17],"virtual":[18,79,100,102,218],"standardized":[19],"patients.":[20],"However,":[21],"most":[22],"evaluations":[23],"rely":[24],"on":[25],"AI-human":[26],"interrater":[27],"reliability":[28],"lack":[30],"a":[31,97,124,168,199,216,222],"measurement":[32,83],"framework":[33],"for":[34,85,203],"how":[35],"cases,":[36],"learners,":[37,208],"raters":[39,113,189],"jointly":[40],"shape":[41],"scores.":[42],"This":[43],"leaves":[44],"robustness":[45],"uncertain":[46],"can":[48],"expose":[49],"learners":[50,103],"misguidance":[52],"from":[53],"unvalidated":[54],"systems.":[55],"We":[56,95,196],"address":[57],"this":[58],"by":[59,175],"using":[60,190],"\"simulated":[62],"learners\"":[63],"stress-test":[65],"psychometrically":[67],"characterize":[68],"assessment":[69,237],"pipelines":[70],"before":[71],"human":[72,242],"use.":[73],"Objective:":[74],"Develop":[75],"an":[76],"open-source":[77],"patient":[80,219],"platform":[81,98,220],"model":[84,127,151,225],"robust":[86],"competency":[87,107,176,230],"evaluation":[88],"across":[89,163,187],"cases":[90],"rating":[92],"conditions.":[93],"Methods:":[94],"built":[96],"with":[99,104,116,123,147,156,207,221,241],"patients,":[101],"tunable":[105],"ACGME-aligned":[106],"profiles,":[108],"multiple":[110],"independent":[111],"scoring":[114],"encounters":[115],"structured":[117],"Key-Features":[118],"items.":[119],"Transcripts":[120],"were":[121,145],"analyzed":[122],"Bayesian":[125],"HRM-SDT":[126],"that":[128],"treats":[129],"ratings":[130],"as":[131],"decisions":[132],"under":[133],"uncertainty":[134],"separates":[136],"learner":[137],"ability,":[138],"case":[139,173],"performance,":[140],"rater":[142,180],"behavior;":[143],"parameters":[144],"estimated":[146,172],"MCMC.":[148],"Results:":[149],"The":[150],"recovered":[152],"simulated":[153],"learners'":[154],"significant":[157],"correlations":[158],"the":[160],"generating":[161],"competencies":[162],"all":[164],"ACGME":[165],"domains":[166],"despite":[167],"non-deterministic":[169],"pipeline.":[170],"It":[171],"difficulty":[174],"showed":[178],"stable":[179],"detection":[181],"(sensitivity)":[182],"criteria":[184],"(severity/leniency":[185],"thresholds)":[186],"identical":[191],"models/prompts":[192],"but":[193],"different":[194],"seeds.":[195],"also":[197],"propose":[198],"staged":[200],"\"safety":[201],"blueprint\"":[202],"deploying":[204],"tools":[206],"tied":[209],"entrustment-based":[211],"validation":[212,234],"milestones.":[213],"Conclusions:":[214],"Combining":[215],"purpose-built":[217],"principled":[223],"psychometric":[224],"enables":[226],"robust,":[227],"interpretable,":[228],"generalizable":[229],"estimates":[231],"supports":[233],"of":[235],"AI-assisted":[236],"prior":[238],"use":[240],"learners.":[243]},"counts_by_year":[],"updated_date":"2026-01-28T23:18:48.515280","created_date":"2026-01-28T00:00:00"}
