{"id":"https://openalex.org/W7156273530","doi":"https://doi.org/10.48550/arxiv.2604.22156","title":"Sum-of-Checks: Structured Reasoning for Surgical Safety with Large Vision-Language Models","display_name":"Sum-of-Checks: Structured Reasoning for Surgical Safety with Large Vision-Language Models","publication_year":2026,"publication_date":"2026-04-24","ids":{"openalex":"https://openalex.org/W7156273530","doi":"https://doi.org/10.48550/arxiv.2604.22156"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.22156","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.22156","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.22156","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5057842780","display_name":"Weiqiu You","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"You, Weiqiu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134679704","display_name":"Cassandra Goldberg","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Goldberg, Cassandra","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134719798","display_name":"Amin Madani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Madani, Amin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112853881","display_name":"Daniel A. Hashimoto","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hashimoto, Daniel A.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134699387","display_name":"Eric Wong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wong, Eric","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10916","display_name":"Surgical Simulation and Training","score":0.43230000138282776,"subfield":{"id":"https://openalex.org/subfields/2746","display_name":"Surgery"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T10916","display_name":"Surgical Simulation and Training","score":0.43230000138282776,"subfield":{"id":"https://openalex.org/subfields/2746","display_name":"Surgery"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.20190000534057617,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12574","display_name":"Clinical Reasoning and Diagnostic Skills","score":0.08479999750852585,"subfield":{"id":"https://openalex.org/subfields/2714","display_name":"Family Practice"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.49230000376701355},{"id":"https://openalex.org/keywords/observational-study","display_name":"Observational study","score":0.41190001368522644},{"id":"https://openalex.org/keywords/laparoscopic-cholecystectomy","display_name":"Laparoscopic cholecystectomy","score":0.39399999380111694},{"id":"https://openalex.org/keywords/binary-number","display_name":"Binary number","score":0.38850000500679016},{"id":"https://openalex.org/keywords/structuring","display_name":"Structuring","score":0.3734000027179718},{"id":"https://openalex.org/keywords/audit","display_name":"Audit","score":0.36250001192092896},{"id":"https://openalex.org/keywords/transparency","display_name":"Transparency (behavior)","score":0.34940001368522644}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5770000219345093},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.49230000376701355},{"id":"https://openalex.org/C23131810","wikidata":"https://www.wikidata.org/wiki/Q818574","display_name":"Observational study","level":2,"score":0.41190001368522644},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4092000126838684},{"id":"https://openalex.org/C2987287001","wikidata":"https://www.wikidata.org/wiki/Q638774","display_name":"Laparoscopic cholecystectomy","level":2,"score":0.39399999380111694},{"id":"https://openalex.org/C48372109","wikidata":"https://www.wikidata.org/wiki/Q3913","display_name":"Binary number","level":2,"score":0.38850000500679016},{"id":"https://openalex.org/C2775945657","wikidata":"https://www.wikidata.org/wiki/Q381442","display_name":"Structuring","level":2,"score":0.3734000027179718},{"id":"https://openalex.org/C199521495","wikidata":"https://www.wikidata.org/wiki/Q181487","display_name":"Audit","level":2,"score":0.36250001192092896},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.34940001368522644},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.30300000309944153},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.29829999804496765},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2953000068664551},{"id":"https://openalex.org/C19527891","wikidata":"https://www.wikidata.org/wiki/Q1120908","display_name":"Medical physics","level":1,"score":0.2770000100135803},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.26980000734329224},{"id":"https://openalex.org/C3018741271","wikidata":"https://www.wikidata.org/wiki/Q1346149","display_name":"Surgical complication","level":3,"score":0.26409998536109924},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.2628999948501587},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.26269999146461487},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.25459998846054077},{"id":"https://openalex.org/C3019611579","wikidata":"https://www.wikidata.org/wiki/Q6641956","display_name":"Surgical procedures","level":2,"score":0.2515000104904175}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.22156","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.22156","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.22156","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.22156","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"score":0.42818763852119446,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Purpose:":[0],"Accurate":[1],"assessment":[2],"of":[3,7,91,140,176],"the":[4,97,130],"Critical":[5],"View":[6],"Safety":[8],"(CVS)":[9],"during":[10],"laparoscopic":[11,70],"cholecystectomy":[12],"is":[13,188,198],"essential":[14],"to":[15,40,129],"prevent":[16],"bile":[17],"duct":[18],"injury,":[19],"a":[20,52,69,78],"complication":[21],"associated":[22],"with":[23,113],"significant":[24],"morbidity":[25],"and":[26,42,81,109,114,137,174,192],"mortality.":[27],"While":[28],"large":[29],"vision-language":[30],"models":[31,136],"(LVLMs)":[32],"offer":[33],"flexible":[34],"reasoning,":[35],"their":[36],"predictions":[37],"remain":[38],"difficult":[39],"audit":[41],"unreliable":[43],"on":[44,96,148,159],"safety-critical":[45],"surgical":[46,165,194],"tasks.":[47],"Methods:":[48],"We":[49,94],"introduce":[50],"Sum-of-Checks,":[51],"framework":[53],"that":[54,144,181],"decomposes":[55],"each":[56,75,112],"CVS":[57,178],"criterion":[58],"into":[59,167],"expert-defined":[60],"reasoning":[61,166],"checks":[62,142,150,170],"reflecting":[63],"clinically":[64],"relevant":[65],"visual":[66],"evidence.":[67,162],"Given":[68],"frame,":[71],"an":[72],"LVLM":[73],"evaluates":[74],"check,":[76],"producing":[77],"binary":[79],"judgment":[80],"justification.":[82],"Criterion-level":[83],"scores":[84],"are":[85,146],"computed":[86],"via":[87],"fixed,":[88],"weighted":[89],"aggregation":[90],"check":[92],"outcomes.":[93],"evaluate":[95],"Endoscapes2023":[98],"benchmark":[99],"using":[100],"three":[101,135],"frontier":[102],"LVLMs,":[103],"comparing":[104],"against":[105],"direct":[106],"prompting,":[107],"chain-of-thought,":[108],"sub-question":[110],"decomposition,":[111],"without":[115],"few-shot":[116],"examples.":[117],"Results:":[118],"Sum-of-Checks":[119],"improves":[120,171],"average":[121,124],"frame-level":[122],"mean":[123],"precision":[125],"by":[126],"12--14%":[127],"relative":[128],"best":[131],"baseline":[132],"across":[133],"all":[134],"criteria.":[138],"Analysis":[139],"individual":[141],"reveals":[143],"LVLMs":[145],"reliable":[147,191],"observational":[149],"(e.g.,":[151],"visibility,":[152],"tool":[153],"obstruction)":[154],"but":[155],"show":[156],"substantial":[157],"variability":[158],"decision-critical":[160],"anatomical":[161],"Conclusion:":[163],"Structuring":[164],"expert-aligned":[168],"verification":[169],"both":[172],"accuracy":[173],"transparency":[175],"LVLM-based":[177],"assessment,":[179],"demonstrating":[180],"explicitly":[182],"separating":[183],"evidence":[184],"elicitation":[185],"from":[186],"decision-making":[187],"critical":[189],"for":[190],"auditable":[193],"AI":[195],"systems.":[196],"Code":[197],"available":[199],"at":[200],"https://github.com/BrachioLab/SumOfChecks.":[201]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-04-28T00:00:00"}
