{"id":"https://openalex.org/W7138871742","doi":"https://doi.org/10.48550/arxiv.2603.16822","title":"Surg$\u03a3$: A Spectrum of Large-Scale Multimodal Data and Foundation Models for Surgical Intelligence","display_name":"Surg$\u03a3$: A Spectrum of Large-Scale Multimodal Data and Foundation Models for Surgical Intelligence","publication_year":2026,"publication_date":"2026-03-17","ids":{"openalex":"https://openalex.org/W7138871742","doi":"https://doi.org/10.48550/arxiv.2603.16822"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.16822","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16822","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.16822","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089203954","display_name":"Zhitao Zeng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zeng, Zhitao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129987792","display_name":"Mengya Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Mengya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130115484","display_name":"Jian Jiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Jian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129810609","display_name":"Pengfei Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Pengfei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129862039","display_name":"Yunqiu Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Yunqiu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126873062","display_name":"Zhu Zhuo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhuo, Zhu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058834100","display_name":"Chang Han Low","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Low, Chang Han","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130073899","display_name":"Yufan He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Yufan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130109264","display_name":"Dong Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Dong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129772897","display_name":"Chenxi Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Chenxi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102216183","display_name":"Yiming Gu","orcid":"https://orcid.org/0009-0009-4077-096X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gu, Yiming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130198315","display_name":"Jiaxin Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Jiaxin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011762462","display_name":"Yutong Ban","orcid":"https://orcid.org/0000-0001-5396-9251"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ban, Yutong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129766225","display_name":"Daguang Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Daguang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130079142","display_name":"Qi Dou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dou, Qi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129813608","display_name":"Yueming Jin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Yueming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":16,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.46239998936653137,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.46239998936653137,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10916","display_name":"Surgical Simulation and Training","score":0.14180000126361847,"subfield":{"id":"https://openalex.org/subfields/2746","display_name":"Surgery"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.12200000137090683,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.5900999903678894},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5720999836921692},{"id":"https://openalex.org/keywords/standardization","display_name":"Standardization","score":0.41909998655319214},{"id":"https://openalex.org/keywords/multimodality","display_name":"Multimodality","score":0.36980000138282776},{"id":"https://openalex.org/keywords/semantic-mapping","display_name":"Semantic mapping","score":0.358599990606308},{"id":"https://openalex.org/keywords/surgical-procedures","display_name":"Surgical procedures","score":0.35339999198913574}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.640999972820282},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.5900999903678894},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5720999836921692},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.4327000081539154},{"id":"https://openalex.org/C188087704","wikidata":"https://www.wikidata.org/wiki/Q369577","display_name":"Standardization","level":2,"score":0.41909998655319214},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.39640000462532043},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3799999952316284},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.36980000138282776},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.358599990606308},{"id":"https://openalex.org/C3019611579","wikidata":"https://www.wikidata.org/wiki/Q6641956","display_name":"Surgical procedures","level":2,"score":0.35339999198913574},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.34119999408721924},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.319599986076355},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.30559998750686646},{"id":"https://openalex.org/C3020442560","wikidata":"https://www.wikidata.org/wiki/Q4971815","display_name":"Broad spectrum","level":2,"score":0.2653999924659729},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.2581000030040741},{"id":"https://openalex.org/C168065819","wikidata":"https://www.wikidata.org/wiki/Q845566","display_name":"Debugging","level":2,"score":0.2563000023365021}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.16822","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16822","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.16822","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16822","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Surgical":[0],"intelligence":[1],"has":[2],"the":[3,7,55,83,202],"potential":[4],"to":[5,24,96,122,178],"improve":[6,123],"safety":[8],"and":[9,22,28,76,114,126,137,144,156,212,220],"consistency":[10,125],"of":[11,57,72,85,205],"surgical":[12,17,80,99,104,139,150,185,195],"care,":[13],"yet":[14],"most":[15],"existing":[16],"AI":[18],"frameworks":[19],"remain":[20],"task-specific":[21],"struggle":[23],"generalize":[25],"across":[26,44,129,147],"procedures":[27],"institutions.":[29],"Although":[30],"multimodal":[31,35,61,74,92,167,207],"foundation":[32,77,94,196],"models,":[33,38],"particularly":[34],"large":[36],"language":[37],"have":[39],"demonstrated":[40],"strong":[41],"cross-task":[42,218],"capabilities":[43],"various":[45],"medical":[46],"domains,":[47],"their":[48],"advancement":[49],"in":[50,183],"surgery":[51],"remains":[52],"constrained":[53],"by":[54],"lack":[56],"large-scale,":[58],"systematically":[59],"curated":[60,110],"data.":[62],"To":[63],"address":[64],"this":[65,86],"challenge,":[66],"we":[67],"introduce":[68],"Surg$\u03a3$,":[69],"a":[70,90,118],"spectrum":[71],"large-scale":[73,91,206],"data":[75,93,105,127],"models":[78,197],"for":[79,216],"intelligence.":[81],"At":[82],"core":[84],"framework":[87],"lies":[88],"Surg$\u03a3$-DB,":[89,200],"designed":[95],"support":[97,179],"diverse":[98,138],"tasks.":[100],"Surg$\u03a3$-DB":[101,132,169],"consolidates":[102],"heterogeneous":[103,130],"sources":[106],"(including":[107],"open-source":[108],"datasets,":[109],"in-house":[111],"clinical":[112,135],"collections":[113],"web-source":[115],"data)":[116],"into":[117],"unified":[119,209],"schema,":[120],"aiming":[121],"label":[124],"standardization":[128],"datasets.":[131],"spans":[133],"6":[134],"specialties":[136],"types,":[140],"providing":[141,174],"rich":[142],"image-":[143],"video-level":[145],"annotations":[146,215],"18":[148],"practical":[149,203],"tasks":[151],"covering":[152],"understanding,":[153],"reasoning,":[154],"planning,":[155],"generation,":[157],"at":[158],"an":[159],"unprecedented":[160],"scale":[161],"(over":[162],"5.98M":[163],"conversations).":[164],"Beyond":[165],"conventional":[166],"conversations,":[168],"incorporates":[170],"hierarchical":[171],"reasoning":[172,214],"annotations,":[173,208],"richer":[175],"semantic":[176,210],"cues":[177],"deeper":[180],"contextual":[181],"understanding":[182],"complex":[184],"scenarios.":[186],"We":[187],"further":[188],"provide":[189],"empirical":[190],"evidence":[191],"through":[192],"recently":[193],"developed":[194],"built":[198],"upon":[199],"illustrating":[201],"benefits":[204],"design,":[211],"structured":[213],"improving":[217],"generalization":[219],"interpretability.":[221]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-20T00:00:00"}
