{"id":"https://openalex.org/W7133356590","doi":"https://doi.org/10.48550/arxiv.2603.00108","title":"SurgFusion-Net: Diversified Adaptive Multimodal Fusion Network for Surgical Skill Assessment","display_name":"SurgFusion-Net: Diversified Adaptive Multimodal Fusion Network for Surgical Skill Assessment","publication_year":2026,"publication_date":"2026-02-18","ids":{"openalex":"https://openalex.org/W7133356590","doi":"https://doi.org/10.48550/arxiv.2603.00108"},"language":"en","primary_location":{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/a89a5ae8-fe0d-423c-a7e8-c429f0ffd00e","is_oa":true,"landing_page_url":"https://research.manchester.ac.uk/en/publications/a89a5ae8-fe0d-423c-a7e8-c429f0ffd00e","pdf_url":"https://pure.manchester.ac.uk/ws/files/1877075731/2603.00108v1.pdf","source":{"id":"https://openalex.org/S4306400662","display_name":"Research Explorer (The University of Manchester)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I28407311","host_organization_name":"University of Manchester","host_organization_lineage":["https://openalex.org/I28407311"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"He, R, Tesfai, F M, Boal, M W E, Sirajudeen, N, Anastasiou, D, Xu, J, Hoque, M I, Kelly, J D, Sridhar, A, Kadkhodamohammadi, A, Chandrasekaran, D, Clarkson, M J, Stoyanov, D, Francis, N & Mazomenos, E B 2026 'SurgFusion-Net : Diversified Adaptive Multimodal Fusion Network for Surgical Skill Assessment' arXiv. https://doi.org/10.48550/arXiv.2603.00108","raw_type":"info:eu-repo/semantics/preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://pure.manchester.ac.uk/ws/files/1877075731/2603.00108v1.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128010237","display_name":"Runlong He","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"He, Runlong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127977124","display_name":"Freweini M. Tesfai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tesfai, Freweini M.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127981608","display_name":"Matthew W. E. Boal","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Boal, Matthew W. E.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127987729","display_name":"Nazir Sirajudeen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sirajudeen, Nazir","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034986735","display_name":"Dimitrios Anastasiou","orcid":"https://orcid.org/0000-0003-1772-522X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Anastasiou, Dimitrios","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066662339","display_name":"Jialang Xu","orcid":"https://orcid.org/0000-0003-2324-7033"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Jialang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011069641","display_name":"M. I. Hoque","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hoque, Mobarak I.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029036520","display_name":"Philip Edwards","orcid":"https://orcid.org/0000-0003-0203-5736"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Edwards, Philip J.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127902142","display_name":"John D. Kelly","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kelly, John D.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127911187","display_name":"Ashwin Sridhar","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sridhar, Ashwin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019400238","display_name":"Abdolrahim Kadkhodamohammadi","orcid":"https://orcid.org/0000-0002-1873-6660"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kadkhodamohammadi, Abdolrahim","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127889087","display_name":"Dhivya Chandrasekaran","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chandrasekaran, Dhivya","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127942187","display_name":"Matthew J. Clarkson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Clarkson, Matthew J.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127890248","display_name":"Danail Stoyanov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stoyanov, Danail","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031651895","display_name":"Nader Francis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Francis, Nader","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5048400975","display_name":"Evangelos B. Mazomenos","orcid":"https://orcid.org/0000-0003-0357-5996"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mazomenos, Evangelos B.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":16,"corresponding_author_ids":["https://openalex.org/A5128010237"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10916","display_name":"Surgical Simulation and Training","score":0.864799976348877,"subfield":{"id":"https://openalex.org/subfields/2746","display_name":"Surgery"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T10916","display_name":"Surgical Simulation and Training","score":0.864799976348877,"subfield":{"id":"https://openalex.org/subfields/2746","display_name":"Surgery"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.016599999740719795,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.013199999928474426,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.5182999968528748},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.515999972820282},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.4537999927997589},{"id":"https://openalex.org/keywords/multimodality","display_name":"Multimodality","score":0.3864000141620636},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.357699990272522},{"id":"https://openalex.org/keywords/data-integration","display_name":"Data integration","score":0.3391000032424927},{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.3346000015735626},{"id":"https://openalex.org/keywords/optical-flow","display_name":"Optical flow","score":0.32519999146461487}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6830999851226807},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6047999858856201},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.5182999968528748},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.515999972820282},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.4537999927997589},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.3864000141620636},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37790000438690186},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.357699990272522},{"id":"https://openalex.org/C72634772","wikidata":"https://www.wikidata.org/wiki/Q386824","display_name":"Data integration","level":2,"score":0.3391000032424927},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.3346000015735626},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.33379998803138733},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32690000534057617},{"id":"https://openalex.org/C155542232","wikidata":"https://www.wikidata.org/wiki/Q736111","display_name":"Optical flow","level":3,"score":0.32519999146461487},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.323199987411499},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.3190000057220459},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.3160000145435333},{"id":"https://openalex.org/C31395832","wikidata":"https://www.wikidata.org/wiki/Q1318674","display_name":"Testbed","level":2,"score":0.29679998755455017},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.2924000024795532},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.2583000063896179},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.2524000108242035},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.25209999084472656}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/a89a5ae8-fe0d-423c-a7e8-c429f0ffd00e","is_oa":true,"landing_page_url":"https://research.manchester.ac.uk/en/publications/a89a5ae8-fe0d-423c-a7e8-c429f0ffd00e","pdf_url":"https://pure.manchester.ac.uk/ws/files/1877075731/2603.00108v1.pdf","source":{"id":"https://openalex.org/S4306400662","display_name":"Research Explorer (The University of Manchester)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I28407311","host_organization_name":"University of Manchester","host_organization_lineage":["https://openalex.org/I28407311"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"He, R, Tesfai, F M, Boal, M W E, Sirajudeen, N, Anastasiou, D, Xu, J, Hoque, M I, Kelly, J D, Sridhar, A, Kadkhodamohammadi, A, Chandrasekaran, D, Clarkson, M J, Stoyanov, D, Francis, N & Mazomenos, E B 2026 'SurgFusion-Net : Diversified Adaptive Multimodal Fusion Network for Surgical Skill Assessment' arXiv. https://doi.org/10.48550/arXiv.2603.00108","raw_type":"info:eu-repo/semantics/preprint"},{"id":"doi:10.48550/arxiv.2603.00108","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.00108","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:pure.atira.dk:openaire_cris_publications/a89a5ae8-fe0d-423c-a7e8-c429f0ffd00e","is_oa":true,"landing_page_url":"https://research.manchester.ac.uk/en/publications/a89a5ae8-fe0d-423c-a7e8-c429f0ffd00e","pdf_url":"https://pure.manchester.ac.uk/ws/files/1877075731/2603.00108v1.pdf","source":{"id":"https://openalex.org/S4306400662","display_name":"Research Explorer (The University of Manchester)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I28407311","host_organization_name":"University of Manchester","host_organization_lineage":["https://openalex.org/I28407311"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"He, R, Tesfai, F M, Boal, M W E, Sirajudeen, N, Anastasiou, D, Xu, J, Hoque, M I, Kelly, J D, Sridhar, A, Kadkhodamohammadi, A, Chandrasekaran, D, Clarkson, M J, Stoyanov, D, Francis, N & Mazomenos, E B 2026 'SurgFusion-Net : Diversified Adaptive Multimodal Fusion Network for Surgical Skill Assessment' arXiv. https://doi.org/10.48550/arXiv.2603.00108","raw_type":"info:eu-repo/semantics/preprint"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.43972548842430115}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W7133356590.pdf","grobid_xml":"https://content.openalex.org/works/W7133356590.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Robotic-assisted":[0],"surgery":[1],"(RAS)":[2],"is":[3],"established":[4],"in":[5,197,200],"clinical":[6,71,108],"practice,":[7],"and":[8,22,39,53,69,80,90,124,149,158,176,184,205,207,212],"automated":[9],"surgical":[10,20,75,101,171],"skill":[11,102,144],"assessment":[12,174],"utilizing":[13],"multimodal":[14,27,100,164],"data":[15],"offers":[16],"transformative":[17],"potential":[18],"for":[19,42,99],"analytics":[21],"education.":[23],"However,":[24],"developing":[25],"effective":[26],"methods":[28],"remains":[29],"challenging":[30],"due":[31],"to":[32,60,162],"the":[33,62,74,110,125,180],"task":[34],"complexity,":[35],"limited":[36],"annotated":[37],"datasets":[38,141],"insufficient":[40],"techniques":[41],"cross-modal":[43],"information":[44],"fusion.":[45],"Existing":[46],"state-of-the-art":[47],"relies":[48],"exclusively":[49],"on":[50,56,170,179,210],"RGB":[51,115,130],"video":[52],"only":[54],"applies":[55],"dry-lab":[57],"settings,":[58],"failing":[59],"address":[61],"significant":[63],"domain":[64],"gap":[65],"between":[66],"controlled":[67],"simulation":[68],"real":[70],"cases,":[72],"where":[73],"environment":[76],"together":[77],"with":[78,192],"camera":[79],"tissue":[81],"motion":[82],"introduce":[83],"substantial":[84],"complexities.":[85],"This":[86],"work":[87],"introduces":[88],"SurgFusion-Net":[89],"Divergence":[91],"Regulated":[92],"Attention":[93],"(DRA),":[94],"an":[95],"innovative":[96],"fusion":[97],"strategy":[98],"assessment.":[103],"We":[104],"contribute":[105],"two":[106],"first-of-their-kind":[107],"datasets:":[109],"RAH-skill":[111,211],"dataset":[112,127],"containing":[113,128],"279,691":[114],"frames":[116,131],"from":[117,132,166],"37":[118],"videos":[119,134],"of":[120,135,195],"Robot-assisted":[121],"Hysterectomy":[122],"(RAH),":[123],"RARP-skill":[126,185],"70,661":[129],"33":[133],"Robot-Assisted":[136],"Radical":[137],"Prostatectomy":[138],"(RARP).":[139],"Both":[140],"include":[142],"M-GEARS":[143],"annotations,":[145],"corresponding":[146],"optical":[147],"flow":[148],"tool":[150],"segmentation":[151],"masks.":[152],"DRA":[153],"incorporates":[154],"adaptive":[155],"dual":[156],"attention":[157,161],"diversity-promoting":[159],"multi-head":[160],"fuse":[163],"information,":[165],"three":[167],"modalities,":[168],"based":[169],"context,":[172],"enhancing":[173],"accuracy":[175],"reliability.":[177],"Validated":[178],"JIGSAWS":[181,203],"benchmark,":[182],"RAH-skill,":[183],"datasets,":[186],"our":[187],"approach":[188],"outperforms":[189],"recent":[190],"baselines":[191],"SCC":[193],"improvements":[194],"0.02":[196],"LOSO,":[198],"0.04":[199],"LOUO":[201],"across":[202],"tasks,":[204],"0.0538":[206],"0.0493":[208],"gains":[209],"RARP-skill,":[213],"respectively.":[214]},"counts_by_year":[],"updated_date":"2026-04-23T09:07:50.710637","created_date":"2026-03-04T00:00:00"}
