{"id":"https://openalex.org/W4384918569","doi":"https://doi.org/10.48550/arxiv.2307.09548","title":"Surgical Action Triplet Detection by Mixed Supervised Learning of Instrument-Tissue Interactions","display_name":"Surgical Action Triplet Detection by Mixed Supervised Learning of Instrument-Tissue Interactions","publication_year":2023,"publication_date":"2023-07-18","ids":{"openalex":"https://openalex.org/W4384918569","doi":"https://doi.org/10.48550/arxiv.2307.09548"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2307.09548","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.09548","pdf_url":"https://arxiv.org/pdf/2307.09548","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2307.09548","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008060664","display_name":"Saurav Sharma","orcid":"https://orcid.org/0000-0002-6021-6132"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Sharma, Saurav","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018519401","display_name":"Chinedu Innocent Nwoye","orcid":"https://orcid.org/0000-0003-4777-0857"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nwoye, Chinedu Innocent","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107918178","display_name":"Didier Mutter","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mutter, Didier","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5071976104","display_name":"Nicolas Padoy","orcid":"https://orcid.org/0000-0002-5010-4137"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Padoy, Nicolas","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5008060664"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10916","display_name":"Surgical Simulation and Training","score":0.96670001745224,"subfield":{"id":"https://openalex.org/subfields/2746","display_name":"Surgery"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T11930","display_name":"Cardiac, Anesthesia and Surgical Outcomes","score":0.9513000249862671,"subfield":{"id":"https://openalex.org/subfields/2705","display_name":"Cardiology and Cardiovascular Medicine"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7025169134140015},{"id":"https://openalex.org/keywords/bipartite-graph","display_name":"Bipartite graph","score":0.6010505557060242},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.5218419432640076},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5060991644859314},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.4866117238998413},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.46773892641067505},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.45088374614715576},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3263383209705353},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3253800868988037},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2417943775653839},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.11076951026916504}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7025169134140015},{"id":"https://openalex.org/C197657726","wikidata":"https://www.wikidata.org/wiki/Q174733","display_name":"Bipartite graph","level":3,"score":0.6010505557060242},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.5218419432640076},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5060991644859314},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.4866117238998413},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.46773892641067505},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.45088374614715576},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3263383209705353},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3253800868988037},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2417943775653839},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.11076951026916504},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:oai:arXiv.org:2307.09548","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.09548","pdf_url":"https://arxiv.org/pdf/2307.09548","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"pmh:oai:HAL:hal-04215902v1","is_oa":false,"landing_page_url":"https://hal.science/hal-04215902","pdf_url":null,"source":{"id":"https://openalex.org/S4406922461","display_name":"SPIRE - Sciences Po Institutional REpository","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"The 26th International Conference on Medical Image Computing and Computer Assisted Intervention, MICCAI 2023, Vancouver, Canada, octobre 2023, Oct 2023, Vancouver, Canada","raw_type":"Conference papers"},{"id":"doi:10.48550/arxiv.2307.09548","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2307.09548","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2307.09548","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2307.09548","pdf_url":"https://arxiv.org/pdf/2307.09548","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[{"score":0.5799999833106995,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G1536759560","display_name":null,"funder_award_id":"ANR-10-IAHU-02","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G3954744813","display_name":null,"funder_award_id":"ANR-20-CHIA-0029-01","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G54056163","display_name":"Automatic Endoscopic Scene Assessment for Safety Checkpoint Validation in the Operating Room","funder_award_id":"ANR-20-CHIA-0029","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G6851345361","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"},{"id":"https://openalex.org/G7240651115","display_name":null,"funder_award_id":"ANR-10","funder_id":"https://openalex.org/F4320320883","funder_display_name":"Agence Nationale de la Recherche"}],"funders":[{"id":"https://openalex.org/F4320320883","display_name":"Agence Nationale de la Recherche","ror":"https://ror.org/00rbzpz17"},{"id":"https://openalex.org/F4320326256","display_name":"Grand \u00c9quipement National De Calcul Intensif","ror":"https://ror.org/0010d1q40"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4384918569.pdf","grobid_xml":"https://content.openalex.org/works/W4384918569.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2371352078","https://openalex.org/W2953461625","https://openalex.org/W2077383796","https://openalex.org/W2080136900","https://openalex.org/W2372768926","https://openalex.org/W2999799752","https://openalex.org/W2115167491","https://openalex.org/W2567825307","https://openalex.org/W2054458431","https://openalex.org/W1981780420"],"abstract_inverted_index":{"Surgical":[0],"action":[1,27,58],"triplets":[2],"describe":[3],"instrument-tissue":[4],"interactions":[5],"as":[6,42,145,174],"(instrument,":[7],"verb,":[8],"target)":[9],"combinations,":[10],"thereby":[11],"supporting":[12],"a":[13,122,160,179],"detailed":[14],"analysis":[15],"of":[16,45,49,55,74,83,106,135,142,152,239],"surgical":[17,26,50,57],"scene":[18],"activities":[19],"and":[20,52,90,112,171,191,225,233],"workflow.":[21],"This":[22],"work":[23],"focuses":[24],"on":[25,221,229],"triplet":[28,39,59,76,88,100,193,215,234],"detection,":[29,235],"which":[30],"is":[31,67],"challenging":[32],"but":[33],"more":[34],"precise":[35],"than":[36],"the":[37,56,72,81,104,110,116,143,150,156,166,169,175,222,237,240],"traditional":[38],"recognition":[40,54],"task":[41],"it":[43],"consists":[44],"joint":[46],"(1)":[47],"localization":[48,95,232],"instruments":[51,170],"(2)":[53],"associated":[60],"with":[61,109,209],"every":[62],"localized":[63],"instrument.":[64],"Triplet":[65],"detection":[66,89,101],"highly":[68],"complex":[69],"due":[70,102],"to":[71,103,148,164,197],"lack":[73],"spatial":[75,85,207],"annotation.":[77],"We":[78,177,201,217],"analyze":[79],"how":[80],"amount":[82],"instrument":[84,94,206,231],"annotations":[86,208],"affects":[87],"observe":[91],"that":[92,125,183,203],"accurate":[93],"does":[96],"not":[97],"guarantee":[98],"better":[99,214],"risk":[105,151],"erroneous":[107],"associations":[108],"verbs":[111],"targets.":[113],"To":[114],"solve":[115],"two":[117],"tasks,":[118],"we":[119],"propose":[120],"MCIT-IG,":[121],"two-stage":[123],"network,":[124],"stands":[126],"for":[127,189,195],"Multi-Class":[128],"Instrument-aware":[129],"Transformer-Interaction":[130],"Graph.":[131],"The":[132],"MCIT":[133,190],"stage":[134,158],"our":[136,199,219],"network":[137],"models":[138],"per":[139],"class":[140],"embedding":[141],"targets":[144],"additional":[146],"features":[147],"reduce":[149],"misassociating":[153],"triplets.":[154],"Furthermore,":[155],"IG":[157,196],"constructs":[159],"bipartite":[161],"dynamic":[162],"graph":[163],"model":[165,220],"interaction":[167],"between":[168],"targets,":[172],"cast":[173],"verbs.":[176],"utilize":[178],"mixed-supervised":[180],"learning":[181],"strategy":[182],"combines":[184],"weak":[185],"target":[186,210],"presence":[187],"labels":[188,194],"pseudo":[192],"train":[198],"network.":[200],"observed":[202],"complementing":[204],"minimal":[205],"embeddings":[211],"results":[212],"in":[213,243],"detection.":[216],"evaluate":[218],"CholecT50":[223],"dataset":[224],"show":[226],"improved":[227],"performance":[228],"both":[230],"topping":[236],"leaderboard":[238],"CholecTriplet":[241],"challenge":[242],"MICCAI":[244],"2022.":[245]},"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
