{"id":"https://openalex.org/W4400908946","doi":"https://doi.org/10.1109/siu61531.2024.10601051","title":"Generating Automatic Surgical Captions Using a Contrastive Language-Image Pre-Training Model for Nephrectomy Surgery Images","display_name":"Generating Automatic Surgical Captions Using a Contrastive Language-Image Pre-Training Model for Nephrectomy Surgery Images","publication_year":2024,"publication_date":"2024-05-15","ids":{"openalex":"https://openalex.org/W4400908946","doi":"https://doi.org/10.1109/siu61531.2024.10601051"},"language":"en","primary_location":{"id":"doi:10.1109/siu61531.2024.10601051","is_oa":false,"landing_page_url":"https://doi.org/10.1109/siu61531.2024.10601051","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 32nd Signal Processing and Communications Applications Conference (SIU)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017372993","display_name":"Sevdenur K\u00fct\u00fck","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Sevdenur K\u00fct\u00fck","raw_affiliation_strings":["Fen Bilimleri Enstit&#x00FC;s&#x00FC;, Gazi &#x00DC;niversitesi,Bilgisayar M&#x00FC;hendisli&#x011F;i Ana Bilim Dal&#x0131;,Ankara,T&#x00FC;rkiye"],"affiliations":[{"raw_affiliation_string":"Fen Bilimleri Enstit&#x00FC;s&#x00FC;, Gazi &#x00DC;niversitesi,Bilgisayar M&#x00FC;hendisli&#x011F;i Ana Bilim Dal&#x0131;,Ankara,T&#x00FC;rkiye","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056610357","display_name":"Tuba \u00c7a\u011fl\u0131kantar","orcid":"https://orcid.org/0000-0001-5590-5307"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tuba \u00c7a\u011fl\u0131kantar","raw_affiliation_strings":["M&#x00FC;hendislik Fak&#x00FC;ltesi, Gazi &#x00DC;niversitesi,Bilgisayar M&#x00FC;hendisli&#x011F;i,Ankara,T&#x00FC;rkiye"],"affiliations":[{"raw_affiliation_string":"M&#x00FC;hendislik Fak&#x00FC;ltesi, Gazi &#x00DC;niversitesi,Bilgisayar M&#x00FC;hendisli&#x011F;i,Ankara,T&#x00FC;rkiye","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050695785","display_name":"Duygu Sar\u0131kaya","orcid":"https://orcid.org/0000-0002-2083-4999"},"institutions":[{"id":"https://openalex.org/I130828816","display_name":"University of Leeds","ror":"https://ror.org/024mrxd33","country_code":"GB","type":"education","lineage":["https://openalex.org/I130828816"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Duygu Sar\u0131kaya","raw_affiliation_strings":["University of Leeds,School Of Computing,Leeds,United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Leeds,School Of Computing,Leeds,United Kingdom","institution_ids":["https://openalex.org/I130828816"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5017372993"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.10374798,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"4"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.993399977684021,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9276999831199646,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/nephrectomy","display_name":"Nephrectomy","score":0.8025466203689575},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6661651730537415},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5427733659744263},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.42086154222488403},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3374135494232178},{"id":"https://openalex.org/keywords/medicine","display_name":"Medicine","score":0.3174353837966919},{"id":"https://openalex.org/keywords/kidney","display_name":"Kidney","score":0.12634089589118958},{"id":"https://openalex.org/keywords/internal-medicine","display_name":"Internal medicine","score":0.06476143002510071}],"concepts":[{"id":"https://openalex.org/C2780227381","wikidata":"https://www.wikidata.org/wiki/Q1357376","display_name":"Nephrectomy","level":3,"score":0.8025466203689575},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6661651730537415},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5427733659744263},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42086154222488403},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3374135494232178},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.3174353837966919},{"id":"https://openalex.org/C2780091579","wikidata":"https://www.wikidata.org/wiki/Q9377","display_name":"Kidney","level":2,"score":0.12634089589118958},{"id":"https://openalex.org/C126322002","wikidata":"https://www.wikidata.org/wiki/Q11180","display_name":"Internal medicine","level":1,"score":0.06476143002510071}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/siu61531.2024.10601051","is_oa":false,"landing_page_url":"https://doi.org/10.1109/siu61531.2024.10601051","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 32nd Signal Processing and Communications Applications Conference (SIU)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Gender equality","score":0.41999998688697815,"id":"https://metadata.un.org/sdg/5"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Surgical":[0],"reporting":[1],"plays":[2,25],"an":[3,26],"important":[4,27],"role":[5,28],"in":[6,29,79],"providing":[7],"surgical":[8,40,46,52,55,68,97],"feedback":[9],"and":[10,32,39,50,88,121,124],"medical":[11],"training,":[12],"however,":[13],"it":[14,132],"remains":[15],"a":[16,72,134],"complex":[17],"task":[18],"that":[19],"requires":[20],"clinical":[21],"expertise.":[22],"It":[23],"also":[24],"postoperative":[30],"care":[31],"diagnosis":[33],"of":[34],"complications":[35],"after":[36],"surgery.":[37],"Surgeons":[38],"teams":[41],"can":[42],"use":[43],"automatically":[44],"generated":[45],"captions":[47],"for":[48,99],"effective":[49],"efficient":[51],"reporting.":[53],"Automated":[54],"report":[56],"generation":[57],"has":[58],"the":[59,85,91,109,128],"potential":[60],"to":[61,94,127],"decrease":[62],"surgeons\u2019":[63],"workload":[64],"and,":[65],"therefore":[66],"improve":[67],"outcomes.":[69],"We":[70],"utilized":[71],"customized":[73],"Contrastive":[74],"Language-Image":[75],"Pre-Training":[76],"(CLIP)":[77],"model":[78,104],"this":[80],"research,":[81],"employing":[82],"VGG-19":[83],"as":[84,90],"image":[86],"encoder":[87,93],"ClinicalBERT":[89],"text":[92],"produce":[95],"automated":[96],"descriptions":[98],"nephrectomy":[100],"surgery":[101],"images.":[102],"The":[103],"we":[105],"named":[106],"SurgicalClip":[107],"achieved":[108],"following":[110],"average":[111],"scores:":[112],"0.702":[113],"BLEU-1,":[114],"0.51":[115],"BLEU-4,":[116],"3.615":[117],"CIDEr,":[118],"0.382":[119],"METEOR,":[120],"0.657":[122],"ROUGE,":[123],"performed":[125],"comparably":[126],"benchmark":[129],"models":[130],"although":[131],"proposes":[133],"lightweight":[135],"solution.":[136]},"counts_by_year":[],"updated_date":"2025-12-26T23:08:49.675405","created_date":"2025-10-10T00:00:00"}
