{"id":"https://openalex.org/W4415202774","doi":"https://doi.org/10.1088/2632-2153/ae13d1","title":"Depthwise-dilated convolutional adapters for medical object tracking and segmentation using the segment anything model 2","display_name":"Depthwise-dilated convolutional adapters for medical object tracking and segmentation using the segment anything model 2","publication_year":2025,"publication_date":"2025-10-15","ids":{"openalex":"https://openalex.org/W4415202774","doi":"https://doi.org/10.1088/2632-2153/ae13d1","pmid":"https://pubmed.ncbi.nlm.nih.gov/41551748"},"language":"en","primary_location":{"id":"doi:10.1088/2632-2153/ae13d1","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/ae13d1","pdf_url":null,"source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj","pubmed"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1088/2632-2153/ae13d1","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033484584","display_name":"Guoping Xu","orcid":"https://orcid.org/0000-0003-1431-7191"},"institutions":[{"id":"https://openalex.org/I867280407","display_name":"The University of Texas Southwestern Medical Center","ror":"https://ror.org/05byvp690","country_code":"US","type":"education","lineage":["https://openalex.org/I867280407"]},{"id":"https://openalex.org/I288746156","display_name":"Parker University","ror":"https://ror.org/01s8vy398","country_code":"US","type":"education","lineage":["https://openalex.org/I288746156"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Guoping Xu","raw_affiliation_strings":["The Medical Artificial Intelligence and Automation (MAIA) Laboratory, Department of Radiation Oncology, University of Texas Southwestern Medical Center, Dallas, TX 75390, USA","WIT, 5720 Forest Park Road, Dallas, Dallas, Texas, 75235, UNITED STATES"],"affiliations":[{"raw_affiliation_string":"The Medical Artificial Intelligence and Automation (MAIA) Laboratory, Department of Radiation Oncology, University of Texas Southwestern Medical Center, Dallas, TX 75390, USA","institution_ids":["https://openalex.org/I867280407"]},{"raw_affiliation_string":"WIT, 5720 Forest Park Road, Dallas, Dallas, Texas, 75235, UNITED STATES","institution_ids":["https://openalex.org/I288746156"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048827243","display_name":"Christopher Kabat","orcid":null},"institutions":[{"id":"https://openalex.org/I867280407","display_name":"The University of Texas Southwestern Medical Center","ror":"https://ror.org/05byvp690","country_code":"US","type":"education","lineage":["https://openalex.org/I867280407"]},{"id":"https://openalex.org/I4210096815","display_name":"Southwestern Medical Center","ror":"https://ror.org/00t9vx427","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210096815"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Christopher Kabat","raw_affiliation_strings":["The Medical Artificial Intelligence and Automation (MAIA) Laboratory, Department of Radiation Oncology, University of Texas Southwestern Medical Center, Dallas, TX 75390, USA","UT Southwestern Medical Center, 2280 Inwood Rd, Dallas, TX 75235, Dallas, Dallas, Texas, 75235, UNITED STATES"],"affiliations":[{"raw_affiliation_string":"The Medical Artificial Intelligence and Automation (MAIA) Laboratory, Department of Radiation Oncology, University of Texas Southwestern Medical Center, Dallas, TX 75390, USA","institution_ids":["https://openalex.org/I867280407"]},{"raw_affiliation_string":"UT Southwestern Medical Center, 2280 Inwood Rd, Dallas, TX 75235, Dallas, Dallas, Texas, 75235, UNITED STATES","institution_ids":["https://openalex.org/I4210096815","https://openalex.org/I867280407"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100384572","display_name":"You Zhang","orcid":"https://orcid.org/0000-0002-8033-2755"},"institutions":[{"id":"https://openalex.org/I4210096815","display_name":"Southwestern Medical Center","ror":"https://ror.org/00t9vx427","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I4210096815"]},{"id":"https://openalex.org/I867280407","display_name":"The University of Texas Southwestern Medical Center","ror":"https://ror.org/05byvp690","country_code":"US","type":"education","lineage":["https://openalex.org/I867280407"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"You Zhang","raw_affiliation_strings":["The Medical Artificial Intelligence and Automation (MAIA) Laboratory, Department of Radiation Oncology, University of Texas Southwestern Medical Center, Dallas, TX 75390, USA","Department of Radiation Oncology, UT Southwestern Medical Center, 2280 Inwood Road, Dallas, Texas, 75390, UNITED STATES"],"affiliations":[{"raw_affiliation_string":"The Medical Artificial Intelligence and Automation (MAIA) Laboratory, Department of Radiation Oncology, University of Texas Southwestern Medical Center, Dallas, TX 75390, USA","institution_ids":["https://openalex.org/I867280407"]},{"raw_affiliation_string":"Department of Radiation Oncology, UT Southwestern Medical Center, 2280 Inwood Road, Dallas, Texas, 75390, UNITED STATES","institution_ids":["https://openalex.org/I867280407","https://openalex.org/I4210096815"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5033484584","https://openalex.org/A5048827243","https://openalex.org/A5100384572"],"corresponding_institution_ids":["https://openalex.org/I288746156","https://openalex.org/I4210096815","https://openalex.org/I867280407"],"apc_list":{"value":1600,"currency":"GBP","value_usd":1962},"apc_paid":{"value":1600,"currency":"GBP","value_usd":1962},"fwci":1.7261,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.87177021,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"6","issue":"4","first_page":"045026","last_page":"045026"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.7305999994277954,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.7305999994277954,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T14510","display_name":"Medical Imaging and Analysis","score":0.6236000061035156,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6527000069618225},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5777000188827515},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.48080000281333923},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.46369999647140503},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4449000060558319},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4253999888896942},{"id":"https://openalex.org/keywords/medical-imaging","display_name":"Medical imaging","score":0.42329999804496765},{"id":"https://openalex.org/keywords/adaptability","display_name":"Adaptability","score":0.38940000534057617},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.3806999921798706}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8547000288963318},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6527000069618225},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6398000121116638},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5777000188827515},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.48080000281333923},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.46369999647140503},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.45579999685287476},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4449000060558319},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4307999908924103},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4253999888896942},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.42329999804496765},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.38940000534057617},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.3806999921798706},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3716999888420105},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.36660000681877136},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.34689998626708984},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.3449000120162964},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.33820000290870667},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.33070001006126404},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.3167000114917755},{"id":"https://openalex.org/C2778712577","wikidata":"https://www.wikidata.org/wiki/Q3505966","display_name":"Retraining","level":2,"score":0.31279999017715454},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.310699999332428},{"id":"https://openalex.org/C22029948","wikidata":"https://www.wikidata.org/wiki/Q45089","display_name":"Dice","level":2,"score":0.3066999912261963},{"id":"https://openalex.org/C102392041","wikidata":"https://www.wikidata.org/wiki/Q592860","display_name":"Sliding window protocol","level":3,"score":0.29989999532699585},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.2903999984264374},{"id":"https://openalex.org/C127705205","wikidata":"https://www.wikidata.org/wiki/Q5748245","display_name":"Heuristics","level":2,"score":0.28200000524520874},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.27390000224113464},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2632000148296356},{"id":"https://openalex.org/C2781018962","wikidata":"https://www.wikidata.org/wiki/Q5164884","display_name":"Container (type theory)","level":2,"score":0.25859999656677246}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1088/2632-2153/ae13d1","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/ae13d1","pdf_url":null,"source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},{"id":"pmid:41551748","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41551748","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine learning: science and technology","raw_type":null},{"id":"pmh:oai:doaj.org/article:714630f8ccf740f4b0b7229eac43da60","is_oa":true,"landing_page_url":"https://doaj.org/article/714630f8ccf740f4b0b7229eac43da60","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Machine Learning: Science and Technology, Vol 6, Iss 4, p 045026 (2025)","raw_type":"article"},{"id":"pmh:oai:pubmedcentral.nih.gov:12806169","is_oa":true,"landing_page_url":"https://pmc.ncbi.nlm.nih.gov/articles/PMC12806169/","pdf_url":null,"source":{"id":"https://openalex.org/S2764455111","display_name":"PubMed Central","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Mach Learn Sci Technol","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.1088/2632-2153/ae13d1","is_oa":true,"landing_page_url":"https://doi.org/10.1088/2632-2153/ae13d1","pdf_url":null,"source":{"id":"https://openalex.org/S4210200687","display_name":"Machine Learning Science and Technology","issn_l":"2632-2153","issn":["2632-2153"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320083","host_organization_name":"IOP Publishing","host_organization_lineage":["https://openalex.org/P4310320083","https://openalex.org/P4310311669"],"host_organization_lineage_names":["IOP Publishing","Institute of Physics"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Machine Learning: Science and Technology","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1970928383","https://openalex.org/W2891631795","https://openalex.org/W2915232829","https://openalex.org/W2919115771","https://openalex.org/W2996290406","https://openalex.org/W3013692475","https://openalex.org/W3033114334","https://openalex.org/W3198377975","https://openalex.org/W4226497331","https://openalex.org/W4310330006","https://openalex.org/W4322766882","https://openalex.org/W4387953602","https://openalex.org/W4389430914","https://openalex.org/W4391109864","https://openalex.org/W4400881081","https://openalex.org/W4401819803","https://openalex.org/W4401852105","https://openalex.org/W4406610911","https://openalex.org/W4407316270","https://openalex.org/W4408634392","https://openalex.org/W4408997492","https://openalex.org/W4412417281"],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2],"medical":[3,27,62,121,143,193],"image":[4],"segmentation":[5,195],"have":[6],"been":[7],"driven":[8],"by":[9,18],"deep":[10],"learning;":[11],"however,":[12],"most":[13],"existing":[14,128],"methods":[15,130],"remain":[16],"limited":[17,124],"modality-specific":[19],"designs":[20],"and":[21,36,79,147,155,169,196,200],"exhibit":[22],"poor":[23],"adaptability":[24],"to":[25,61,75,104],"dynamic":[26],"imaging":[28],"scenarios.":[29],"The":[30],"Segment":[31],"Anything":[32],"Model":[33],"2":[34],"(SAM2)":[35],"its":[37],"related":[38],"variants,":[39],"which":[40],"introduce":[41],"a":[42,100],"streaming":[43,140],"memory":[44,141],"mechanism":[45],"for":[46,53,69,96,142,190],"real-time":[47],"video":[48,63,144,194],"segmentation,":[49],"present":[50],"new":[51],"opportunities":[52],"prompt-based,":[54],"generalizable":[55],"solutions.":[56],"Nevertheless,":[57],"adapting":[58],"these":[59,87],"models":[60,201],"scenarios":[64],"typically":[65],"requires":[66],"large-scale":[67],"datasets":[68,160],"retraining":[70],"or":[71],"transfer":[72],"learning,":[73],"leading":[74],"high":[76],"computational":[77],"costs":[78],"the":[80,173],"risk":[81],"of":[82,118,167,175],"catastrophic":[83],"forgetting.":[84],"To":[85,172],"address":[86],"challenges,":[88],"we":[89],"propose":[90],"DD-SAM2,":[91],"an":[92,181],"efficient":[93],"adaptation":[94],"framework":[95],"SAM2":[97,119,191],"that":[98],"incorporates":[99],"Depthwise-Dilated":[101],"Adapter":[102],"(DD-Adapter)":[103],"enhance":[105],"multi-scale":[106],"feature":[107],"extraction":[108],"with":[109,123],"minimal":[110],"parameter":[111],"overhead.":[112],"This":[113],"design":[114],"enables":[115],"effective":[116],"fine-tuning":[117,188],"on":[120,133,151],"videos":[122],"training":[125],"data.":[126],"Unlike":[127],"adapter-based":[129,187],"focused":[131],"solely":[132],"static":[134],"images,":[135],"DD-SAM2":[136],"fully":[137],"exploits":[138],"SAM2's":[139],"objects":[145],"tracking":[146],"segmentation.":[148],"Comprehensive":[149],"evaluations":[150],"TrackRad2025":[152],"(tumor":[153],"segmentation)":[154],"EchoNet-Dynamic":[156],"(left":[157],"ventricle":[158],"tracking)":[159],"demonstrate":[161],"superior":[162],"performance,":[163],"achieving":[164],"Dice":[165],"scores":[166],"0.93\u00b10.04":[168],"0.97\u00b10.01,":[170],"respectively.":[171],"best":[174],"our":[176],"knowledge,":[177],"this":[178],"work":[179],"provides":[180],"initial":[182],"attempt":[183],"at":[184,207],"systematically":[185],"exploring":[186],"strategies":[189],"applied":[192],"tracking.":[197],"Code,":[198],"datasets,":[199],"will":[202],"be":[203],"made":[204],"publicly":[205],"available":[206],"https://github.com/apple1986/DD-SAM2.":[208]},"counts_by_year":[{"year":2026,"cited_by_count":2}],"updated_date":"2026-03-25T14:56:36.534964","created_date":"2025-10-16T00:00:00"}
