{"id":"https://openalex.org/W7161236667","doi":"https://doi.org/10.48550/arxiv.2605.14253","title":"Towards Real-Time Autonomous Navigation: Transformer-Based Catheter Tip Tracking in Fluoroscopy","display_name":"Towards Real-Time Autonomous Navigation: Transformer-Based Catheter Tip Tracking in Fluoroscopy","publication_year":2026,"publication_date":"2026-05-14","ids":{"openalex":"https://openalex.org/W7161236667","doi":"https://doi.org/10.48550/arxiv.2605.14253"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.14253","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14253","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.14253","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134444326","display_name":"Harry Robertshaw","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Robertshaw, Harry","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134744436","display_name":"Yanghe Hao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hao, Yanghe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134397098","display_name":"Weiyuan Deng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Deng, Weiyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136240668","display_name":"Benjamin Jackson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jackson, Benjamin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136233103","display_name":"S. M. Hadi Sadati","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sadati, S. M. Hadi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136253810","display_name":"Nikola Fischer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fischer, Nikola","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136200297","display_name":"Tom Vercauteren","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vercauteren, Tom","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136229956","display_name":"Alejandro Granados","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Granados, Alejandro","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136196195","display_name":"Thomas C. Booth","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Booth, Thomas C.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.8532999753952026,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.8532999753952026,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.029200000688433647,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.008799999952316284,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6025999784469604},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.5824000239372253},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5669000148773193},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.44359999895095825},{"id":"https://openalex.org/keywords/fluoroscopy","display_name":"Fluoroscopy","score":0.43380001187324524},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.3905999958515167},{"id":"https://openalex.org/keywords/tracking-system","display_name":"Tracking system","score":0.3522999882698059},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.35179999470710754}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7218999862670898},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7071999907493591},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.689300000667572},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6025999784469604},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.5824000239372253},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5669000148773193},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.44359999895095825},{"id":"https://openalex.org/C2776805002","wikidata":"https://www.wikidata.org/wiki/Q614984","display_name":"Fluoroscopy","level":2,"score":0.43380001187324524},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3905999958515167},{"id":"https://openalex.org/C154586513","wikidata":"https://www.wikidata.org/wiki/Q4420972","display_name":"Tracking system","level":3,"score":0.3522999882698059},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.35179999470710754},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.337799996137619},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.31769999861717224},{"id":"https://openalex.org/C112353826","wikidata":"https://www.wikidata.org/wiki/Q127313","display_name":"Active contour model","level":4,"score":0.30399999022483826},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.30000001192092896},{"id":"https://openalex.org/C91158637","wikidata":"https://www.wikidata.org/wiki/Q223818","display_name":"Biplane","level":2,"score":0.29269999265670776},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.288100004196167},{"id":"https://openalex.org/C19609008","wikidata":"https://www.wikidata.org/wiki/Q2138203","display_name":"Region of interest","level":2,"score":0.26440000534057617},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.26260000467300415},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.26030001044273376},{"id":"https://openalex.org/C2780645631","wikidata":"https://www.wikidata.org/wiki/Q671554","display_name":"Stroke (engine)","level":2,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.14253","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14253","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.14253","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.14253","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Purpose:":[0],"Mechanical":[1],"thrombectomy":[2],"(MT)":[3],"improves":[4],"stroke":[5],"outcomes,":[6],"but":[7,35],"is":[8],"limited":[9],"by":[10],"a":[11,54,131,193],"lack":[12],"of":[13,19,135,162],"local":[14],"treatment":[15],"access.":[16],"Widespread":[17],"distribution":[18],"reinforcement":[20],"learning":[21,86],"(RL)-based":[22],"robotic":[23],"systems":[24],"can":[25],"be":[26],"used":[27],"to":[28,45,50,164],"alleviate":[29],"this":[30],"challenge":[31],"through":[32],"autonomous":[33,200],"navigation,":[34],"current":[36],"RL":[37],"methods":[38],"require":[39],"live":[40],"device":[41,70],"tip":[42,57],"coordinate":[43],"tracking":[44,58,179],"function.":[46],"This":[47],"paper":[48],"aims":[49],"develop":[51],"and":[52,69,83,92,96,100,111,145,195],"evaluate":[53],"real-time":[55],"catheter":[56],"pipeline":[59,75],"under":[60,184],"fluoroscopy,":[61],"addressing":[62],"challenges":[63],"such":[64],"as":[65],"low":[66],"contrast,":[67],"noise,":[68],"occlusion.":[71],"Methods:":[72],"A":[73],"multi-threaded":[74,178],"was":[76],"designed,":[77],"incorporating":[78],"frame":[79],"reading,":[80],"preprocessing,":[81],"inference,":[82],"post-processing.":[84],"Deep":[85],"segmentation":[87,152],"models,":[88],"including":[89],"U-Net,":[90],"U-Net+Transformer,":[91],"SegFormer,":[93],"were":[94],"trained":[95],"benchmarked":[97],"using":[98],"two-class":[99,128],"three-class":[101,147],"formulations.":[102],"Post-processing":[103],"involved":[104],"two-step":[105],"component":[106],"filtering,":[107],"one-pixel":[108],"medial":[109],"skeletonization,":[110],"greedy":[112],"arc-length":[113],"path":[114],"following":[115],"with":[116,160],"contour":[117],"fall-back.":[118],"Results:":[119],"On":[120,151],"manually-labeled":[121],"moderate":[122],"complexity":[123],"fluoroscopic":[124],"video":[125],"data,":[126],"the":[127,154,176],"SegFormer":[129],"achieved":[130],"mean":[132],"absolute":[133],"error":[134],"4.44":[136],"mm,":[137],"outperforming":[138,188],"U-Net":[139],"(4.60":[140],"mm),":[141],"U-Net+Transformer":[142],"(6.20":[143],"mm)":[144],"all":[146],"models":[148],"(5.19-7.74":[149],"mm).":[150],"benchmarks,":[153,190],"system":[155],"exceeded":[156],"state-of-the-art":[157],"CathAction":[158],"results":[159,173],"improvements":[161],"up":[163],"+5%":[165],"in":[166],"Dice":[167],"scores":[168],"for":[169,198],"three-segmentation.":[170],"Conclusion:":[171],"The":[172],"demonstrate":[174],"that":[175],"proposed":[177],"framework":[180],"maintains":[181],"stable":[182],"performance":[183],"challenging":[185],"imaging":[186],"conditions,":[187],"prior":[189],"while":[191],"providing":[192],"reliable":[194],"efficient":[196],"foundation":[197],"RL-based":[199],"MT":[201],"navigation.":[202]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-16T00:00:00"}
