{"id":"https://openalex.org/W7131415613","doi":"https://doi.org/10.48550/arxiv.2602.20216","title":"Sample-Efficient Learning with Online Expert Correction for Autonomous Catheter Steering in Endovascular Bifurcation Navigation","display_name":"Sample-Efficient Learning with Online Expert Correction for Autonomous Catheter Steering in Endovascular Bifurcation Navigation","publication_year":2026,"publication_date":"2026-02-23","ids":{"openalex":"https://openalex.org/W7131415613","doi":"https://doi.org/10.48550/arxiv.2602.20216"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.20216","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5126778580","display_name":"Hao Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Hao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044674377","display_name":"Tianliang Yao","orcid":"https://orcid.org/0009-0000-7063-3880"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yao, Tianliang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126788642","display_name":"Bo Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Bo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126853543","display_name":"Zhiqiang Pei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pei, Zhiqiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126821564","display_name":"Liu Dong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dong, Liu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126797093","display_name":"Lei Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Lei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126809386","display_name":"Peng Qi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qi, Peng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5126778580"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.9146999716758728,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.9146999716758728,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11486","display_name":"Micro and Nano Robotics","score":0.025100000202655792,"subfield":{"id":"https://openalex.org/subfields/3104","display_name":"Condensed Matter Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.006300000008195639,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.51910001039505},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.5058000087738037},{"id":"https://openalex.org/keywords/imaging-phantom","display_name":"Imaging phantom","score":0.49880000948905945},{"id":"https://openalex.org/keywords/fuzzy-logic","display_name":"Fuzzy logic","score":0.3797000050544739},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.3734999895095825},{"id":"https://openalex.org/keywords/visual-servoing","display_name":"Visual servoing","score":0.31040000915527344},{"id":"https://openalex.org/keywords/robotics","display_name":"Robotics","score":0.29010000824928284}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6438000202178955},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.51910001039505},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5080999732017517},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.5058000087738037},{"id":"https://openalex.org/C104293457","wikidata":"https://www.wikidata.org/wiki/Q28324852","display_name":"Imaging phantom","level":2,"score":0.49880000948905945},{"id":"https://openalex.org/C58166","wikidata":"https://www.wikidata.org/wiki/Q224821","display_name":"Fuzzy logic","level":2,"score":0.3797000050544739},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.3734999895095825},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35100001096725464},{"id":"https://openalex.org/C10912380","wikidata":"https://www.wikidata.org/wiki/Q527952","display_name":"Visual servoing","level":3,"score":0.31040000915527344},{"id":"https://openalex.org/C34413123","wikidata":"https://www.wikidata.org/wiki/Q170978","display_name":"Robotics","level":3,"score":0.29010000824928284},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2896000146865845},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.28360000252723694},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.28139999508857727},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.2782999873161316},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.2694999873638153},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.26660001277923584},{"id":"https://openalex.org/C55282118","wikidata":"https://www.wikidata.org/wiki/Q252683","display_name":"Snapshot (computer storage)","level":2,"score":0.25839999318122864},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.2572000026702881}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.20216","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.20216","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.20216","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.20216","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Robot-assisted":[0],"endovascular":[1,77,207],"intervention":[2],"offers":[3],"a":[4,27,64,140,144,160],"safe":[5],"and":[6,42,52,106,129,195],"effective":[7],"solution":[8],"for":[9,30,72,93,102,206],"remote":[10],"catheter":[11,32,74,197],"manipulation,":[12],"reducing":[13,173],"radiation":[14],"exposure":[15],"while":[16,172],"enabling":[17],"precise":[18],"navigation.":[19,79,208],"Reinforcement":[20],"learning":[21],"(RL)":[22],"has":[23],"recently":[24],"emerged":[25],"as":[26],"promising":[28],"approach":[29,152],"autonomous":[31,73],"steering;":[33],"however,":[34],"conventional":[35],"methods":[36],"suffer":[37],"from":[38],"sparse":[39],"reward":[40,110],"design":[41],"reliance":[43],"on":[44,139],"static":[45],"vascular":[46,135,146],"models,":[47],"limiting":[48],"their":[49],"sample":[50],"efficiency":[51],"generalization":[53],"to":[54,115,164,177],"intraoperative":[55],"variations.":[56],"To":[57],"overcome":[58],"these":[59],"challenges,":[60],"this":[61],"paper":[62],"introduces":[63],"sample-efficient":[65,187],"RL":[66,188],"framework":[67,82,125],"with":[68,189],"online":[69,121,190],"expert":[70,113,122,191],"correction":[71,192],"steering":[75],"in":[76,133,155,200],"bifurcation":[78,203],"The":[80],"proposed":[81,151],"integrates":[83],"three":[84],"key":[85],"components:":[86],"(1)":[87],"A":[88,99,108],"segmentation-based":[89],"pose":[90],"estimation":[91],"module":[92],"accurate":[94,196],"real-time":[95],"state":[96],"feedback,":[97],"(2)":[98],"fuzzy":[100],"controller":[101],"bifurcation-aware":[103],"orientation":[104],"adjustment,":[105],"(3)":[107],"structured":[109],"generator":[111],"incorporating":[112],"priors":[114],"guide":[116],"policy":[117,131],"learning.":[118],"By":[119],"leveraging":[120],"correction,":[123],"the":[124,150,165,180],"reduces":[126],"exploration":[127],"inefficiency":[128],"enhances":[130],"robustness":[132],"complex":[134],"structures.":[136],"Experimental":[137],"validation":[138],"robotic":[141],"platform":[142],"using":[143],"transparent":[145],"phantom":[147],"demonstrates":[148],"that":[149,185],"achieves":[153],"convergence":[154],"123":[156],"training":[157],"episodes":[158],"--":[159,171],"25.9%":[161],"reduction":[162],"compared":[163],"baseline":[166],"Soft":[167],"Actor-Critic":[168],"(SAC)":[169],"algorithm":[170],"average":[174],"positional":[175],"error":[176],"83.8%":[178],"of":[179],"baseline.":[181],"These":[182],"results":[183],"indicate":[184],"combining":[186],"enables":[193],"reliable":[194],"steering,":[198],"particularly":[199],"anatomically":[201],"challenging":[202],"scenarios":[204],"critical":[205]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-26T00:00:00"}
