{"id":"https://openalex.org/W7147069775","doi":"https://doi.org/10.48550/arxiv.2603.26720","title":"SutureAgent: Learning Surgical Trajectories via Goal-conditioned Offline RL in Pixel Space","display_name":"SutureAgent: Learning Surgical Trajectories via Goal-conditioned Offline RL in Pixel Space","publication_year":2026,"publication_date":"2026-03-19","ids":{"openalex":"https://openalex.org/W7147069775","doi":"https://doi.org/10.48550/arxiv.2603.26720"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.26720","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26720","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.26720","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132699745","display_name":"Huanrong Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Liu, Huanrong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132580308","display_name":"Chunlin Tian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tian, Chunlin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132626520","display_name":"Tongyu Jia","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jia, Tongyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132638835","display_name":"Tailai Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Tailai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100432512","display_name":"Qin Liu","orcid":"https://orcid.org/0000-0003-1951-854X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Qin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132567980","display_name":"Yu Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Yu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011762462","display_name":"Yutong Ban","orcid":"https://orcid.org/0000-0001-5396-9251"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ban, Yutong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132654516","display_name":"Yun Gu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gu, Yun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000400312","display_name":"Guy Rosman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rosman, Guy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132679697","display_name":"Xin Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Xin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132670035","display_name":"Qingbiao Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Qingbiao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5132699745"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.859499990940094,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10868","display_name":"Soft Robotics and Applications","score":0.859499990940094,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10916","display_name":"Surgical Simulation and Training","score":0.08940000087022781,"subfield":{"id":"https://openalex.org/subfields/2746","display_name":"Surgery"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.01600000075995922,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.6394000053405762},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5644000172615051},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5223000049591064},{"id":"https://openalex.org/keywords/motion-capture","display_name":"Motion capture","score":0.43709999322891235},{"id":"https://openalex.org/keywords/state-space","display_name":"State space","score":0.3930000066757202},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.38679999113082886},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.3693000078201294},{"id":"https://openalex.org/keywords/trajectory-optimization","display_name":"Trajectory optimization","score":0.3377000093460083},{"id":"https://openalex.org/keywords/displacement","display_name":"Displacement (psychology)","score":0.33320000767707825}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6980000138282776},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6707000136375427},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.6394000053405762},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6376000046730042},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5644000172615051},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5223000049591064},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.43709999322891235},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.3930000066757202},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.38679999113082886},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3792000114917755},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.3693000078201294},{"id":"https://openalex.org/C173246807","wikidata":"https://www.wikidata.org/wiki/Q7833062","display_name":"Trajectory optimization","level":3,"score":0.3377000093460083},{"id":"https://openalex.org/C107551265","wikidata":"https://www.wikidata.org/wiki/Q1458245","display_name":"Displacement (psychology)","level":2,"score":0.33320000767707825},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.33169999718666077},{"id":"https://openalex.org/C50637493","wikidata":"https://www.wikidata.org/wiki/Q1136781","display_name":"Morphing","level":2,"score":0.30149999260902405},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.29600000381469727},{"id":"https://openalex.org/C136389625","wikidata":"https://www.wikidata.org/wiki/Q334384","display_name":"Supervised learning","level":3,"score":0.2824999988079071},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.2775000035762787},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.2727000117301941},{"id":"https://openalex.org/C2776654903","wikidata":"https://www.wikidata.org/wiki/Q2601463","display_name":"SAFER","level":2,"score":0.2685999870300293},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.26269999146461487},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.2606000006198883},{"id":"https://openalex.org/C10912380","wikidata":"https://www.wikidata.org/wiki/Q527952","display_name":"Visual servoing","level":3,"score":0.2590999901294708},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.2587999999523163},{"id":"https://openalex.org/C23379248","wikidata":"https://www.wikidata.org/wiki/Q200904","display_name":"Epipolar geometry","level":3,"score":0.25130000710487366},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.25110000371932983}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.26720","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26720","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.26720","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26720","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.8046742081642151,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Predicting":[0],"surgical":[1],"needle":[2,68,79,101,236],"trajectories":[3,213],"from":[4,28,192,214],"endoscopic":[5],"video":[6],"is":[7,81],"critical":[8],"for":[9],"robot-assisted":[10],"suturing,":[11],"enabling":[12],"anticipatory":[13],"planning,":[14],"real-time":[15],"guidance,":[16],"and":[17,103,168,172,183],"safer":[18],"motion":[19,26,39,102,152],"execution.":[20],"Existing":[21],"methods":[22],"that":[23,86,128,218],"directly":[24],"learn":[25],"distributions":[27],"visual":[29],"observations":[30],"tend":[31],"to":[32,47,132,143,162],"overlook":[33],"the":[34,53,78,98,105,141,228,232],"sequential":[35,73,241],"dependency":[36],"among":[37],"adjacent":[38],"steps.":[40],"Moreover,":[41],"sparse":[42,130],"waypoint":[43],"annotations":[44,131],"often":[45],"fail":[46],"provide":[48],"sufficient":[49],"supervision,":[50],"further":[51],"increasing":[52],"difficulty":[54],"of":[55,100,108,180,234],"supervised":[56],"or":[57],"imitation":[58],"learning":[59,126],"methods.":[60],"To":[61,186],"address":[62],"these":[63],"challenges,":[64],"we":[65,119,195],"formulate":[66],"image-based":[67],"trajectory":[69,237],"prediction":[70,238],"as":[71,83,239],"a":[72,122,205],"decision-making":[74],"problem,":[75],"in":[76,91],"which":[77],"tip":[80],"treated":[82],"an":[84,159],"agent":[85],"moves":[87],"step":[88,90],"by":[89,224],"pixel":[92],"space.":[93],"This":[94],"formulation":[95],"naturally":[96],"captures":[97],"continuity":[99],"enables":[104],"explicit":[106],"modeling":[107,235],"physically":[109],"plausible":[110,150],"pixel-wise":[111],"state":[112],"transitions":[113],"over":[114],"time.":[115],"From":[116],"this":[117],"perspective,":[118],"propose":[120],"SutureAgent,":[121],"goal-conditioned":[123],"offline":[124,189],"reinforcement":[125],"framework":[127],"leverages":[129],"dense":[133],"reward":[134],"signals":[135],"via":[136],"cubic":[137],"spline":[138],"interpolation,":[139],"encouraging":[140],"policy":[142,190],"exploit":[144],"limited":[145],"expert":[146,193],"guidance":[147],"while":[148],"exploring":[149],"future":[151,175],"paths.":[153],"SutureAgent":[154,219],"encodes":[155],"variable-length":[156],"clips":[157],"using":[158],"observation":[160],"encoder":[161],"capture":[163],"both":[164],"local":[165],"spatial":[166],"cues":[167],"long-range":[169],"temporal":[170],"dynamics,":[171],"autoregressively":[173],"predicts":[174],"waypoints":[176],"through":[177],"actions":[178],"composed":[179],"discrete":[181],"directions":[182],"continuous":[184],"magnitudes.":[185],"enable":[187],"stable":[188],"optimization":[191],"demonstrations,":[194],"adopt":[196],"Conservative":[197],"Q-Learning":[198],"with":[199,227],"Behavioral":[200],"Cloning":[201],"regularization.":[202],"Experiments":[203],"on":[204],"new":[206],"kidney":[207],"wound":[208],"suturing":[209],"dataset":[210],"containing":[211],"1,158":[212],"50":[215],"patients":[216],"show":[217],"reduces":[220],"Average":[221],"Displacement":[222],"Error":[223],"58.6%":[225],"compared":[226],"strongest":[229],"baseline,":[230],"demonstrating":[231],"effectiveness":[233],"pixel-level":[240],"action":[242],"learning.":[243]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-04-02T00:00:00"}
