{"id":"https://openalex.org/W4415537456","doi":"https://doi.org/10.1145/3746027.3754876","title":"EchoVim: Making Vision Mamba Docile for Echocardiography Video Segmentation via Dynamic Interaction and Semantic Token-attentive Refinement","display_name":"EchoVim: Making Vision Mamba Docile for Echocardiography Video Segmentation via Dynamic Interaction and Semantic Token-attentive Refinement","publication_year":2025,"publication_date":"2025-10-25","ids":{"openalex":"https://openalex.org/W4415537456","doi":"https://doi.org/10.1145/3746027.3754876"},"language":null,"primary_location":{"id":"doi:10.1145/3746027.3754876","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3754876","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114949640","display_name":"Jingxing Guo","orcid":"https://orcid.org/0009-0005-2218-591X"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jingxing Guo","raw_affiliation_strings":["Shenzhen University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen University, Shenzhen, China","institution_ids":["https://openalex.org/I180726961"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103638629","display_name":"George TY Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guilian Chen","raw_affiliation_strings":["Shenzhen University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen University, Shenzhen, China","institution_ids":["https://openalex.org/I180726961"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yimu Sun","orcid":"https://orcid.org/0009-0002-7011-1729"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yimu Sun","raw_affiliation_strings":["Shenzhen University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen University, Shenzhen, China","institution_ids":["https://openalex.org/I180726961"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026540573","display_name":"Huisi Wu","orcid":"https://orcid.org/0000-0002-0399-9089"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huisi Wu","raw_affiliation_strings":["Shenzhen University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen University, Shenzhen, China","institution_ids":["https://openalex.org/I180726961"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100662807","display_name":"Jing Qin","orcid":"https://orcid.org/0000-0002-7059-0929"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jing Qin","raw_affiliation_strings":["Hong Kong Polytechnic University, Hong Kong, China"],"affiliations":[{"raw_affiliation_string":"Hong Kong Polytechnic University, Hong Kong, China","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5114949640"],"corresponding_institution_ids":["https://openalex.org/I180726961"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.2964524,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"3261","last_page":"3269"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.992900013923645,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7347000241279602},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.566100001335144},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5163000226020813},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5078999996185303},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4984999895095825},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.4973999857902527},{"id":"https://openalex.org/keywords/speckle-noise","display_name":"Speckle noise","score":0.47510001063346863},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.46309998631477356},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.4453999996185303}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7810999751091003},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7347000241279602},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6789000034332275},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.574999988079071},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.566100001335144},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5163000226020813},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5078999996185303},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4984999895095825},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.4973999857902527},{"id":"https://openalex.org/C180940675","wikidata":"https://www.wikidata.org/wiki/Q7575045","display_name":"Speckle noise","level":3,"score":0.47510001063346863},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.46309998631477356},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.4453999996185303},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.41350001096725464},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3873000144958496},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.36550000309944153},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3359000086784363},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.33399999141693115},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3165000081062317},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.30809998512268066},{"id":"https://openalex.org/C16345878","wikidata":"https://www.wikidata.org/wiki/Q107472979","display_name":"Orientation (vector space)","level":2,"score":0.2969000041484833},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.27810001373291016},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.27230000495910645},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.27090001106262207},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.26489999890327454},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.2621999979019165},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.26019999384880066}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746027.3754876","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746027.3754876","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4206905956","display_name":null,"funder_award_id":"2024A1515011946","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G6694410858","display_name":null,"funder_award_id":"62273241","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321921","display_name":"Natural Science Foundation of Guangdong Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W2048309569","https://openalex.org/W3013692475","https://openalex.org/W3093273221","https://openalex.org/W3209901427","https://openalex.org/W4214612132","https://openalex.org/W4214701508","https://openalex.org/W4229447846","https://openalex.org/W4308769137","https://openalex.org/W4312396403","https://openalex.org/W4312560592","https://openalex.org/W4389430914","https://openalex.org/W4390874575"],"related_works":[],"abstract_inverted_index":{"Automatic":[0],"echocardiography":[1,182],"video":[2,183],"segmentation":[3,60],"is":[4],"a":[5,19,57,83,115,147],"powerful":[6],"tool":[7],"for":[8],"improving":[9],"the":[10,47,189],"accuracy":[11],"of":[12,35,50],"cardiovascular":[13],"function":[14],"assessment.":[15],"However,":[16],"it":[17,74],"remains":[18],"challenging":[20],"task":[21],"owing":[22],"to":[23,46,67,101,109,158,167],"(1)":[24],"extensive":[25,177],"speckle":[26,169],"noise":[27,170],"and":[28,40,97,186,188],"blurred":[29],"boundaries,":[30],"(2)":[31],"dramatic":[32],"shape":[33],"variations":[34,142],"targeting":[36],"structures":[37],"across":[38,126],"frames,":[39],"(3)":[41],"limited":[42],"labeled":[43],"data":[44],"due":[45],"high":[48],"cost":[49],"annotation.":[51],"In":[52],"this":[53],"paper,":[54],"we":[55,72],"present":[56],"novel":[58],"semi-supervised":[59],"model":[61],"based":[62],"on":[63,179],"Vision":[64],"Mamba":[65],"(Vim)":[66],"comprehensively":[68],"tackle":[69],"these":[70],"challenges;":[71],"call":[73],"EchoVim.":[75],"Our":[76],"framework":[77],"introduces":[78],"three":[79],"technical":[80],"innovations:":[81],"First,":[82],"bidirectional":[84],"inference":[85],"mechanism":[86],"(BIM)":[87],"which":[88],"can":[89],"propagate":[90],"label":[91],"information":[92],"bidirectionally":[93],"from":[94,171],"end-diastolic":[95],"(ED)":[96],"end-systolic":[98],"(ES)":[99],"frames":[100,127],"generate":[102],"pseudo-labels,":[103],"coupled":[104],"with":[105,199],"confidence-aware":[106],"dynamic":[107,116],"updating":[108],"progressively":[110],"refine":[111],"supervision":[112],"signals.":[113],"Second,":[114],"interaction":[117],"temporal":[118],"alignment":[119],"(DITA)":[120],"module":[121,152],"that":[122,153,192],"establishes":[123],"anatomical":[124,173],"correspondence":[125],"by":[128],"adaptively":[129],"enhancing":[130],"features":[131],"near":[132],"temporally":[133],"stable":[134],"regions":[135],"while":[136],"suppressing":[137],"motion-irrelevant":[138],"artifacts,":[139],"effectively":[140],"addressing":[141],"in":[143],"cardiac":[144,160],"shape.":[145],"Third,":[146],"semantic":[148,156],"token-attentive":[149],"refinement":[150],"(STR)":[151],"constructs":[154],"low-rank":[155],"tokens":[157],"encode":[159],"structure":[161],"priors,":[162],"utilizing":[163],"attention-guided":[164],"nonlinear":[165],"transformations":[166],"disentangle":[168],"true":[172],"patterns.":[174],"We":[175],"conduct":[176],"experiments":[178],"two":[180],"benchmarking":[181],"datasets:":[184],"CAMUS":[185],"EchoNet-Dynamic,":[187],"results":[190],"demonstrate":[191],"our":[193],"method":[194],"outperforms":[195],"existing":[196],"state-of-the-art":[197],"approaches":[198],"real-time":[200],"inference.":[201],"Codes":[202],"are":[203],"available":[204],"at":[205],"https://github.com/guojx2255/EchoVim.":[206]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-25T00:00:00"}
