{"id":"https://openalex.org/W4417295122","doi":"https://doi.org/10.1109/iccv51701.2025.01133","title":"GDKVM: Echocardiography Video Segmentation via Spatiotemporal Key-Value Memory with Gated Delta Rule","display_name":"GDKVM: Echocardiography Video Segmentation via Spatiotemporal Key-Value Memory with Gated Delta Rule","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4417295122","doi":"https://doi.org/10.1109/iccv51701.2025.01133"},"language":null,"primary_location":{"id":"doi:10.1109/iccv51701.2025.01133","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.01133","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2512.10252","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101720157","display_name":"Rui Wang","orcid":"https://orcid.org/0000-0002-4813-8514"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Rui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Sun, Yimu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Yimu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114949640","display_name":"Jingxing Guo","orcid":"https://orcid.org/0009-0005-2218-591X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Jingxing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026540573","display_name":"Huisi Wu","orcid":"https://orcid.org/0000-0002-0399-9089"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Huisi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100662807","display_name":"Jing Qin","orcid":"https://orcid.org/0000-0002-7059-0929"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qin, Jing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101720157"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.38494743,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"12191","last_page":"12200"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.6208000183105469,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10052","display_name":"Medical Image Segmentation Techniques","score":0.6208000183105469,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.17499999701976776,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14510","display_name":"Medical Imaging and Analysis","score":0.034299999475479126,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7329999804496765},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6412000060081482},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.5665000081062317},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5376999974250793},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.42989999055862427},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.38670000433921814},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.3840999901294708},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.34880000352859497}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7645000219345093},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7440999746322632},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7329999804496765},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6412000060081482},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.5665000081062317},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5376999974250793},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5242000222206116},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.42989999055862427},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.38670000433921814},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.3840999901294708},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.34880000352859497},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.34850001335144043},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.31139999628067017},{"id":"https://openalex.org/C2987395694","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Feature tracking","level":3,"score":0.30480000376701355},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.29089999198913574},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.2874999940395355},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.27889999747276306},{"id":"https://openalex.org/C31601959","wikidata":"https://www.wikidata.org/wiki/Q931309","display_name":"Medical imaging","level":2,"score":0.2648000121116638},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.2517000138759613}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iccv51701.2025.01133","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.01133","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2512.10252","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.10252","pdf_url":"https://arxiv.org/pdf/2512.10252","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2512.10252","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.10252","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2512.10252","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2512.10252","pdf_url":"https://arxiv.org/pdf/2512.10252","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4206905956","display_name":null,"funder_award_id":"2024A1515011946","funder_id":"https://openalex.org/F4320321921","funder_display_name":"Natural Science Foundation of Guangdong Province"},{"id":"https://openalex.org/G6694410858","display_name":null,"funder_award_id":"62273241","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321921","display_name":"Natural Science Foundation of Guangdong Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Accurate":[0],"segmentation":[1,38,55,167],"of":[2,14,32,166],"cardiac":[3,15],"chambers":[4],"in":[5,18,164],"echocardiography":[6,86,143],"sequences":[7],"is":[8,118,176],"crucial":[9],"for":[10,85],"the":[11,28,33,61],"quantitative":[12],"analysis":[13],"function,":[16],"aiding":[17],"clinical":[19],"diagnosis":[20],"and":[21,27,30,49,68,101,123,134,147,149,169],"treatment.":[22],"The":[23,89],"imaging":[24],"noise,":[25],"artifacts,":[26],"deformation":[29],"motion":[31],"heart":[34],"pose":[35],"challenges":[36],"to":[37,96,107,120],"algorithms.":[39],"While":[40],"existing":[41,162],"methods":[42],"based":[43],"on":[44,140],"convolutional":[45],"neural":[46],"networks,":[47],"Transformers,":[48],"space-time":[50],"memory":[51,111],"networks":[52],"have":[53],"improved":[54],"accuracy,":[56],"they":[57],"often":[58],"struggle":[59],"with":[60,72,152],"trade-off":[62],"between":[63],"capturing":[64],"long-range":[65],"spatiotemporal":[66],"dependencies":[67],"maintaining":[69],"computational":[70],"efficiency":[71],"fine-grained":[73],"feature":[74],"representation.":[75],"In":[76],"this":[77],"paper,":[78],"we":[79],"introduce":[80],"GDKVM,":[81],"a":[82],"novel":[83],"architecture":[84],"video":[87,144],"segmentation.":[88],"model":[90,98],"employs":[91],"Linear":[92],"Key-Value":[93],"Association":[94],"(LKVA)":[95],"effectively":[97],"inter-frame":[99],"correlations,":[100],"introduces":[102],"Gated":[103],"Delta":[104],"Rule":[105],"(GDR)":[106],"efficiently":[108],"store":[109],"intermediate":[110],"states.":[112],"Key-Pixel":[113],"Feature":[114],"Fusion":[115],"(KPFF)":[116],"module":[117],"designed":[119],"integrate":[121],"local":[122],"global":[124],"features":[125],"at":[126,178],"multiple":[127],"scales,":[128],"enhancing":[129],"robustness":[130],"against":[131],"boundary":[132],"blurring":[133],"noise":[135],"interference.":[136],"We":[137],"validated":[138],"GDKVM":[139,160],"two":[141],"mainstream":[142],"datasets":[145],"(CAMUS":[146],"EchoNet-Dynamic)":[148],"compared":[150],"it":[151],"various":[153],"state-of-the-art":[154],"methods.":[155],"Experimental":[156],"results":[157],"show":[158],"that":[159],"outperforms":[161],"approaches":[163],"terms":[165],"accuracy":[168],"robustness,":[170],"while":[171],"ensuring":[172],"real-time":[173],"performance.":[174],"Code":[175],"available":[177],"https://github.com/wangrui2025/GDKVM.":[179]},"counts_by_year":[],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-12-13T00:00:00"}
