{"id":"https://openalex.org/W4398249851","doi":"https://doi.org/10.1109/access.2024.3404463","title":"ASDeM: Augmenting SAM With Decoupled Memory for Video Object Segmentation","display_name":"ASDeM: Augmenting SAM With Decoupled Memory for Video Object Segmentation","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4398249851","doi":"https://doi.org/10.1109/access.2024.3404463"},"language":"en","primary_location":{"id":"doi:10.1109/access.2024.3404463","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/access.2024.3404463","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10537204.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10537204.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100697068","display_name":"Xiaohu Liu","orcid":"https://orcid.org/0000-0002-8973-438X"},"institutions":[{"id":"https://openalex.org/I187175081","display_name":"Shaanxi University of Technology","ror":"https://ror.org/056m91h77","country_code":"CN","type":"education","lineage":["https://openalex.org/I187175081"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xiaohu Liu","raw_affiliation_strings":["Trine Engineering Institute, Shaanxi University of Technology, Hanzhong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Trine Engineering Institute, Shaanxi University of Technology, Hanzhong, China","institution_ids":["https://openalex.org/I187175081"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101611817","display_name":"Yichuang Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I4210139547","display_name":"Xi'an Peihua University","ror":"https://ror.org/032fx1s95","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210139547"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yichuang Luo","raw_affiliation_strings":["Department of Intelligent Science and Engineering, Xi&#x2019;an Peihua University, Xi&#x2019;an, China"],"raw_orcid":"https://orcid.org/0000-0002-2064-8037","affiliations":[{"raw_affiliation_string":"Department of Intelligent Science and Engineering, Xi&#x2019;an Peihua University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I4210139547"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100452387","display_name":"Wei Sun","orcid":"https://orcid.org/0000-0002-6350-8966"},"institutions":[{"id":"https://openalex.org/I187175081","display_name":"Shaanxi University of Technology","ror":"https://ror.org/056m91h77","country_code":"CN","type":"education","lineage":["https://openalex.org/I187175081"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Sun","raw_affiliation_strings":["School of Mechanical Engineering, Shaanxi University of Technology, Hanzhong, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, Shaanxi University of Technology, Hanzhong, China","institution_ids":["https://openalex.org/I187175081"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100697068"],"corresponding_institution_ids":["https://openalex.org/I187175081"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.06020614,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"12","issue":null,"first_page":"73218","last_page":"73227"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8844534158706665},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.8338768482208252},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.7372782230377197},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6603219509124756},{"id":"https://openalex.org/keywords/interactivity","display_name":"Interactivity","score":0.6451855897903442},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6162639856338501},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.6087501049041748},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.5915409922599792},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4853421747684479},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.44824346899986267},{"id":"https://openalex.org/keywords/segmentation-based-object-categorization","display_name":"Segmentation-based object categorization","score":0.44228479266166687},{"id":"https://openalex.org/keywords/scale-space-segmentation","display_name":"Scale-space segmentation","score":0.4085221588611603},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3510970175266266},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.16119599342346191}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8844534158706665},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.8338768482208252},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.7372782230377197},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6603219509124756},{"id":"https://openalex.org/C144430266","wikidata":"https://www.wikidata.org/wiki/Q839721","display_name":"Interactivity","level":2,"score":0.6451855897903442},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6162639856338501},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.6087501049041748},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.5915409922599792},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4853421747684479},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.44824346899986267},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.44228479266166687},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.4085221588611603},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3510970175266266},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.16119599342346191},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2024.3404463","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/access.2024.3404463","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10537204.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:4897b3c9d7b4406391a8eb2b53be858b","is_oa":true,"landing_page_url":"https://doaj.org/article/4897b3c9d7b4406391a8eb2b53be858b","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 12, Pp 73218-73227 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2024.3404463","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1109/access.2024.3404463","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10537204.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4398249851.pdf"},"referenced_works_count":43,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W2470139095","https://openalex.org/W2799157347","https://openalex.org/W2890447039","https://openalex.org/W2916743882","https://openalex.org/W2990205821","https://openalex.org/W3034499084","https://openalex.org/W3094664776","https://openalex.org/W3108819577","https://openalex.org/W3160550216","https://openalex.org/W3171516518","https://openalex.org/W3176027594","https://openalex.org/W3183673520","https://openalex.org/W3187838476","https://openalex.org/W3202466785","https://openalex.org/W4225544038","https://openalex.org/W4312326540","https://openalex.org/W4312396403","https://openalex.org/W4312815172","https://openalex.org/W4365606129","https://openalex.org/W4367000115","https://openalex.org/W4376312146","https://openalex.org/W4379474533","https://openalex.org/W4383180710","https://openalex.org/W4385327889","https://openalex.org/W4386072247","https://openalex.org/W4390874575","https://openalex.org/W4390874670","https://openalex.org/W6631190155","https://openalex.org/W6754033419","https://openalex.org/W6759534164","https://openalex.org/W6796494355","https://openalex.org/W6796505553","https://openalex.org/W6796524941","https://openalex.org/W6797162190","https://openalex.org/W6809716307","https://openalex.org/W6843861238","https://openalex.org/W6846581650","https://openalex.org/W6851607685","https://openalex.org/W6852276098","https://openalex.org/W6852629184","https://openalex.org/W6853702739","https://openalex.org/W6854990339"],"related_works":["https://openalex.org/W3144569342","https://openalex.org/W2945274617","https://openalex.org/W2185902295","https://openalex.org/W2103507220","https://openalex.org/W2055202857","https://openalex.org/W4205800335","https://openalex.org/W2371519352","https://openalex.org/W2386644571","https://openalex.org/W2372421320","https://openalex.org/W2901890255"],"abstract_inverted_index":{"Video":[0],"object":[1,124],"segmentation":[2,46,65,132],"models":[3,22],"have":[4],"gained":[5],"impressive":[6],"performance,":[7],"but":[8],"present":[9],"low":[10],"interactivity":[11],"with":[12,24,57,100],"different":[13],"prompts,":[14],"such":[15],"as":[16],"click,":[17],"box":[18],"or":[19],"text.":[20],"Some":[21],"combined":[23],"SAM":[25,56,74,85],"in":[26,66,125],"a":[27,36,126],"naive":[28],"manner":[29],"to":[30,40,69,86,105],"enhance":[31],"this":[32,49],"ability,":[33],"which":[34,54],"achieve":[35],"limited":[37],"performance":[38],"owing":[39],"the":[41,71,81,88,96,107,112,119,122,139],"coarse":[42],"mask":[43],"and":[44,64,75,94,111,133],"inconsistent":[45],"propagation.":[47],"In":[48],"paper,":[50],"we":[51],"propose":[52],"ASDeM,":[53],"augments":[55],"decoupled":[58,101],"memory,":[59],"achieving":[60],"high-performance":[61],"on":[62,143],"tracking":[63,134],"videos.":[67],"Specifically,":[68],"explore":[70],"combination":[72],"of":[73,115,141],"VOS":[76,92],"model,":[77,93],"ASDeM":[78,142],"fully":[79],"utilizes":[80],"class-agnostic":[82],"features":[83,90],"from":[84],"build":[87],"memory":[89,102],"for":[91,121],"further":[95],"object-agnostic":[97],"temporal":[98],"propagation":[99],"is":[103],"applied":[104],"address":[106],"feature":[108],"staleness":[109],"problem":[110,114],"oblivion":[113],"visual":[116],"information.":[117],"Given":[118],"prompt":[120],"specific":[123],"video,":[127],"people":[128],"can":[129],"get":[130],"satisfactory":[131],"results.":[135],"The":[136],"experiments":[137],"demonstrate":[138],"effectiveness":[140],"public":[144],"benchmarks.":[145]},"counts_by_year":[],"updated_date":"2026-05-06T08:25:59.206177","created_date":"2025-10-10T00:00:00"}
