{"id":"https://openalex.org/W4312297823","doi":"https://doi.org/10.1109/tmm.2022.3225720","title":"Dual Cross-Attention for Video Object Segmentation via Uncertainty Refinement","display_name":"Dual Cross-Attention for Video Object Segmentation via Uncertainty Refinement","publication_year":2022,"publication_date":"2022-12-01","ids":{"openalex":"https://openalex.org/W4312297823","doi":"https://doi.org/10.1109/tmm.2022.3225720"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2022.3225720","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2022.3225720","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020420401","display_name":"Jiahao Hong","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiahao Hong","raw_affiliation_strings":["Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100441587","display_name":"Wei Zhang","orcid":"https://orcid.org/0000-0002-2358-8543"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Zhang","raw_affiliation_strings":["Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-2358-8543","affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109593667","display_name":"Zhiwei Feng","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiwei Feng","raw_affiliation_strings":["Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100669255","display_name":"Wenqiang Zhang","orcid":"https://orcid.org/0000-0002-3339-8751"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenqiang Zhang","raw_affiliation_strings":["Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-3339-8751","affiliations":[{"raw_affiliation_string":"Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5020420401"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":0.5102,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.65077277,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":97},"biblio":{"volume":"25","issue":null,"first_page":"7710","last_page":"7725"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8817810416221619},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7415038347244263},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7241684794425964},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6275304555892944},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5878915786743164},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5674282312393188},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5425177216529846},{"id":"https://openalex.org/keywords/dual","display_name":"Dual (grammatical number)","score":0.45050740242004395},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4497886300086975},{"id":"https://openalex.org/keywords/segmentation-based-object-categorization","display_name":"Segmentation-based object categorization","score":0.4434361457824707},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.43453770875930786},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4282609522342682},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41379451751708984},{"id":"https://openalex.org/keywords/scale-space-segmentation","display_name":"Scale-space segmentation","score":0.38671234250068665},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.08739596605300903}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8817810416221619},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7415038347244263},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7241684794425964},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6275304555892944},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5878915786743164},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5674282312393188},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5425177216529846},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.45050740242004395},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4497886300086975},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.4434361457824707},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.43453770875930786},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4282609522342682},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41379451751708984},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.38671234250068665},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.08739596605300903},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2022.3225720","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2022.3225720","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G7143284523","display_name":null,"funder_award_id":"62072112","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":79,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W1903029394","https://openalex.org/W2031489346","https://openalex.org/W2291627510","https://openalex.org/W2302255633","https://openalex.org/W2470139095","https://openalex.org/W2562457735","https://openalex.org/W2564998703","https://openalex.org/W2610147486","https://openalex.org/W2750515003","https://openalex.org/W2794847483","https://openalex.org/W2798441772","https://openalex.org/W2799157347","https://openalex.org/W2884585870","https://openalex.org/W2889658408","https://openalex.org/W2889986507","https://openalex.org/W2896457183","https://openalex.org/W2907536214","https://openalex.org/W2916743882","https://openalex.org/W2916797271","https://openalex.org/W2921536280","https://openalex.org/W2945161979","https://openalex.org/W2962825871","https://openalex.org/W2963091558","https://openalex.org/W2963131444","https://openalex.org/W2963227409","https://openalex.org/W2963253279","https://openalex.org/W2963503215","https://openalex.org/W2963563276","https://openalex.org/W2963732700","https://openalex.org/W2964110616","https://openalex.org/W2964211168","https://openalex.org/W2964218467","https://openalex.org/W2964343881","https://openalex.org/W2967622921","https://openalex.org/W2981793666","https://openalex.org/W2990205821","https://openalex.org/W3033502887","https://openalex.org/W3034263000","https://openalex.org/W3034538699","https://openalex.org/W3034798428","https://openalex.org/W3034885317","https://openalex.org/W3035042565","https://openalex.org/W3035077787","https://openalex.org/W3035358681","https://openalex.org/W3035672751","https://openalex.org/W3047258141","https://openalex.org/W3094664776","https://openalex.org/W3098341861","https://openalex.org/W3102457447","https://openalex.org/W3106773277","https://openalex.org/W3107113572","https://openalex.org/W3108819577","https://openalex.org/W3110030584","https://openalex.org/W3117097536","https://openalex.org/W3160550216","https://openalex.org/W3166738350","https://openalex.org/W3169367294","https://openalex.org/W3170630188","https://openalex.org/W3171516518","https://openalex.org/W3175132347","https://openalex.org/W3175373394","https://openalex.org/W3176065502","https://openalex.org/W3177322837","https://openalex.org/W3183673520","https://openalex.org/W3192871594","https://openalex.org/W3200949949","https://openalex.org/W3202509201","https://openalex.org/W4214542306","https://openalex.org/W4239147634","https://openalex.org/W4288374355","https://openalex.org/W6631190155","https://openalex.org/W6696672603","https://openalex.org/W6739901393","https://openalex.org/W6743811873","https://openalex.org/W6759534164","https://openalex.org/W6761623811","https://openalex.org/W6784713722","https://openalex.org/W6796524941"],"related_works":["https://openalex.org/W3144569342","https://openalex.org/W2185902295","https://openalex.org/W2945274617","https://openalex.org/W2103507220","https://openalex.org/W2055202857","https://openalex.org/W2371519352","https://openalex.org/W4205800335","https://openalex.org/W2386644571","https://openalex.org/W2372421320","https://openalex.org/W2901890255"],"abstract_inverted_index":{"In":[0,68],"this":[1],"paper,":[2],"we":[3],"propose":[4],"a":[5,17,21,106],"novel":[6],"approach":[7,141],"to":[8,26,44,61,70,98,116,142],"video":[9,53,143],"object":[10,122,144],"segmentation":[11],"where":[12],"dual":[13,77],"streams":[14],"consisting":[15],"of":[16,31,35,138],"shared":[18],"network":[19,23],"and":[20,38,56,72,84,95,120,133],"special":[22],"are":[24,41,58,92],"designed":[25,111],"constitute":[27],"the":[28,46,52,75,89,113,127,136],"feature":[29],"memory":[30],"history":[32],"frames.":[33],"Cues":[34],"spatial":[36],"position":[37],"time":[39],"stamp":[40],"explicitly":[42],"explored":[43],"learn":[45],"context":[47],"for":[48,66,104,112],"each":[49],"frame":[50],"in":[51,80],"sequence.":[54],"Self-attention":[55],"cross-attention":[57,78],"simultaneously":[59],"exploited":[60],"extract":[62],"more":[63,93,118],"powerful":[64],"features":[65,91],"segmentation.":[67,145],"contrast":[69],"STM":[71],"its":[73],"variants,":[74],"proposed":[76,140],"performs":[79],"both":[81],"appearance":[82],"space":[83,86],"semantic":[85],"such":[87],"that":[88],"derived":[90],"distinctive":[94],"then":[96],"robust":[97],"similar":[99],"overlapping":[100],"objects.":[101],"During":[102],"decoding":[103],"segmentation,":[105],"local":[107],"refinement":[108],"technique":[109],"is":[110],"uncertain":[114],"boundaries":[115],"obtain":[117],"precise":[119],"smooth":[121],"contours.":[123],"Experimental":[124],"results":[125],"on":[126],"challenging":[128],"benchmark":[129],"datasets":[130],"DAVIS-2016,":[131],"DAVIS-2017,":[132],"YouTube-VOS":[134],"demonstrate":[135],"effectiveness":[137],"our":[139]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
