{"id":"https://openalex.org/W4410115110","doi":"https://doi.org/10.1109/tip.2025.3565879","title":"Explicit Motion Handling and Interactive Prompting for Video Camouflaged Object Detection","display_name":"Explicit Motion Handling and Interactive Prompting for Video Camouflaged Object Detection","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4410115110","doi":"https://doi.org/10.1109/tip.2025.3565879","pmid":"https://pubmed.ncbi.nlm.nih.gov/40327478"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2025.3565879","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2025.3565879","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100327451","display_name":"Xin Zhang","orcid":"https://orcid.org/0000-0002-4133-6964"},"institutions":[{"id":"https://openalex.org/I24185976","display_name":"Sichuan University","ror":"https://ror.org/011ashp19","country_code":"CN","type":"education","lineage":["https://openalex.org/I24185976"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xin Zhang","raw_affiliation_strings":["National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0002-4133-6964","affiliations":[{"raw_affiliation_string":"National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","institution_ids":["https://openalex.org/I24185976"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Tao Xiao","orcid":"https://orcid.org/0009-0007-0614-0257"},"institutions":[{"id":"https://openalex.org/I24185976","display_name":"Sichuan University","ror":"https://ror.org/011ashp19","country_code":"CN","type":"education","lineage":["https://openalex.org/I24185976"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tao Xiao","raw_affiliation_strings":["College of Computer Science and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","College of Computer Science, and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China"],"raw_orcid":"https://orcid.org/0009-0007-0614-0257","affiliations":[{"raw_affiliation_string":"College of Computer Science and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","institution_ids":["https://openalex.org/I24185976"]},{"raw_affiliation_string":"College of Computer Science, and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","institution_ids":["https://openalex.org/I24185976"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001285878","display_name":"Ge-Peng Ji","orcid":"https://orcid.org/0000-0001-7092-2877"},"institutions":[{"id":"https://openalex.org/I118347636","display_name":"Australian National University","ror":"https://ror.org/019wvm592","country_code":"AU","type":"education","lineage":["https://openalex.org/I118347636"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Ge-Peng Ji","raw_affiliation_strings":["School of Computing, Australian National University, Canberra, Australia"],"raw_orcid":"https://orcid.org/0000-0001-7092-2877","affiliations":[{"raw_affiliation_string":"School of Computing, Australian National University, Canberra, Australia","institution_ids":["https://openalex.org/I118347636"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042741381","display_name":"Xuan Wu","orcid":"https://orcid.org/0000-0003-2088-9380"},"institutions":[{"id":"https://openalex.org/I24185976","display_name":"Sichuan University","ror":"https://ror.org/011ashp19","country_code":"CN","type":"education","lineage":["https://openalex.org/I24185976"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuan Wu","raw_affiliation_strings":["College of Computer Science and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","College of Computer Science, and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","institution_ids":["https://openalex.org/I24185976"]},{"raw_affiliation_string":"College of Computer Science, and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","institution_ids":["https://openalex.org/I24185976"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042631401","display_name":"Keren Fu","orcid":"https://orcid.org/0000-0002-3195-2077"},"institutions":[{"id":"https://openalex.org/I24185976","display_name":"Sichuan University","ror":"https://ror.org/011ashp19","country_code":"CN","type":"education","lineage":["https://openalex.org/I24185976"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Keren Fu","raw_affiliation_strings":["College of Computer Science and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","College of Computer Science, and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0002-3195-2077","affiliations":[{"raw_affiliation_string":"College of Computer Science and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","institution_ids":["https://openalex.org/I24185976"]},{"raw_affiliation_string":"College of Computer Science, and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","institution_ids":["https://openalex.org/I24185976"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5085914001","display_name":"Qijun Zhao","orcid":"https://orcid.org/0000-0003-4651-7163"},"institutions":[{"id":"https://openalex.org/I24185976","display_name":"Sichuan University","ror":"https://ror.org/011ashp19","country_code":"CN","type":"education","lineage":["https://openalex.org/I24185976"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qijun Zhao","raw_affiliation_strings":["College of Computer Science and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","College of Computer Science, and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0003-4651-7163","affiliations":[{"raw_affiliation_string":"College of Computer Science and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","institution_ids":["https://openalex.org/I24185976"]},{"raw_affiliation_string":"College of Computer Science, and the National Key Laboratory of Fundamental Science on Synthetic Vision, Sichuan University, Chengdu, China","institution_ids":["https://openalex.org/I24185976"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100327451"],"corresponding_institution_ids":["https://openalex.org/I24185976"],"apc_list":null,"apc_paid":null,"fwci":2.2665,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.87738053,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"34","issue":null,"first_page":"2853","last_page":"2866"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11019","display_name":"Image Enhancement Techniques","score":0.9876000285148621,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9761000275611877,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.7441573143005371},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.692948043346405},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6544574499130249},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5265184640884399},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5031434893608093},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.4622623026371002},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.4502628445625305},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.4492338299751282},{"id":"https://openalex.org/keywords/motion-detection","display_name":"Motion detection","score":0.42015135288238525},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.20179754495620728}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.7441573143005371},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.692948043346405},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6544574499130249},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5265184640884399},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5031434893608093},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.4622623026371002},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.4502628445625305},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.4492338299751282},{"id":"https://openalex.org/C2780624872","wikidata":"https://www.wikidata.org/wiki/Q852453","display_name":"Motion detection","level":3,"score":0.42015135288238525},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.20179754495620728}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2025.3565879","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2025.3565879","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:40327478","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40327478","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1560263876","display_name":null,"funder_award_id":"2025ZNSFSC0469","funder_id":"https://openalex.org/F4320336756","funder_display_name":"Tianjin Science and Technology Program"},{"id":"https://openalex.org/G4542985435","display_name":null,"funder_award_id":"62176170","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4709256565","display_name":null,"funder_award_id":"62176169","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5435438650","display_name":null,"funder_award_id":"62176169, 62176170","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320336756","display_name":"Tianjin Science and Technology Program","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":93,"referenced_works":["https://openalex.org/W1849277567","https://openalex.org/W1982075130","https://openalex.org/W1994922096","https://openalex.org/W1995517039","https://openalex.org/W2076756823","https://openalex.org/W2100470808","https://openalex.org/W2110019070","https://openalex.org/W2133665775","https://openalex.org/W2138682569","https://openalex.org/W2151040689","https://openalex.org/W2326050853","https://openalex.org/W2339309815","https://openalex.org/W2470139095","https://openalex.org/W2793029440","https://openalex.org/W2797488090","https://openalex.org/W2884367402","https://openalex.org/W2894890793","https://openalex.org/W2895340898","https://openalex.org/W2942939335","https://openalex.org/W2943125866","https://openalex.org/W2948937967","https://openalex.org/W2961348656","https://openalex.org/W2962823460","https://openalex.org/W2963091558","https://openalex.org/W2963112696","https://openalex.org/W2963868681","https://openalex.org/W2965638232","https://openalex.org/W2969626490","https://openalex.org/W2970648063","https://openalex.org/W2983488121","https://openalex.org/W2984144959","https://openalex.org/W2990205821","https://openalex.org/W2990984982","https://openalex.org/W2997217064","https://openalex.org/W3034684132","https://openalex.org/W3034896357","https://openalex.org/W3044364325","https://openalex.org/W3048236698","https://openalex.org/W3092344722","https://openalex.org/W3108043693","https://openalex.org/W3108460979","https://openalex.org/W3109908659","https://openalex.org/W3122006940","https://openalex.org/W3164098653","https://openalex.org/W3168112135","https://openalex.org/W3172675153","https://openalex.org/W3173782971","https://openalex.org/W3175515048","https://openalex.org/W3199914841","https://openalex.org/W3202285299","https://openalex.org/W3203092180","https://openalex.org/W3212593512","https://openalex.org/W3215023725","https://openalex.org/W4214542306","https://openalex.org/W4221151441","https://openalex.org/W4225672218","https://openalex.org/W4285240374","https://openalex.org/W4308456711","https://openalex.org/W4312258849","https://openalex.org/W4312510454","https://openalex.org/W4312642299","https://openalex.org/W4312651322","https://openalex.org/W4312880622","https://openalex.org/W4315490105","https://openalex.org/W4362654014","https://openalex.org/W4381716707","https://openalex.org/W4382450131","https://openalex.org/W4385245566","https://openalex.org/W4386075647","https://openalex.org/W4386075673","https://openalex.org/W4386076039","https://openalex.org/W4387969595","https://openalex.org/W4388574886","https://openalex.org/W4390659810","https://openalex.org/W4390874575","https://openalex.org/W4391697007","https://openalex.org/W4399923948","https://openalex.org/W4402727860","https://openalex.org/W4402978305","https://openalex.org/W4403081532","https://openalex.org/W4403420280","https://openalex.org/W4406457466","https://openalex.org/W4408634392","https://openalex.org/W6631190155","https://openalex.org/W6685670348","https://openalex.org/W6754033419","https://openalex.org/W6755977528","https://openalex.org/W6759534164","https://openalex.org/W6766978945","https://openalex.org/W6778883912","https://openalex.org/W6796075269","https://openalex.org/W6803857009","https://openalex.org/W6839270766"],"related_works":["https://openalex.org/W4205448459","https://openalex.org/W4292830139","https://openalex.org/W4319309705","https://openalex.org/W3162303681","https://openalex.org/W2965594636","https://openalex.org/W2164674712","https://openalex.org/W3204216905","https://openalex.org/W2017155773","https://openalex.org/W2911525783","https://openalex.org/W4376454785"],"abstract_inverted_index":{"Camouflage":[0],"poses":[1],"notable":[2],"challenges":[3],"in":[4,50,108,160],"distinguishing":[5],"a":[6,59,78,89,161,176,246],"static":[7],"target,":[8],"as":[9,41,175],"it":[10,28],"usually":[11],"blends":[12],"seamlessly":[13],"with":[14,185,206],"the":[15,21,103,125,144,151,195,215,254],"background.":[16],"However,":[17],"any":[18],"movement":[19],"by":[20,88,116,156],"target":[22],"can":[23,171],"disrupt":[24],"this":[25,55],"disguise,":[26],"making":[27],"detectable.":[29],"Existing":[30],"video":[31,242,250],"camouflaged":[32,95,126],"object":[33],"detection":[34,48],"(VCOD)":[35],"approaches":[36],"take":[37],"noisy":[38],"motion":[39,45,74,129,152],"estimation":[40],"input":[42],"or":[43],"model":[44,198,217],"implicitly,":[46],"restricting":[47],"performance":[49],"complex":[51],"dynamic":[52],"scenes.":[53],"In":[54],"paper,":[56],"we":[57,165],"propose":[58],"novel":[60],"Explicit":[61],"Motion":[62],"handling":[63],"and":[64,97,128,136,140,180,225,256],"Interactive":[65],"Prompting":[66],"framework":[67],"for":[68,92],"VCOD,":[69],"dubbed":[70],"EMIP,":[71,194],"which":[72],"handles":[73],"cues":[75],"explicitly":[76],"using":[77],"frozen":[79],"pre-trained":[80],"optical":[81,98,158],"flow":[82,99,159],"fundamental":[83],"model.":[84],"EMIP":[85,179,199,224,226],"is":[86,114,154,264],"characterized":[87],"two-stream":[90],"architecture":[91],"simultaneously":[93],"conducting":[94],"segmentation":[96,243,251],"estimation.":[100],"Interactions":[101],"across":[102],"dual":[104],"streams":[105],"are":[106,131],"realized":[107],"an":[109],"interactive":[110],"prompting":[111],"way":[112],"that":[113,167,222],"inspired":[115],"emerging":[117],"visual":[118],"prompt":[119,148,177],"learning.":[120],"Two":[121],"learnable":[122],"modules,":[123],"i.e.":[124],"feeder":[127],"collector,":[130],"designed":[132],"to":[133,150],"incorporate":[134],"segmentation-to-motion":[135],"motion-to-segmentation":[137],"prompts,":[138],"respectively,":[139],"enhance":[141],"outputs":[142],"of":[143,214,249,260],"both":[145,223],"streams.":[146],"The":[147],"fed":[149],"stream":[153],"learned":[155],"supervising":[157],"self-supervised":[162],"manner.":[163],"Furthermore,":[164],"show":[166],"long-term":[168,197],"historical":[169],"information":[170],"also":[172],"be":[173],"incorporated":[174],"into":[178],"achieve":[181],"more":[182],"robust":[183],"results":[184,220],"temporal":[186],"consistency.":[187],"By":[188],"leveraging":[189],"promoting":[190],"techniques":[191],"based":[192],"on":[193,233,245],"proposed":[196],"${}^{\\dagger":[200,227],"}$":[201,228],"incurs":[202],"lower":[203],"training":[204],"cost":[205],"only":[207],"8.5M":[208],"trainable":[209],"parameters":[210],"(less":[211],"than":[212],"8%":[213],"total":[216],"parameters).":[218],"Experimental":[219],"demonstrate":[221,253],"set":[229],"new":[230],"state-of-the-art":[231],"records":[232],"popular":[234],"VCOD":[235],"benchmarks.":[236],"Additionally,":[237],"comparative":[238],"evaluations":[239],"against":[240],"other":[241],"models":[244],"wider":[247],"range":[248],"tasks":[252],"robustness":[255],"superior":[257],"generalization":[258],"capabilities":[259],"EMIP.":[261],"Our":[262],"code":[263],"made":[265],"publicly":[266],"available":[267],"at":[268],"https://github.com/zhangxin06/EMIP.":[269]},"counts_by_year":[{"year":2026,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
