{"id":"https://openalex.org/W4402500933","doi":"https://doi.org/10.1145/3664647.3681192","title":"Language-Driven Interactive Shadow Detection","display_name":"Language-Driven Interactive Shadow Detection","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4402500933","doi":"https://doi.org/10.1145/3664647.3681192"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3681192","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3681192","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2408.08543","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5074311923","display_name":"Hongqiu Wang","orcid":"https://orcid.org/0000-0001-9726-4253"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Hongqiu Wang","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-9726-4253","affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Wei Wang","orcid":"https://orcid.org/0009-0003-5272-5062"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Wang","raw_affiliation_strings":["University of Electronic Science and Technology of China, Chengdu, China"],"raw_orcid":"https://orcid.org/0009-0003-5272-5062","affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101644087","display_name":"Haipeng Zhou","orcid":"https://orcid.org/0000-0001-5398-7847"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Haipeng Zhou","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0001-5398-7847","affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Huihui Xu","orcid":"https://orcid.org/0009-0006-7868-1100"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huihui Xu","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China"],"raw_orcid":"https://orcid.org/0009-0006-7868-1100","affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou), Guangzhou, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100518821","display_name":"Shaozhi Wu","orcid":"https://orcid.org/0000-0001-5466-8119"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shaozhi Wu","raw_affiliation_strings":["University of Electronic Science and Technology of China, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0001-5466-8119","affiliations":[{"raw_affiliation_string":"University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5016081925","display_name":"Lei Zhu","orcid":"https://orcid.org/0000-0003-3871-663X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lei Zhu","raw_affiliation_strings":["The Hong Kong University of Science and Technology (Guangzhou) &amp; The Hong Kong University of Science and Technology, Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-3871-663X","affiliations":[{"raw_affiliation_string":"The Hong Kong University of Science and Technology (Guangzhou) &amp; The Hong Kong University of Science and Technology, Guangzhou, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5074311923"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.6665,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.85372314,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"5527","last_page":"5536"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12597","display_name":"Fire Detection and Safety Systems","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/2213","display_name":"Safety, Risk, Reliability and Quality"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8733358979225159},{"id":"https://openalex.org/keywords/shadow","display_name":"Shadow (psychology)","score":0.6294616460800171},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6109960079193115},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.5865052938461304},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5369671583175659},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5004794597625732},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.49178555607795715}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8733358979225159},{"id":"https://openalex.org/C117797892","wikidata":"https://www.wikidata.org/wiki/Q286363","display_name":"Shadow (psychology)","level":2,"score":0.6294616460800171},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6109960079193115},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5865052938461304},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5369671583175659},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5004794597625732},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.49178555607795715},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C542102704","wikidata":"https://www.wikidata.org/wiki/Q183257","display_name":"Psychotherapist","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3664647.3681192","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3681192","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2408.08543","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.08543","pdf_url":"https://arxiv.org/pdf/2408.08543","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:repository.hkust.edu.hk:1783.1-148933","is_oa":false,"landing_page_url":"http://repository.hkust.edu.hk/ir/Record/1783.1-148933","pdf_url":null,"source":{"id":"https://openalex.org/S4306401796","display_name":"Rare & Special e-Zone (The Hong Kong University of Science and Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I200769079","host_organization_name":"Hong Kong University of Science and Technology","host_organization_lineage":["https://openalex.org/I200769079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Conference paper"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2408.08543","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2408.08543","pdf_url":"https://arxiv.org/pdf/2408.08543","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.5400000214576721,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G7223822238","display_name":null,"funder_award_id":"2024A03J0618","funder_id":"https://openalex.org/F4320323537","funder_display_name":"Hong Kong University of Science and Technology"}],"funders":[{"id":"https://openalex.org/F4320321920","display_name":"Innovation and Technology Commission","ror":"https://ror.org/04vf9tr09"},{"id":"https://openalex.org/F4320323537","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4402500933.pdf","grobid_xml":"https://content.openalex.org/works/W4402500933.grobid-xml"},"referenced_works_count":50,"referenced_works":["https://openalex.org/W1816614560","https://openalex.org/W1906669240","https://openalex.org/W2027850463","https://openalex.org/W2043422482","https://openalex.org/W2073839959","https://openalex.org/W2113449189","https://openalex.org/W2123302273","https://openalex.org/W2138187652","https://openalex.org/W2147558395","https://openalex.org/W2166502676","https://openalex.org/W2176911336","https://openalex.org/W2194775991","https://openalex.org/W2206865673","https://openalex.org/W2251512949","https://openalex.org/W2565639579","https://openalex.org/W2605127024","https://openalex.org/W2771617895","https://openalex.org/W2895126795","https://openalex.org/W2962766617","https://openalex.org/W3030561198","https://openalex.org/W3034627419","https://openalex.org/W3035462037","https://openalex.org/W3102699694","https://openalex.org/W3107179267","https://openalex.org/W3175028288","https://openalex.org/W3175990321","https://openalex.org/W3178075329","https://openalex.org/W3188140417","https://openalex.org/W3205656514","https://openalex.org/W3205688125","https://openalex.org/W3206381516","https://openalex.org/W3207737630","https://openalex.org/W3215899623","https://openalex.org/W4211053420","https://openalex.org/W4226024706","https://openalex.org/W4304084084","https://openalex.org/W4309131501","https://openalex.org/W4312690830","https://openalex.org/W4383097625","https://openalex.org/W4387422830","https://openalex.org/W4387968016","https://openalex.org/W4388191286","https://openalex.org/W4390872515","https://openalex.org/W4390872868","https://openalex.org/W4390873204","https://openalex.org/W4399512996","https://openalex.org/W4400525960","https://openalex.org/W4401306839","https://openalex.org/W4402917209","https://openalex.org/W4403780784"],"related_works":["https://openalex.org/W2893218741","https://openalex.org/W4392589133","https://openalex.org/W2558319350","https://openalex.org/W1492594177","https://openalex.org/W1842742976","https://openalex.org/W2803235238","https://openalex.org/W3112085556","https://openalex.org/W399661440","https://openalex.org/W4392585872","https://openalex.org/W410356389"],"abstract_inverted_index":{"Traditional":[0],"shadow":[1,6,57,199,217],"detectors":[2],"often":[3],"identify":[4],"all":[5],"regions":[7],"of":[8,37,55,59,118,129,192,249],"static":[9],"images":[10],"or":[11],"video":[12,93,195,230],"sequences.":[13],"This":[14,48],"work":[15],"presents":[16],"the":[17,30,35,85,101,127,135,155,193,228],"Referring":[18,148],"Video":[19],"Shadow":[20,206],"Detection":[21],"(RVSD),":[22],"which":[23,110],"is":[24,134],"an":[25],"innovative":[26],"task":[27],"that":[28,235],"rejuvenates":[29],"classic":[31],"paradigm":[32],"by":[33,78,224],"facilitating":[34],"segmentation":[36,54],"particular":[38],"shadows":[39],"in":[40],"videos":[41,113],"based":[42,61],"on":[43,62,142],"descriptive":[44],"natural":[45,80],"language":[46,81],"prompts.":[47],"novel":[49],"RVSD":[50,102,108,156,242],"not":[51],"only":[52],"achieves":[53,238],"arbitrary":[56],"areas":[58],"interest":[60],"descriptions":[63,122],"(flexibility)":[64],"but":[65],"also":[66,202],"allows":[67],"users":[68],"to":[69,95,168,189,209,213],"interact":[70],"with":[71,123,227,243],"visual":[72,222],"content":[73],"more":[74,221],"directly":[75],"and":[76,114,173,178,253],"naturally":[77],"using":[79],"prompts":[82],"(interactivity),":[83],"paving":[84],"way":[86],"for":[87,138,153,197,219,241],"abundant":[88],"applications":[89],"ranging":[90],"from":[91],"advanced":[92],"editing":[94],"virtual":[96],"reality":[97],"experiences.":[98],"To":[99,126],"pioneer":[100],"research,":[103],"we":[104,145,161],"curated":[105],"a":[106,115,147,163,185,204,215,244],"well-annotated":[107],"dataset,":[109,144],"encompasses":[111],"86":[112],"rich":[116],"set":[117],"15,011":[119],"paired":[120],"textual":[121],"corresponding":[124],"shadows.":[125],"best":[128],"our":[130,159,236],"knowledge,":[131],"this":[132,143],"dataset":[133,254],"first":[136],"one":[137],"addressing":[139,154],"RVSD.":[140],"Based":[141],"propose":[146],"Shadow-Track":[149],"Memory":[150,166],"Network":[151],"(RSM-Net)":[152],"task.":[157],"In":[158],"RSM-Net,":[160],"devise":[162],"Twin-Track":[164],"Synergistic":[165],"(TSM)":[167],"store":[169],"intra-clip":[170],"memory":[171,176,182,186],"features":[172,183,191,223],"hierarchical":[174],"inter-clip":[175],"features,":[177],"then":[179],"pass":[180],"these":[181],"into":[184],"read":[187],"module":[188],"refine":[190],"current":[194],"frame":[196],"referring":[198],"detection.":[200],"We":[201],"develop":[203],"Mixed-Prior":[205],"Attention":[207],"(MSA)":[208],"utilize":[210],"physical":[211],"priors":[212],"obtain":[214],"coarse":[216],"map":[218],"learning":[220],"weighting":[225],"it":[226],"input":[229],"frame.":[231],"Experimental":[232],"results":[233],"show":[234],"RSM-Net":[237],"state-of-the-art":[239],"performance":[240],"notable":[245],"Overall":[246],"IOU":[247],"increase":[248],"4.4%.":[250],"Our":[251],"code":[252],"are":[255],"available":[256],"at":[257],"https://github.com/whq-xxh/RVSD.":[258]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
