{"id":"https://openalex.org/W4387197080","doi":"https://doi.org/10.1109/tcsvt.2023.3320688","title":"Detect Any Shadow: Segment Anything for Video Shadow Detection","display_name":"Detect Any Shadow: Segment Anything for Video Shadow Detection","publication_year":2023,"publication_date":"2023-09-29","ids":{"openalex":"https://openalex.org/W4387197080","doi":"https://doi.org/10.1109/tcsvt.2023.3320688"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2023.3320688","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3320688","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100319201","display_name":"Yonghui Wang","orcid":"https://orcid.org/0000-0002-4741-8231"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yonghui Wang","raw_affiliation_strings":["Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-Spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-Spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046805800","display_name":"Wengang Zhou","orcid":"https://orcid.org/0000-0003-1690-9836"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wengang Zhou","raw_affiliation_strings":["Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-Spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China","Institute of Artificial Intelligence, Hefei Comprehensive National Science Center, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-Spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Institute of Artificial Intelligence, Hefei Comprehensive National Science Center, Hefei, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088650924","display_name":"Yunyao Mao","orcid":"https://orcid.org/0000-0002-9427-9086"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunyao Mao","raw_affiliation_strings":["Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-Spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-Spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5078141810","display_name":"Houqiang Li","orcid":"https://orcid.org/0000-0003-2188-3028"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Houqiang Li","raw_affiliation_strings":["Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-Spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China","Institute of Artificial Intelligence, Hefei Comprehensive National Science Center, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Department of Electronic Engineering and Information Science, CAS Key Laboratory of Technology in Geo-Spatial Information Processing and Application System, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"Institute of Artificial Intelligence, Hefei Comprehensive National Science Center, Hefei, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100319201"],"corresponding_institution_ids":["https://openalex.org/I126520041"],"apc_list":null,"apc_paid":null,"fwci":3.4009,"has_fulltext":false,"cited_by_count":28,"citation_normalized_percentile":{"value":0.94150007,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"34","issue":"5","first_page":"3782","last_page":"3794"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9904000163078308,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7892698645591736},{"id":"https://openalex.org/keywords/bounding-overwatch","display_name":"Bounding overwatch","score":0.7745341062545776},{"id":"https://openalex.org/keywords/shadow","display_name":"Shadow (psychology)","score":0.7211695909500122},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6714310050010681},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6451340913772583},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6028963923454285},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.5711972117424011},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.5278289914131165},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5197058320045471},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.45733529329299927},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.43467479944229126},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.416305273771286},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.12338748574256897}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7892698645591736},{"id":"https://openalex.org/C63584917","wikidata":"https://www.wikidata.org/wiki/Q333286","display_name":"Bounding overwatch","level":2,"score":0.7745341062545776},{"id":"https://openalex.org/C117797892","wikidata":"https://www.wikidata.org/wiki/Q286363","display_name":"Shadow (psychology)","level":2,"score":0.7211695909500122},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6714310050010681},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6451340913772583},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6028963923454285},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.5711972117424011},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.5278289914131165},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5197058320045471},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.45733529329299927},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.43467479944229126},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.416305273771286},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.12338748574256897},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C542102704","wikidata":"https://www.wikidata.org/wiki/Q183257","display_name":"Psychotherapist","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2023.3320688","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3320688","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":78,"referenced_works":["https://openalex.org/W1522301498","https://openalex.org/W1566291503","https://openalex.org/W2004707373","https://openalex.org/W2023151535","https://openalex.org/W2062385571","https://openalex.org/W2073839959","https://openalex.org/W2078065374","https://openalex.org/W2085910047","https://openalex.org/W2100493112","https://openalex.org/W2108598243","https://openalex.org/W2111486566","https://openalex.org/W2118143383","https://openalex.org/W2122514671","https://openalex.org/W2130210787","https://openalex.org/W2132951367","https://openalex.org/W2133593693","https://openalex.org/W2139232681","https://openalex.org/W2141562793","https://openalex.org/W2143373691","https://openalex.org/W2159668031","https://openalex.org/W2159920946","https://openalex.org/W2170405326","https://openalex.org/W2519623608","https://openalex.org/W2544806203","https://openalex.org/W2560023338","https://openalex.org/W2560311620","https://openalex.org/W2565639579","https://openalex.org/W2765535295","https://openalex.org/W2771617895","https://openalex.org/W2890447039","https://openalex.org/W2895126795","https://openalex.org/W2895340898","https://openalex.org/W2899663614","https://openalex.org/W2916743882","https://openalex.org/W2916797271","https://openalex.org/W2948670693","https://openalex.org/W2955084925","https://openalex.org/W2963163009","https://openalex.org/W2963299740","https://openalex.org/W2965373594","https://openalex.org/W2986056979","https://openalex.org/W2990205821","https://openalex.org/W3034627419","https://openalex.org/W3035244041","https://openalex.org/W3096609285","https://openalex.org/W3102699694","https://openalex.org/W3115300452","https://openalex.org/W3120736405","https://openalex.org/W3138516171","https://openalex.org/W3171516518","https://openalex.org/W3175028288","https://openalex.org/W3192871594","https://openalex.org/W3195577433","https://openalex.org/W3204290641","https://openalex.org/W4200631531","https://openalex.org/W4288089799","https://openalex.org/W4292945941","https://openalex.org/W4309131501","https://openalex.org/W4312396403","https://openalex.org/W4312433277","https://openalex.org/W4312532041","https://openalex.org/W4312545381","https://openalex.org/W4313156423","https://openalex.org/W4379659756","https://openalex.org/W4385245566","https://openalex.org/W4390874575","https://openalex.org/W6631190155","https://openalex.org/W6754033419","https://openalex.org/W6755207826","https://openalex.org/W6755977528","https://openalex.org/W6759534164","https://openalex.org/W6769627184","https://openalex.org/W6784094891","https://openalex.org/W6791353385","https://openalex.org/W6796505553","https://openalex.org/W6797263693","https://openalex.org/W6800751262","https://openalex.org/W6842542540"],"related_works":["https://openalex.org/W2893218741","https://openalex.org/W3125011624","https://openalex.org/W1508631387","https://openalex.org/W2370917603","https://openalex.org/W4392589133","https://openalex.org/W2952760143","https://openalex.org/W2558319350","https://openalex.org/W1492594177","https://openalex.org/W2017776670","https://openalex.org/W1842742976"],"abstract_inverted_index":{"Segment":[0],"anything":[1],"model":[2],"(SAM)":[3],"has":[4],"achieved":[5],"great":[6],"success":[7],"in":[8,162],"the":[9,77,82,89,106,111,150,159,184],"field":[10],"of":[11,152,164,188],"natural":[12],"image":[13],"segmentation.":[14],"Nevertheless,":[15],"SAM":[16,44,70],"tends":[17],"to":[18,45,100,124,177],"consider":[19],"shadows":[20],"as":[21,115],"background":[22],"and":[23,131,166,186],"therefore":[24],"does":[25],"not":[26],"perform":[27],"segmentation":[28],"on":[29,71],"them.":[30],"In":[31],"this":[32],"paper,":[33],"we":[34,57,67,92,118],"propose":[35],"ShadowSAM,":[36],"a":[37,102,116,120],"simple":[38],"yet":[39],"effective":[40],"framework":[41],"for":[42,61],"fine-tuning":[43],"detect":[46,101],"shadows.":[47],"Besides,":[48],"by":[49,75,96],"combining":[50],"it":[51],"with":[52,155],"long":[53,121],"short-term":[54,122],"attention":[55],"mechanism,":[56],"extend":[58],"its":[59],"capability":[60],"efficient":[62],"video":[63,144,179],"shadow":[64,85,113,140,180],"detection.":[65],"Specifically,":[66],"first":[68,107],"fine-tune":[69],"ViSha":[72],"training":[73],"dataset":[74],"utilizing":[76],"bounding":[78,98],"boxes":[79,99],"obtained":[80],"from":[81],"ground":[83],"truth":[84],"mask.":[86],"Then":[87],"during":[88],"inference":[90,174],"stage,":[91],"simulate":[93],"user":[94],"interaction":[95],"providing":[97],"specific":[103],"frame":[104],"(e.g.,":[105],"frame).":[108],"Subsequently,":[109],"using":[110],"detected":[112],"mask":[114],"prior,":[117],"employ":[119],"network":[123],"learn":[125],"spatial":[126],"correlations":[127],"between":[128,134],"distant":[129],"frames":[130],"temporal":[132],"consistency":[133],"adjacent":[135],"frames,":[136],"thereby":[137],"achieving":[138],"precise":[139],"information":[141],"propagation":[142],"across":[143],"frames.":[145],"Extensive":[146],"experimental":[147],"results":[148],"demonstrate":[149],"effectiveness":[151,185],"our":[153,170,189],"method,":[154],"notable":[156],"margin":[157],"over":[158],"state-of-the-art":[160],"approaches":[161],"terms":[163],"MAE":[165],"IoU":[167],"metrics.":[168],"Moreover,":[169],"method":[171],"exhibits":[172],"accelerated":[173],"speed":[175],"compared":[176],"previous":[178],"detection":[181],"approaches,":[182],"validating":[183],"efficiency":[187],"method.":[190],"The":[191],"source":[192],"code":[193],"is":[194],"now":[195],"publicly":[196],"available":[197],"at":[198],"<uri":[199],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[200],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">https://github.com/harrytea/Detect-AnyShadow</uri>":[201],".":[202]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":14}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
