{"id":"https://openalex.org/W4415883054","doi":"https://doi.org/10.1109/tcsvt.2025.3628630","title":"Learning Confidence-Aware Prototypes for Weakly-Supervised Video Anomaly Detection","display_name":"Learning Confidence-Aware Prototypes for Weakly-Supervised Video Anomaly Detection","publication_year":2025,"publication_date":"2025-11-04","ids":{"openalex":"https://openalex.org/W4415883054","doi":"https://doi.org/10.1109/tcsvt.2025.3628630"},"language":null,"primary_location":{"id":"doi:10.1109/tcsvt.2025.3628630","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3628630","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100457290","display_name":"Zhao Xie","orcid":"https://orcid.org/0000-0001-9834-4730"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhao Xie","raw_affiliation_strings":["School of Computer and Information, Hefei University of Technology, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0001-9834-4730","affiliations":[{"raw_affiliation_string":"School of Computer and Information, Hefei University of Technology, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jinkang Luo","orcid":null},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinkang Luo","raw_affiliation_strings":["School of Computer and Information, Hefei University of Technology, Hefei, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer and Information, Hefei University of Technology, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100609001","display_name":"Kewei Wu","orcid":"https://orcid.org/0000-0002-7332-5653"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kewei Wu","raw_affiliation_strings":["School of Computer and Information, Hefei University of Technology, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0002-7332-5653","affiliations":[{"raw_affiliation_string":"School of Computer and Information, Hefei University of Technology, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052517470","display_name":"Zhehan Kan","orcid":"https://orcid.org/0000-0002-1069-649X"},"institutions":[{"id":"https://openalex.org/I3131625388","display_name":"University Town of Shenzhen","ror":"https://ror.org/05f5j6225","country_code":"CN","type":"education","lineage":["https://openalex.org/I3131625388"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhehan Kan","raw_affiliation_strings":["Shenzhen International Graduate School, Tsinghua University, Beijing, China","Shenzhen International Graduate School, Tsinghua University, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shenzhen International Graduate School, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]},{"raw_affiliation_string":"Shenzhen International Graduate School, Tsinghua University, China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059530979","display_name":"Dan Guo","orcid":"https://orcid.org/0000-0003-2594-254X"},"institutions":[{"id":"https://openalex.org/I16365422","display_name":"Hefei University of Technology","ror":"https://ror.org/02czkny70","country_code":"CN","type":"education","lineage":["https://openalex.org/I16365422"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dan Guo","raw_affiliation_strings":["School of Computer and Information, Hefei University of Technology, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0003-2594-254X","affiliations":[{"raw_affiliation_string":"School of Computer and Information, Hefei University of Technology, Hefei, China","institution_ids":["https://openalex.org/I16365422"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.15211499,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"36","issue":"4","first_page":"5714","last_page":"5728"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9635999798774719,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9635999798774719,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.01730000041425228,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.005200000014156103,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/snippet","display_name":"Snippet","score":0.8281999826431274},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.6154999732971191},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5058000087738037},{"id":"https://openalex.org/keywords/bag-of-words-model","display_name":"Bag-of-words model","score":0.4284999966621399},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.42100000381469727},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.40380001068115234}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8499000072479248},{"id":"https://openalex.org/C2777822670","wikidata":"https://www.wikidata.org/wiki/Q1120538","display_name":"Snippet","level":2,"score":0.8281999826431274},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.6154999732971191},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5058000087738037},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4966999888420105},{"id":"https://openalex.org/C13672336","wikidata":"https://www.wikidata.org/wiki/Q3460803","display_name":"Bag-of-words model","level":2,"score":0.4284999966621399},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.42100000381469727},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.40380001068115234},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.396699994802475},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.37950000166893005},{"id":"https://openalex.org/C739882","wikidata":"https://www.wikidata.org/wiki/Q3560506","display_name":"Anomaly detection","level":2,"score":0.37389999628067017},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34540000557899475},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.2937000095844269},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.287200003862381},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2856999933719635},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2732999920845032},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2572999894618988},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.25290000438690186}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2025.3628630","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3628630","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4862433228","display_name":null,"funder_award_id":"62272144","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5858203771","display_name":null,"funder_award_id":"62576131","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6212260119","display_name":null,"funder_award_id":"GXXT-2023-015","funder_id":"https://openalex.org/F4320334897","funder_display_name":"Natural Science Foundation of Anhui Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320334897","display_name":"Natural Science Foundation of Anhui Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Weakly":[0],"supervised":[1],"video":[2,33],"anomaly":[3,261,265],"detection":[4],"aims":[5],"to":[6,17,53,86,115,138,151,184,196,223,249,283],"identify":[7],"abnormal":[8,32],"snippets":[9,30,104,113,133,137,146,165,183,215],"in":[10,25,31,117,134,160,172,216],"untrimmed":[11],"videos.":[12],"Existing":[13],"methods":[14],"learn":[15,250],"prototypes":[16,234],"describe":[18],"global":[19],"representation":[20,202],"of":[21,100,288],"snippet":[22],"distributions.":[23],"But,":[24],"weakly-labeled":[26],"videos,":[27],"the":[28,61,98,118,135,155,161,168,200,204,217,245,251,258,276,286],"normal":[29,214],"may":[34,47,108,166],"take":[35,109],"high-uncertainty":[36,106,132,148],"labels":[37,107,149,195],"for":[38,260,297],"distribution":[39,210,219],"modeling.":[40],"Without":[41],"confidence-aware":[42,73,178],"modeling,":[43],"abnormal/normal":[44,121],"prototype":[45,74,79,82,141,156,174,187,201,209,226,232,247],"distributions":[46],"overlap":[48,119],"with":[49,105,147,203,220],"each":[50,101],"other,":[51],"leading":[52],"inaccurate":[54],"predictions.":[55],"In":[56],"this":[57],"work,":[58],"we":[59,198,291],"propose":[60],"Unified":[62],"Confident":[63],"Prototype":[64],"(UCP)":[65],"model,":[66],"which":[67,130,180,212],"contains":[68],"a":[69,72,77],"feature":[70],"extractor,":[71],"learner,":[75],"and":[76,91,279],"local-global":[78,246,254],"unifier.":[80],"The":[81],"learning":[83,97],"is":[84],"designed":[85],"ensure":[87,139,185,224],"proper":[88],"separability,":[89],"stability,":[90],"representation.":[92],"<italic":[93,143,189,228],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[94,144,190,229],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">First</i>,":[95],"after":[96,192],"weight":[99],"snippet\u2019s":[102],"loss,":[103],"small":[110],"weights.":[111],"These":[112,164],"tend":[114,150],"lie":[116],"between":[120],"distributions,":[122],"hindering":[123],"their":[124],"separation.":[125],"We":[126,176,207,242],"design":[127,177,208],"uncertainty-aware":[128],"sampling,":[129,179],"removes":[131,181],"small-weight":[136],"separable":[140],"learning.":[142,175,188,227],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Second</i>,":[145],"be":[152,236],"far":[153],"from":[154],"center,":[157],"thus":[158],"falling":[159],"low-confidence":[162,182],"region.":[163],"enlarge":[167],"distribution\u2019s":[169,205],"variation,":[170],"resulting":[171],"unstable":[173],"stable":[186],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Third</i>,":[191],"assigning":[193],"pseudo":[194],"prototypes,":[197],"measure":[199],"purity.":[206],"purification,":[211],"penalizes":[213],"abnormal-majority":[218],"purity":[221],"loss":[222],"representative":[225],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Fourth</i>,":[230],"beyond":[231],"learning,":[233],"can":[235],"enhanced":[237],"by":[238],"local/global":[239],"temporal":[240,299],"semantics.":[241],"further":[243,284,292],"introduce":[244],"unifier":[248],"relations":[252],"across":[253],"durations,":[255],"thereby":[256],"enhancing":[257],"semantics":[259],"detection.":[262],"For":[263],"weakly-supervised":[264,298],"detection,":[266],"experiments":[267,294],"demonstrate":[268],"that":[269],"our":[270,289],"method":[271],"achieves":[272],"state-of-the-art":[273],"performance":[274],"on":[275,295],"UCF-Crime,":[277],"ShanghaiTech,":[278],"XD-Violence":[280],"datasets.":[281],"Moreover,":[282],"verify":[285],"generality":[287],"method,":[290],"conduct":[293],"THUMOS\u201914":[296],"action":[300],"localization.":[301]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-11-04T00:00:00"}
