{"id":"https://openalex.org/W4413925581","doi":"https://doi.org/10.1109/tmm.2025.3604935","title":"IVAC-$\\mathbf {P^{2}L}$: Leveraging Irregular Repetition Priors for Improving Video Action Counting","display_name":"IVAC-$\\mathbf {P^{2}L}$: Leveraging Irregular Repetition Priors for Improving Video Action Counting","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4413925581","doi":"https://doi.org/10.1109/tmm.2025.3604935"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2025.3604935","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3604935","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100459499","display_name":"Hang Wang","orcid":"https://orcid.org/0000-0001-9876-8285"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hang Wang","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University, Xi&#x2019;An, China","Xi&#x0027;an Jiaotong University, China"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University, Xi&#x2019;An, China","institution_ids":["https://openalex.org/I87445476"]},{"raw_affiliation_string":"Xi&#x0027;an Jiaotong University, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058898461","display_name":"Zhi-Qi Cheng","orcid":"https://orcid.org/0000-0002-1720-2085"},"institutions":[{"id":"https://openalex.org/I4210150356","display_name":"University of Washington Tacoma","ror":"https://ror.org/05n8t2628","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701","https://openalex.org/I4210150356"]},{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhi-Qi Cheng","raw_affiliation_strings":["Tacoma School of Engineering &amp; Technology, University of Washington, Tacoma, WA, USA","Language Technologies Institute, Carnegie Mellon University, Pittsburgh, PA, USA"],"affiliations":[{"raw_affiliation_string":"Tacoma School of Engineering &amp; Technology, University of Washington, Tacoma, WA, USA","institution_ids":["https://openalex.org/I4210150356"]},{"raw_affiliation_string":"Language Technologies Institute, Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074080669","display_name":"Youtian Du","orcid":"https://orcid.org/0000-0002-1714-3433"},"institutions":[{"id":"https://openalex.org/I87445476","display_name":"Xi'an Jiaotong University","ror":"https://ror.org/017zhmm22","country_code":"CN","type":"education","lineage":["https://openalex.org/I87445476"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Youtian Du","raw_affiliation_strings":["Xi&#x2019;an Jiaotong University, Xi&#x2019;An, China","Xi&#x0027;an Jiaotong University, China"],"affiliations":[{"raw_affiliation_string":"Xi&#x2019;an Jiaotong University, Xi&#x2019;An, China","institution_ids":["https://openalex.org/I87445476"]},{"raw_affiliation_string":"Xi&#x0027;an Jiaotong University, China","institution_ids":["https://openalex.org/I87445476"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100433899","display_name":"Lei Zhang","orcid":"https://orcid.org/0000-0002-2078-4215"},"institutions":[{"id":"https://openalex.org/I14243506","display_name":"Hong Kong Polytechnic University","ror":"https://ror.org/0030zas98","country_code":"HK","type":"education","lineage":["https://openalex.org/I14243506"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Lei Zhang","raw_affiliation_strings":["The Hong Kong Polytechnic University, Hong Kong"],"affiliations":[{"raw_affiliation_string":"The Hong Kong Polytechnic University, Hong Kong","institution_ids":["https://openalex.org/I14243506"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100459499"],"corresponding_institution_ids":["https://openalex.org/I87445476"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.217284,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"27","issue":null,"first_page":"8325","last_page":"8339"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9821000099182129,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8100180625915527},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.5993326306343079},{"id":"https://openalex.org/keywords/repetition","display_name":"Repetition (rhetorical device)","score":0.5781395435333252},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5349560976028442},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32049620151519775},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.12475085258483887}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8100180625915527},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.5993326306343079},{"id":"https://openalex.org/C2776141515","wikidata":"https://www.wikidata.org/wiki/Q1274479","display_name":"Repetition (rhetorical device)","level":2,"score":0.5781395435333252},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5349560976028442},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32049620151519775},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.12475085258483887},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2025.3604935","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3604935","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4208651041","display_name":null,"funder_award_id":"T2341003","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G659122245","display_name":null,"funder_award_id":"62441238","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8983850641","display_name":null,"funder_award_id":"U24B20185","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W1980331821","https://openalex.org/W2024398060","https://openalex.org/W2076087677","https://openalex.org/W2084681041","https://openalex.org/W2096733369","https://openalex.org/W2103253739","https://openalex.org/W2138621090","https://openalex.org/W2143023146","https://openalex.org/W2200707618","https://openalex.org/W2337500368","https://openalex.org/W2914426823","https://openalex.org/W2963073306","https://openalex.org/W2963514444","https://openalex.org/W2964290934","https://openalex.org/W3034491703","https://openalex.org/W3034527633","https://openalex.org/W3034572008","https://openalex.org/W3034802267","https://openalex.org/W3035358327","https://openalex.org/W3108316907","https://openalex.org/W3120494681","https://openalex.org/W3126432642","https://openalex.org/W3136965813","https://openalex.org/W3145385912","https://openalex.org/W3159619744","https://openalex.org/W3166712493","https://openalex.org/W3173632533","https://openalex.org/W3174490084","https://openalex.org/W3175220218","https://openalex.org/W3176411119","https://openalex.org/W3176780013","https://openalex.org/W3200162518","https://openalex.org/W3204090293","https://openalex.org/W3204116406","https://openalex.org/W4214727094","https://openalex.org/W4221166385","https://openalex.org/W4226146163","https://openalex.org/W4226380330","https://openalex.org/W4285806903","https://openalex.org/W4312385123","https://openalex.org/W4312403713","https://openalex.org/W4312453523","https://openalex.org/W4312509322","https://openalex.org/W4312560592","https://openalex.org/W4312772544","https://openalex.org/W4312939486","https://openalex.org/W4323065192","https://openalex.org/W4381233075","https://openalex.org/W4386231783","https://openalex.org/W4403002315"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4386190339","https://openalex.org/W2968424575","https://openalex.org/W3142333283","https://openalex.org/W2580650124","https://openalex.org/W3122088529","https://openalex.org/W3041320102","https://openalex.org/W2111669074"],"abstract_inverted_index":{"The":[0],"quantification":[1],"of":[2,76,127,147,169,271,278],"repetitive":[3],"actions":[4,128],"in":[5,21,26,43,83,116,156,232,274,281,291],"videos,":[6],"a":[7,18,60,117,140,165,176,189,201,229],"task":[8],"commonly":[9],"referred":[10],"to":[11,34,192,204],"as":[12,47],"Video":[13,68],"Action":[14,69],"Counting":[15,70],"(VAC),":[16],"is":[17],"critical":[19],"challenge":[20],"understanding":[22,293],"and":[23,29,49,98,150,171,200,209,244,258,294],"analyzing":[24],"content":[25],"sports,":[27],"fitness,":[28],"daily":[30],"activities.":[31],"Traditional":[32],"approaches":[33],"VAC":[35,237],"have":[36],"largely":[37],"overlooked":[38],"the":[39,74,78,107,125,145,153,194,216,236,269,276],"nuanced":[40],"irregularities":[41],"inherent":[42,154],"action":[44],"repetitions,":[45],"such":[46],"interruptions":[48],"variable":[50],"lengths":[51],"between":[52,129,144,207],"cycles.":[53],"Addressing":[54],"this":[55],"gap,":[56],"our":[57,221,240,272],"study":[58],"introduces":[59],"novel":[61,166],"perspective":[62],"on":[63,66,215,253],"VAC,":[64],"focusing":[65],"Irregular":[67],"(IVAC),":[71],"which":[72],"emphasizes":[73],"importance":[75],"modeling":[77],"irregular":[79,279],"repetition":[80],"priors":[81,89],"present":[82],"video":[84,118,248,292],"content.":[85,157],"We":[86],"conceptualize":[87],"these":[88,161],"through":[90],"two":[91,254],"key":[92],"aspects:":[93],"<italic":[94,99],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[95,100,109,120,131,181,223],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Inter-cycle":[96],"Consistency</i>":[97],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Cycle-interval":[101],"Inconsistency</i>.":[102],"Inter-cycle":[103],"Consistency":[104],"ensures":[105],"that":[106,220],"<bold":[108,119,130],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">spatiotemporal</b>":[110],"representations":[111,146],"across":[112,246],"all":[113],"cycle":[114,133,148,197,208],"segments":[115,149],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">remain</b>":[121],"homogeneous,":[122],"thereby":[123],"reflecting":[124],"uniformity":[126],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">different":[132],"segments</b>.":[134],"In":[135],"contrast,":[136],"Cycle-interval":[137],"Inconsistency":[138],"mandates":[139],"clear":[141],"semantic":[142],"distinction":[143],"intervals,":[151],"acknowledging":[152],"dissimilarities":[155],"To":[158],"effectively":[159],"encapsulate":[160],"priors,":[162],"we":[163],"introduce":[164],"methodology":[167],"consisting":[168],"consistency":[170],"inconsistency":[172],"modules,":[173],"underpinned":[174],"by":[175],"tailored":[177],"pull-push":[178],"loss":[179,191,203],"(<inline-formula":[180],"xmlns:xlink=\"http://www.w3.org/1999/xlink\"><tex-math":[182,224],"notation=\"LaTeX\">$\\mathrm":[183,225],"{P^{2}~L}$</tex-math></inline-formula>)":[184],"mechanism.":[185],"This":[186],"approach":[187,273],"employs":[188],"pull":[190],"enhance":[193],"cohesion":[195],"among":[196],"segment":[198,211],"features":[199],"push":[202],"distinctly":[205],"differentiate":[206],"interval":[210],"features.":[212],"Empirical":[213],"evaluations":[214],"RepCount":[217],"dataset":[218],"illustrate":[219],"IVAC-<inline-formula":[222],"{P^{2}~L}$</tex-math></inline-formula>":[226],"model":[227,241],"sets":[228],"new":[230,286],"benchmark":[231],"state-of-the-art":[233],"performance":[234,252],"for":[235,288],"task.":[238],"Moreover,":[239],"demonstrates":[242],"adaptability":[243],"generalization":[245],"diverse":[247],"content,":[249],"achieving":[250],"superior":[251],"additional":[255],"datasets,":[256],"UCFRep":[257],"Countix,":[259],"without":[260],"necessitating":[261],"dataset-specific":[262],"fine-tuning.":[263],"These":[264],"findings":[265],"not":[266],"only":[267],"validate":[268],"effectiveness":[270],"addressing":[275],"complexities":[277],"repetitions":[280],"videos":[282],"but":[283],"also":[284],"open":[285],"avenues":[287],"future":[289],"research":[290],"analysis.":[295]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
