{"id":"https://openalex.org/W4392847157","doi":"https://doi.org/10.1142/s0218001424500058","title":"Motion Vector-Based Self-Attention for Real-Time Human Activity Recognition in Compressed Videos: The MVViT Approach","display_name":"Motion Vector-Based Self-Attention for Real-Time Human Activity Recognition in Compressed Videos: The MVViT Approach","publication_year":2024,"publication_date":"2024-03-15","ids":{"openalex":"https://openalex.org/W4392847157","doi":"https://doi.org/10.1142/s0218001424500058"},"language":"en","primary_location":{"id":"doi:10.1142/s0218001424500058","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0218001424500058","pdf_url":null,"source":{"id":"https://openalex.org/S41486457","display_name":"International Journal of Pattern Recognition and Artificial Intelligence","issn_l":"0218-0014","issn":["0218-0014","1793-6381"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Pattern Recognition and Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103166464","display_name":"S. M. Praveenkumar","orcid":null},"institutions":[{"id":"https://openalex.org/I3132975163","display_name":"KLE Technological University","ror":"https://ror.org/04yh52k23","country_code":"IN","type":"education","lineage":["https://openalex.org/I3132975163"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"S. M. Praveenkumar","raw_affiliation_strings":["Department of Computer Applications, KLE Technological University, Vidayanagr, Hubballi, Karnataka 580031, India"],"raw_orcid":"https://orcid.org/0000-0003-0296-4287","affiliations":[{"raw_affiliation_string":"Department of Computer Applications, KLE Technological University, Vidayanagr, Hubballi, Karnataka 580031, India","institution_ids":["https://openalex.org/I3132975163"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090769834","display_name":"Prakashgoud Patil","orcid":"https://orcid.org/0000-0002-2187-7667"},"institutions":[{"id":"https://openalex.org/I3132975163","display_name":"KLE Technological University","ror":"https://ror.org/04yh52k23","country_code":"IN","type":"education","lineage":["https://openalex.org/I3132975163"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Prakashgoud Patil","raw_affiliation_strings":["Department of Computer Applications, KLE Technological University, Vidayanagr, Hubballi, Karnataka 580031, India"],"raw_orcid":"https://orcid.org/0000-0002-2187-7667","affiliations":[{"raw_affiliation_string":"Department of Computer Applications, KLE Technological University, Vidayanagr, Hubballi, Karnataka 580031, India","institution_ids":["https://openalex.org/I3132975163"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101626362","display_name":"P. S. Hiremath","orcid":"https://orcid.org/0000-0001-7640-6937"},"institutions":[{"id":"https://openalex.org/I3132975163","display_name":"KLE Technological University","ror":"https://ror.org/04yh52k23","country_code":"IN","type":"education","lineage":["https://openalex.org/I3132975163"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"P. S. Hiremath","raw_affiliation_strings":["Department of Computer Applications, KLE Technological University, Vidayanagr, Hubballi, Karnataka 580031, India"],"raw_orcid":"https://orcid.org/0000-0001-7640-6937","affiliations":[{"raw_affiliation_string":"Department of Computer Applications, KLE Technological University, Vidayanagr, Hubballi, Karnataka 580031, India","institution_ids":["https://openalex.org/I3132975163"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5103166464"],"corresponding_institution_ids":["https://openalex.org/I3132975163"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.02392578,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"38","issue":"04","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7008997797966003},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6817760467529297},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5712385177612305},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.4967039227485657},{"id":"https://openalex.org/keywords/activity-recognition","display_name":"Activity recognition","score":0.49634772539138794},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.48978495597839355},{"id":"https://openalex.org/keywords/support-vector-machine","display_name":"Support vector machine","score":0.41700485348701477}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7008997797966003},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6817760467529297},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5712385177612305},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.4967039227485657},{"id":"https://openalex.org/C121687571","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Activity recognition","level":2,"score":0.49634772539138794},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.48978495597839355},{"id":"https://openalex.org/C12267149","wikidata":"https://www.wikidata.org/wiki/Q282453","display_name":"Support vector machine","level":2,"score":0.41700485348701477}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1142/s0218001424500058","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s0218001424500058","pdf_url":null,"source":{"id":"https://openalex.org/S41486457","display_name":"International Journal of Pattern Recognition and Artificial Intelligence","issn_l":"0218-0014","issn":["0218-0014","1793-6381"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Pattern Recognition and Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.46000000834465027,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1964591373","https://openalex.org/W2095242101","https://openalex.org/W2105101328","https://openalex.org/W2126579184","https://openalex.org/W2133728753","https://openalex.org/W2222512263","https://openalex.org/W2342776425","https://openalex.org/W2507009361","https://openalex.org/W2508429489","https://openalex.org/W2782776028","https://openalex.org/W2948048211","https://openalex.org/W2963155035","https://openalex.org/W2963163009","https://openalex.org/W2963370182","https://openalex.org/W2963524571","https://openalex.org/W2964274041","https://openalex.org/W2966926453","https://openalex.org/W2971387592","https://openalex.org/W2983918066","https://openalex.org/W3035619757","https://openalex.org/W3035697644","https://openalex.org/W3098621856","https://openalex.org/W3107322323","https://openalex.org/W3110854813","https://openalex.org/W3131922516","https://openalex.org/W3195479307","https://openalex.org/W4212917338","https://openalex.org/W4214612132","https://openalex.org/W4214614183","https://openalex.org/W4284965682","https://openalex.org/W4310895557","https://openalex.org/W4312356418","https://openalex.org/W4382467086","https://openalex.org/W4386057769","https://openalex.org/W4386065852"],"related_works":["https://openalex.org/W3195649134","https://openalex.org/W2090763504","https://openalex.org/W2281498195","https://openalex.org/W148178222","https://openalex.org/W2017526120","https://openalex.org/W2104657898","https://openalex.org/W2610664080","https://openalex.org/W1948992892","https://openalex.org/W2188304107","https://openalex.org/W1886884218"],"abstract_inverted_index":{"Herein,":[0],"a":[1,13,83,99,161,194],"novel":[2],"methodology":[3],"is":[4,30,144,164,226,231,273],"proposed":[5,65,121,183,258],"for":[6,49,77,218,266],"real-time":[7],"recognition":[8,78,158],"of":[9,16,79,96,104,180,193,198,237,256],"human":[10,80],"activity":[11],"in":[12,41,82,89,119,160,172,191,235,246,275],"compressed":[14,84,162],"domain":[15,163],"videos":[17,40],"based":[18],"on":[19,249],"motion":[20,33],"vectors":[21,34],"and":[22,28,35,43,72,108,131,134,154,156,200,216,221,269],"self-attention":[23],"mechanism":[24],"using":[25,124,128,147,263],"vision":[26,36],"transformers,":[27],"it":[29,225],"termed":[31],"as":[32,93,137,139],"transformers":[37],"(MVViT).":[38],"The":[39,142,182,253],"MPEG-4":[42,136],"H.264":[44,140],"compression":[45],"formats":[46],"are":[47,117],"considered":[48,61],"this":[50,90],"study.":[51],"Any":[52],"video":[53,70,85,174],"source":[54],"without":[55],"any":[56],"prior":[57],"setup":[58],"could":[59],"be":[60,167],"by":[62,123,213,233],"adopting":[63],"the":[64,68,120,148,157,229,242,247,250,257,270,278],"method":[66,122,185,259],"to":[67,166,169,241],"corresponding":[69],"codecs":[71,268],"camera":[73],"settings.":[74],"Existing":[75],"algorithms":[76],"action":[81],"have":[86],"some":[87],"limitations":[88,116],"regard,":[91],"such":[92],"(i)":[94],"requirement":[95],"keyframes":[97],"at":[98,177],"fixed":[100],"interval,":[101],"(ii)":[102],"usage":[103],"P":[105,130],"frames":[106],"only,":[107],"(iii)":[109],"normally":[110],"support":[111],"single":[112],"codec":[113],"only.":[114],"These":[115],"overcome":[118],"arbitrary":[125],"keyframe":[126],"intervals,":[127],"both":[129],"B":[132],"frames,":[133],"supporting":[135],"well":[138],"codecs.":[141],"experimentation":[143],"carried":[145],"out":[146],"benchmark":[149],"datasets,":[150],"namely,":[151],"UCF101,":[152,219],"HMDB51,":[153],"THUMOS14,":[155,222],"accuracy":[159,212],"found":[165],"comparable":[168],"that":[170,228],"observed":[171,227],"raw":[173],"data":[175],"but":[176],"reduced":[178],"cost":[179],"computation.":[181],"MVViT":[184,264],"has":[186,260],"outperformed":[187],"other":[188],"recent":[189],"methods":[190],"terms":[192],"lesser":[195],"(61.0%)":[196],"number":[197],"parameters":[199],"(63.7%)":[201],"Giga":[202],"Floating":[203],"Point":[204],"Operations":[205],"Per":[206],"Second":[207],"(GFLOPS),":[208],"while":[209],"significantly":[210],"improving":[211],"0.8%,":[214],"5.9%":[215],"16.6%":[217],"HMDB51":[220],"respectively.":[223],"Also,":[224],"speed":[230,244],"increased":[232],"8%":[234],"case":[236],"UCF101":[238],"when":[239],"compared":[240],"highest":[243],"reported":[245],"literature":[248],"same":[251],"dataset.":[252],"ablation":[254],"study":[255],"been":[261],"done":[262,274],"variants":[265],"different":[267],"performance":[271],"analysis":[272],"comparison":[276],"with":[277],"state-of-the-art":[279],"network":[280],"models.":[281]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
