{"id":"https://openalex.org/W4283816211","doi":"https://doi.org/10.1109/ncc55593.2022.9806811","title":"Unsupervised Learning of Spatio-Temporal Representation with Multi-Task Learning for Video Retrieval","display_name":"Unsupervised Learning of Spatio-Temporal Representation with Multi-Task Learning for Video Retrieval","publication_year":2022,"publication_date":"2022-05-24","ids":{"openalex":"https://openalex.org/W4283816211","doi":"https://doi.org/10.1109/ncc55593.2022.9806811"},"language":"en","primary_location":{"id":"doi:10.1109/ncc55593.2022.9806811","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ncc55593.2022.9806811","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 National Conference on Communications (NCC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5067767024","display_name":"Vidit Kumar","orcid":"https://orcid.org/0000-0002-6157-7562"},"institutions":[{"id":"https://openalex.org/I60054993","display_name":"Graphic Era University","ror":"https://ror.org/03wqgqd89","country_code":"IN","type":"education","lineage":["https://openalex.org/I60054993"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Vidit Kumar","raw_affiliation_strings":["Graphic Era deemed to be university,Department of Computer Science and Engineering,Dehradun,India","Department of Computer Science and Engineering, Graphic Era deemed to be university, Dehradun, India"],"affiliations":[{"raw_affiliation_string":"Graphic Era deemed to be university,Department of Computer Science and Engineering,Dehradun,India","institution_ids":["https://openalex.org/I60054993"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, Graphic Era deemed to be university, Dehradun, India","institution_ids":["https://openalex.org/I60054993"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5067767024"],"corresponding_institution_ids":["https://openalex.org/I60054993"],"apc_list":null,"apc_paid":null,"fwci":0.5033,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.62776049,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"33","issue":null,"first_page":"118","last_page":"123"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9901000261306763,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8483005166053772},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7127346396446228},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.6005450487136841},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5946271419525146},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5891649723052979},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.5699318647384644},{"id":"https://openalex.org/keywords/multi-task-learning","display_name":"Multi-task learning","score":0.515209972858429},{"id":"https://openalex.org/keywords/generalizability-theory","display_name":"Generalizability theory","score":0.515170693397522},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.501492977142334},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.44650059938430786},{"id":"https://openalex.org/keywords/pascal","display_name":"Pascal (unit)","score":0.44323891401290894},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.4362082779407501},{"id":"https://openalex.org/keywords/task-analysis","display_name":"Task analysis","score":0.4324226379394531},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.42044204473495483},{"id":"https://openalex.org/keywords/unsupervised-learning","display_name":"Unsupervised learning","score":0.4172019362449646},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3616619408130646}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8483005166053772},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7127346396446228},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.6005450487136841},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5946271419525146},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5891649723052979},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.5699318647384644},{"id":"https://openalex.org/C28006648","wikidata":"https://www.wikidata.org/wiki/Q6934509","display_name":"Multi-task learning","level":3,"score":0.515209972858429},{"id":"https://openalex.org/C27158222","wikidata":"https://www.wikidata.org/wiki/Q5532422","display_name":"Generalizability theory","level":2,"score":0.515170693397522},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.501492977142334},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.44650059938430786},{"id":"https://openalex.org/C75608658","wikidata":"https://www.wikidata.org/wiki/Q44395","display_name":"Pascal (unit)","level":2,"score":0.44323891401290894},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.4362082779407501},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.4324226379394531},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.42044204473495483},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.4172019362449646},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3616619408130646},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ncc55593.2022.9806811","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ncc55593.2022.9806811","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 National Conference on Communications (NCC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.47999998927116394,"id":"https://metadata.un.org/sdg/10"},{"display_name":"Peace, Justice and strong institutions","score":0.4699999988079071,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W24089286","https://openalex.org/W1522734439","https://openalex.org/W1966485246","https://openalex.org/W1966582457","https://openalex.org/W1986482242","https://openalex.org/W2016053056","https://openalex.org/W2126579184","https://openalex.org/W2156303437","https://openalex.org/W2209763203","https://openalex.org/W2321533354","https://openalex.org/W2487442924","https://openalex.org/W2520610372","https://openalex.org/W2550462002","https://openalex.org/W2561238782","https://openalex.org/W2583662698","https://openalex.org/W2614042628","https://openalex.org/W2729738218","https://openalex.org/W2785325870","https://openalex.org/W2786585376","https://openalex.org/W2792007612","https://openalex.org/W2883451034","https://openalex.org/W2900790473","https://openalex.org/W2926645869","https://openalex.org/W2947803325","https://openalex.org/W2948242301","https://openalex.org/W2963155035","https://openalex.org/W2963814513","https://openalex.org/W2964037671","https://openalex.org/W2964152890","https://openalex.org/W2997907976","https://openalex.org/W3004085219","https://openalex.org/W3005680577","https://openalex.org/W3013743800","https://openalex.org/W3034215340","https://openalex.org/W3099677434","https://openalex.org/W3110190397","https://openalex.org/W3195119650","https://openalex.org/W3210278546","https://openalex.org/W3217250905","https://openalex.org/W4220757241","https://openalex.org/W4223965272","https://openalex.org/W4224315854","https://openalex.org/W4286768630","https://openalex.org/W4383820647","https://openalex.org/W6600983433","https://openalex.org/W6682864246","https://openalex.org/W6700872662","https://openalex.org/W6730179637","https://openalex.org/W6747899497","https://openalex.org/W6760653604","https://openalex.org/W6840322078","https://openalex.org/W6854322803"],"related_works":["https://openalex.org/W2237537322","https://openalex.org/W2950678851","https://openalex.org/W4301248618","https://openalex.org/W3174759195","https://openalex.org/W3167013339","https://openalex.org/W4287121366","https://openalex.org/W2165343651","https://openalex.org/W2343790552","https://openalex.org/W2242427765","https://openalex.org/W2075830955"],"abstract_inverted_index":{"The":[0,134],"majority":[1],"of":[2,19,54,80,93],"videos":[3],"in":[4],"the":[5,17,33,52,69,73,91,114,142,150,160,164],"internet":[6],"lack":[7],"semantic":[8],"tags,":[9],"which":[10,30,89,178],"complicates":[11],"indexing":[12],"and":[13,15,109,131,172],"retrieval,":[14],"mandates":[16],"adoption":[18],"critical":[20],"content-based":[21],"analysis":[22],"approaches.":[23],"Earlier":[24],"works":[25],"relies":[26],"on":[27,85],"hand-crafted":[28],"features,":[29],"hardly":[31],"represents":[32],"temporal":[34],"dynamics.":[35],"Later,":[36],"video":[37,63,106],"representations":[38],"learned":[39,143],"through":[40],"supervised":[41],"deep":[42],"learning":[43,65,92,108],"methods":[44,61,82],"were":[45],"found":[46],"to":[47,71,99,104,140],"be":[48],"effective,":[49],"but":[50],"at":[51],"cost":[53],"large":[55],"labeled":[56],"dataset.":[57],"Recently,":[58],"self-supervised":[59],"based":[60,84],"for":[62,146,163],"representation":[64,107],"are":[66,83],"proposed":[67],"within":[68],"community":[70],"harness":[72],"freely":[74],"available":[75],"unlabeled":[76],"videos.":[77],"However,":[78],"most":[79],"these":[81],"single":[86],"pretext":[87,102,120],"task,":[88,149],"limits":[90],"generalizable":[94],"representations.":[95],"This":[96],"work":[97],"proposes":[98],"leverage":[100],"multiple":[101,119],"tasks":[103,121],"enhance":[105],"generalizability.":[110],"We":[111,158],"jointly":[112],"optimized":[113],"C3D":[115],"network":[116,151],"by":[117],"using":[118],"such":[122],"as:":[123],"rotation":[124],"prediction,":[125,127],"speed":[126],"time":[128],"direction":[129],"prediction":[130],"instance":[132],"discrimination.":[133],"nearest":[135],"neighbour":[136],"task":[137],"is":[138,152,179],"used":[139],"analyze":[141],"features.":[144],"And":[145],"action":[147,175],"recognition":[148,176],"further":[153],"fine-tuned":[154,174],"with":[155],"pretrained":[156],"weights.":[157],"use":[159],"UCF-101":[161],"dataset":[162],"experiments":[165],"and,":[166],"achieves":[167],"28.45%":[168],"retrieval":[169],"accuracy":[170],"(Recall@l),":[171],"68.85%":[173],"accuracy,":[177],"better":[180],"than":[181],"state-of-the-arts.":[182]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
