{"id":"https://openalex.org/W4391590980","doi":"https://doi.org/10.48550/arxiv.2402.02335","title":"Video Editing for Video Retrieval","display_name":"Video Editing for Video Retrieval","publication_year":2024,"publication_date":"2024-02-04","ids":{"openalex":"https://openalex.org/W4391590980","doi":"https://doi.org/10.48550/arxiv.2402.02335"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2402.02335","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.02335","pdf_url":"https://arxiv.org/pdf/2402.02335","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2402.02335","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100619754","display_name":"Bin Zhu","orcid":"https://orcid.org/0000-0002-5478-1426"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhu, Bin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029289131","display_name":"Kevin C. Flanagan","orcid":"https://orcid.org/0009-0005-3364-1677"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Flanagan, Kevin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050356861","display_name":"Adriano Fragomeni","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Fragomeni, Adriano","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049284007","display_name":"Michael Wray","orcid":"https://orcid.org/0000-0001-5918-9029"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wray, Michael","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5003103666","display_name":"Dima Damen","orcid":"https://orcid.org/0000-0001-8804-6238"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Damen, Dima","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100619754"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9415000081062317,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6474456191062927},{"id":"https://openalex.org/keywords/video-retrieval","display_name":"Video retrieval","score":0.6037849187850952},{"id":"https://openalex.org/keywords/non-linear-editing-system","display_name":"Non-linear editing system","score":0.4849269688129425},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4555763304233551},{"id":"https://openalex.org/keywords/video-editing","display_name":"Video editing","score":0.4265483319759369},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.42054125666618347},{"id":"https://openalex.org/keywords/video-capture","display_name":"Video capture","score":0.38271647691726685},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.37084686756134033},{"id":"https://openalex.org/keywords/smacker-video","display_name":"Smacker video","score":0.33731716871261597},{"id":"https://openalex.org/keywords/video-processing","display_name":"Video processing","score":0.32882237434387207},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.26318418979644775}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6474456191062927},{"id":"https://openalex.org/C2983174267","wikidata":"https://www.wikidata.org/wiki/Q3775098","display_name":"Video retrieval","level":2,"score":0.6037849187850952},{"id":"https://openalex.org/C137402728","wikidata":"https://www.wikidata.org/wiki/Q1330119","display_name":"Non-linear editing system","level":5,"score":0.4849269688129425},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4555763304233551},{"id":"https://openalex.org/C2780310081","wikidata":"https://www.wikidata.org/wiki/Q1154312","display_name":"Video editing","level":2,"score":0.4265483319759369},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.42054125666618347},{"id":"https://openalex.org/C151211776","wikidata":"https://www.wikidata.org/wiki/Q2778015","display_name":"Video capture","level":3,"score":0.38271647691726685},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.37084686756134033},{"id":"https://openalex.org/C108803254","wikidata":"https://www.wikidata.org/wiki/Q857512","display_name":"Smacker video","level":4,"score":0.33731716871261597},{"id":"https://openalex.org/C65483669","wikidata":"https://www.wikidata.org/wiki/Q3536669","display_name":"Video processing","level":2,"score":0.32882237434387207},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.26318418979644775}],"mesh":[],"locations_count":3,"locations":[{"id":"pmh:oai:arXiv.org:2402.02335","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.02335","pdf_url":"https://arxiv.org/pdf/2402.02335","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:ink.library.smu.edu.sg:sis_research-11235","is_oa":true,"landing_page_url":"https://ink.library.smu.edu.sg/sis_research/10235","pdf_url":null,"source":{"id":"https://openalex.org/S4306401925","display_name":"Singapore Management University Institutional Knowledge (InK) (Singapore Management University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I79891267","host_organization_name":"Singapore Management University","host_organization_lineage":["https://openalex.org/I79891267"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"https://doi.org/10.1007/978-3-031-92591-7_15","raw_type":"Conference Proceeding Article"},{"id":"doi:10.48550/arxiv.2402.02335","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2402.02335","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2402.02335","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.02335","pdf_url":"https://arxiv.org/pdf/2402.02335","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G397022313","display_name":"UMPIRE: United Model for the Perception of Interactions in visuoauditory REcognition","funder_award_id":"EP/T004991/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G49701852","display_name":null,"funder_award_id":"EP/S022937/1","funder_id":"https://openalex.org/F4320314731","funder_display_name":"UK Research and Innovation"},{"id":"https://openalex.org/G5003611146","display_name":"Visual AI: An Open World Interpretable Visual Transformer","funder_award_id":"EP/T028572/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G5715794163","display_name":null,"funder_award_id":"EP/S022937/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320314731","display_name":"UK Research and Innovation","ror":"https://ror.org/001aqnf71"},{"id":"https://openalex.org/F4320320360","display_name":"University of Bristol","ror":"https://ror.org/0524sp257"},{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4391590980.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2787002358","https://openalex.org/W2373715384","https://openalex.org/W2188382975","https://openalex.org/W1481894793","https://openalex.org/W595697318","https://openalex.org/W2318748556","https://openalex.org/W2101636524","https://openalex.org/W2070078868","https://openalex.org/W2601353656","https://openalex.org/W2379857410"],"abstract_inverted_index":{"Though":[0],"pre-training":[1],"vision-language":[2],"models":[3],"have":[4],"demonstrated":[5],"significant":[6],"benefits":[7],"in":[8,59,105],"boosting":[9],"video-text":[10,52],"retrieval":[11,67,85,140,149,160,173,182],"performance":[12,129,174],"from":[13,57,123],"large-scale":[14],"web":[15],"videos,":[16],"fine-tuning":[17],"still":[18],"plays":[19],"a":[20,60,66,70],"critical":[21],"role":[22],"with":[23,27],"manually":[24],"annotated":[25],"clips":[26,56,104,170,177],"start":[28],"and":[29,136,153,164],"end":[30],"times,":[31],"which":[32],"requires":[33],"considerable":[34],"human":[35],"effort.":[36],"To":[37],"address":[38],"this":[39],"issue,":[40],"we":[41],"explore":[42],"an":[43],"alternative":[44],"cheaper":[45],"source":[46],"of":[47],"annotations,":[48],"single":[49],"timestamps,":[50],"for":[51,92],"retrieval.":[53],"We":[54,142],"initialise":[55],"timestamps":[58],"heuristic":[61],"way":[62],"to":[63,77,83,101,138],"warm":[64],"up":[65],"model.":[68],"Then":[69],"video":[71,93,159],"clip":[72,94],"editing":[73],"method":[74,132],"is":[75,90,99,133],"proposed":[76],"refine":[78],"the":[79,103,106,110,115,124,127,180],"initial":[80,176],"rough":[81],"boundaries":[82],"improve":[84,172],"performance.":[86],"A":[87],"student-teacher":[88],"network":[89],"introduced":[91],"editing.":[95],"The":[96,118],"teacher":[97,119],"model":[98,112,134],"employed":[100],"edit":[102],"training":[107],"set":[108],"whereas":[109],"student":[111],"trains":[113],"on":[114,146,157],"edited":[116,169],"clips.":[117],"weights":[120],"are":[121],"updated":[122],"student's":[125,128],"after":[126],"increases.":[130],"Our":[131],"agnostic":[135],"applicable":[137],"any":[139],"models.":[141,183],"conduct":[143],"experiments":[144],"based":[145],"three":[147,158,181],"state-of-the-art":[148],"models,":[150],"COOT,":[151],"VideoCLIP":[152],"CLIP4Clip.":[154],"Experiments":[155],"conducted":[156],"datasets,":[161],"YouCook2,":[162],"DiDeMo":[163],"ActivityNet-Captions":[165],"show":[166],"that":[167],"our":[168],"consistently":[171],"over":[175],"across":[178],"all":[179]},"counts_by_year":[],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
