{"id":"https://openalex.org/W7108325609","doi":"https://doi.org/10.1145/3767695.3769480","title":"A Flexible and Scalable Framework for Video Moment Search","display_name":"A Flexible and Scalable Framework for Video Moment Search","publication_year":2025,"publication_date":"2025-12-03","ids":{"openalex":"https://openalex.org/W7108325609","doi":"https://doi.org/10.1145/3767695.3769480"},"language":"en","primary_location":{"id":"doi:10.1145/3767695.3769480","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3767695.3769480","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Annual International ACM SIGIR Conference on Research and Development in Information Retrieval in the Asia Pacific Region","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3767695.3769480","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Chongzhi Zhang","orcid":"https://orcid.org/0000-0003-1378-322X"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Chongzhi Zhang","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0003-1378-322X","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xizhou Zhu","orcid":"https://orcid.org/0009-0004-5262-9713"},"institutions":[{"id":"https://openalex.org/I4210128910","display_name":"Group Sense (China)","ror":"https://ror.org/036wd5777","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210128910"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xizhou Zhu","raw_affiliation_strings":["SenseTime Research, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0004-5262-9713","affiliations":[{"raw_affiliation_string":"SenseTime Research, Beijing, China","institution_ids":["https://openalex.org/I4210128910"]}]},{"author_position":"last","author":{"id":null,"display_name":"Aixin Sun","orcid":"https://orcid.org/0000-0003-0764-4258"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Aixin Sun","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"raw_orcid":"https://orcid.org/0000-0003-0764-4258","affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I172675005"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.57413906,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"313","last_page":"324"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7836999893188477,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.7836999893188477,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.12370000034570694,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.05169999971985817,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.7706999778747559},{"id":"https://openalex.org/keywords/timestamp","display_name":"Timestamp","score":0.7401000261306763},{"id":"https://openalex.org/keywords/moment","display_name":"Moment (physics)","score":0.6924999952316284},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.5142999887466431},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5138000249862671},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4587000012397766}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8166000247001648},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.7706999778747559},{"id":"https://openalex.org/C113954288","wikidata":"https://www.wikidata.org/wiki/Q186885","display_name":"Timestamp","level":2,"score":0.7401000261306763},{"id":"https://openalex.org/C179254644","wikidata":"https://www.wikidata.org/wiki/Q13222844","display_name":"Moment (physics)","level":2,"score":0.6924999952316284},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.5142999887466431},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5138000249862671},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4587000012397766},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.45179998874664307},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.38089999556541443},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.36559998989105225},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.35589998960494995},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.35530000925064087},{"id":"https://openalex.org/C113238511","wikidata":"https://www.wikidata.org/wiki/Q1071612","display_name":"k-nearest neighbors algorithm","level":2,"score":0.3246999979019165},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2903999984264374},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.2800000011920929},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.2687000036239624},{"id":"https://openalex.org/C116738811","wikidata":"https://www.wikidata.org/wiki/Q608751","display_name":"Nearest neighbor search","level":2,"score":0.2596000134944916}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3767695.3769480","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3767695.3769480","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Annual International ACM SIGIR Conference on Research and Development in Information Retrieval in the Asia Pacific Region","raw_type":"proceedings-article"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/205142","is_oa":false,"landing_page_url":"https://hdl.handle.net/10356/205142","pdf_url":null,"source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":null,"raw_type":"Conference Paper"}],"best_oa_location":{"id":"doi:10.1145/3767695.3769480","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3767695.3769480","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 Annual International ACM SIGIR Conference on Research and Development in Information Retrieval in the Asia Pacific Region","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W1993924397","https://openalex.org/W2053448995","https://openalex.org/W2111078031","https://openalex.org/W2111993661","https://openalex.org/W2124509324","https://openalex.org/W2143331230","https://openalex.org/W2147717514","https://openalex.org/W2337252826","https://openalex.org/W2421218773","https://openalex.org/W2808399042","https://openalex.org/W2894280539","https://openalex.org/W2963017553","https://openalex.org/W2963469388","https://openalex.org/W2963524571","https://openalex.org/W2963916161","https://openalex.org/W2964089981","https://openalex.org/W2997429269","https://openalex.org/W3021397474","https://openalex.org/W3034743747","https://openalex.org/W3035635319","https://openalex.org/W3093174808","https://openalex.org/W3099700870","https://openalex.org/W3104862079","https://openalex.org/W3105232955","https://openalex.org/W3155721152","https://openalex.org/W3156636935","https://openalex.org/W3172119680","https://openalex.org/W3174364033","https://openalex.org/W3175402857","https://openalex.org/W3176763654","https://openalex.org/W3200217958","https://openalex.org/W3203711169","https://openalex.org/W3211772574","https://openalex.org/W3216765867","https://openalex.org/W4224933373","https://openalex.org/W4243333943","https://openalex.org/W4252076394","https://openalex.org/W4285606530","https://openalex.org/W4288723191","https://openalex.org/W4372260310","https://openalex.org/W4385571423","https://openalex.org/W4386076010","https://openalex.org/W4390871893","https://openalex.org/W4390872247","https://openalex.org/W4390873373","https://openalex.org/W4390962868","https://openalex.org/W4402704561"],"related_works":[],"abstract_inverted_index":{"Video":[0,74],"moment":[1,96,148],"search,":[2],"the":[3,84,164,169],"process":[4,86],"of":[5,56,60,116,163],"finding":[6],"relevant":[7],"moments":[8,57],"in":[9,62,182],"a":[10,15,28,46,53,67,70,130,151],"video":[11,117],"corpus":[12],"to":[13,65,134,158,196],"match":[14,66],"user's":[16],"query,":[17,69],"is":[18,156],"crucial":[19],"for":[20,51,193,203],"various":[21],"applications.":[22,205],"Existing":[23],"solutions,":[24],"however,":[25],"often":[26],"assume":[27],"single":[29],"perfect":[30],"matching":[31],"moment,":[32],"struggle":[33],"with":[34,40,98,107,179],"inefficient":[35],"inference,":[36],"and":[37,48,95,125,153,160,185],"have":[38],"limitations":[39],"hour-long":[41],"videos.":[42],"This":[43],"paper":[44],"introduces":[45],"flexible":[47,189],"scalable":[49,120],"framework":[50,175],"retrieving":[52],"ranked":[54],"list":[55],"from":[58],"collection":[59],"videos":[61,101],"any":[63],"length":[64],"text":[68],"task":[71],"termed":[72],"Ranked":[73],"Moment":[75],"Retrieval":[76],"(RVMR).":[77],"Our":[78],"framework,":[79],"called":[80],"Segment-Proposal-Ranking":[81],"(SPR),":[82],"simplifies":[83],"search":[85],"into":[87,104,129,146],"three":[88],"independent":[89,194],"stages:":[90],"segment":[91],"retrieval,":[92,122],"proposal":[93],"generation,":[94],"refinement":[97,152],"re-ranking.":[99],"Specifically,":[100],"are":[102,127,143,207],"divided":[103],"equal-length":[105],"segments":[106,124,142],"precomputed":[108],"embeddings":[109],"indexed":[110],"offline,":[111],"allowing":[112],"efficient":[113],"retrieval":[114],"regardless":[115],"length.":[118],"For":[119],"online":[121],"both":[123],"queries":[126],"projected":[128],"shared":[131],"feature":[132],"space":[133],"enable":[135],"approximate":[136],"nearest":[137],"neighbor":[138],"(ANN)":[139],"search.":[140],"Retrieved":[141],"then":[144],"merged":[145],"coarse-grained":[147,165],"proposals.":[149,166],"Then":[150],"re-ranking":[154],"module":[155],"designed":[157],"reorder":[159],"adjust":[161],"timestamps":[162],"Evaluations":[167],"on":[168],"TVR-Ranking":[170],"dataset":[171],"demonstrate":[172],"that":[173],"our":[174],"achieves":[176],"state-of-the-art":[177],"performance":[178],"significant":[180],"reductions":[181],"computational":[183],"cost":[184],"processing":[186],"time.":[187],"The":[188],"design":[190],"also":[191],"allows":[192],"improvements":[195],"each":[197],"stage,":[198],"making":[199],"SPR":[200],"highly":[201],"adaptable":[202],"large-scale":[204],"Codes":[206],"available":[208],"at":[209],"https://github.com/Ranking-VMR/SPR":[210]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-12-03T00:00:00"}
