{"id":"https://openalex.org/W4404370818","doi":"https://doi.org/10.1109/tcsvt.2024.3498599","title":"Learning to Diversify for Robust Video Moment Retrieval","display_name":"Learning to Diversify for Robust Video Moment Retrieval","publication_year":2024,"publication_date":"2024-11-14","ids":{"openalex":"https://openalex.org/W4404370818","doi":"https://doi.org/10.1109/tcsvt.2024.3498599"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2024.3498599","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3498599","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5016399027","display_name":"Huilin Ge","orcid":"https://orcid.org/0000-0001-9175-5668"},"institutions":[{"id":"https://openalex.org/I4210096899","display_name":"Jiangsu University of Science and Technology","ror":"https://ror.org/00tyjp878","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210096899"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huilin Ge","raw_affiliation_strings":["College of Ocean, Jiangsu University of Science and Technology, Zhenjiang, China","Jiangsu University of Science and Technology, Zhenjiang, China"],"raw_orcid":"https://orcid.org/0000-0001-9175-5668","affiliations":[{"raw_affiliation_string":"College of Ocean, Jiangsu University of Science and Technology, Zhenjiang, China","institution_ids":["https://openalex.org/I4210096899"]},{"raw_affiliation_string":"Jiangsu University of Science and Technology, Zhenjiang, China","institution_ids":["https://openalex.org/I4210096899"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xiaolei Liu","orcid":"https://orcid.org/0009-0003-2671-5709"},"institutions":[{"id":"https://openalex.org/I4210152380","display_name":"Shenzhen Technology University","ror":"https://ror.org/04qzpec27","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210152380"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaolei Liu","raw_affiliation_strings":["Elevoc Technology Company Ltd., Shenzhen, China","Elevoc Technology Co., Ltd, Shenzhen, China"],"raw_orcid":"https://orcid.org/0009-0003-2671-5709","affiliations":[{"raw_affiliation_string":"Elevoc Technology Company Ltd., Shenzhen, China","institution_ids":["https://openalex.org/I4210152380"]},{"raw_affiliation_string":"Elevoc Technology Co., Ltd, Shenzhen, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zihang Guo","orcid":"https://orcid.org/0009-0004-8357-2254"},"institutions":[{"id":"https://openalex.org/I2722730","display_name":"Inner Mongolia University","ror":"https://ror.org/0106qb496","country_code":"CN","type":"education","lineage":["https://openalex.org/I2722730"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zihang Guo","raw_affiliation_strings":["College of Computer Science, Inner Mongolia University, Hohhot, China","College of Computer Science, Inner Mongolia University, China"],"raw_orcid":"https://orcid.org/0009-0004-8357-2254","affiliations":[{"raw_affiliation_string":"College of Computer Science, Inner Mongolia University, Hohhot, China","institution_ids":["https://openalex.org/I2722730"]},{"raw_affiliation_string":"College of Computer Science, Inner Mongolia University, China","institution_ids":["https://openalex.org/I2722730"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111277843","display_name":"Zhiwen Qiu","orcid":null},"institutions":[{"id":"https://openalex.org/I4210096899","display_name":"Jiangsu University of Science and Technology","ror":"https://ror.org/00tyjp878","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210096899"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiwen Qiu","raw_affiliation_strings":["College of Ocean, Jiangsu University of Science and Technology, Zhenjiang, China","Jiangsu University of Science and Technology, Zhenjiang, China"],"raw_orcid":"https://orcid.org/0009-0008-5112-1757","affiliations":[{"raw_affiliation_string":"College of Ocean, Jiangsu University of Science and Technology, Zhenjiang, China","institution_ids":["https://openalex.org/I4210096899"]},{"raw_affiliation_string":"Jiangsu University of Science and Technology, Zhenjiang, China","institution_ids":["https://openalex.org/I4210096899"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.1870798,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"35","issue":"3","first_page":"2894","last_page":"2904"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6635022163391113},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4590964913368225},{"id":"https://openalex.org/keywords/moment","display_name":"Moment (physics)","score":0.455293208360672},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.36061549186706543},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.33624935150146484}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6635022163391113},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4590964913368225},{"id":"https://openalex.org/C179254644","wikidata":"https://www.wikidata.org/wiki/Q13222844","display_name":"Moment (physics)","level":2,"score":0.455293208360672},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.36061549186706543},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.33624935150146484},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C74650414","wikidata":"https://www.wikidata.org/wiki/Q11397","display_name":"Classical mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2024.3498599","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3498599","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1383338027","display_name":null,"funder_award_id":"62206137","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4236698393","display_name":null,"funder_award_id":"NJYT23105","funder_id":"https://openalex.org/F4320327830","funder_display_name":"Research Program of Science and Technology at Universities of Inner Mongolia Autonomous Region"},{"id":"https://openalex.org/G4856500953","display_name":null,"funder_award_id":"22JCQNJC00940","funder_id":"https://openalex.org/F4320323993","funder_display_name":"Natural Science Foundation of Tianjin City"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320323993","display_name":"Natural Science Foundation of Tianjin City","ror":null},{"id":"https://openalex.org/F4320327830","display_name":"Research Program of Science and Technology at Universities of Inner Mongolia Autonomous Region","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":53,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W2102605133","https://openalex.org/W2111078031","https://openalex.org/W2739107216","https://openalex.org/W2798354744","https://openalex.org/W2808647806","https://openalex.org/W2885013662","https://openalex.org/W2890502146","https://openalex.org/W2897628926","https://openalex.org/W2903901502","https://openalex.org/W2904291752","https://openalex.org/W2963017553","https://openalex.org/W2963247196","https://openalex.org/W2963393391","https://openalex.org/W2963524571","https://openalex.org/W2963735856","https://openalex.org/W2963916161","https://openalex.org/W2964089981","https://openalex.org/W2973131617","https://openalex.org/W2975813532","https://openalex.org/W2997429269","https://openalex.org/W3025323587","https://openalex.org/W3034464851","https://openalex.org/W3034743747","https://openalex.org/W3035339529","https://openalex.org/W3035356601","https://openalex.org/W3043840704","https://openalex.org/W3096935578","https://openalex.org/W3120889656","https://openalex.org/W3145807616","https://openalex.org/W3172655693","https://openalex.org/W3174364033","https://openalex.org/W3175817778","https://openalex.org/W3176201273","https://openalex.org/W3196930868","https://openalex.org/W3199096350","https://openalex.org/W3199858703","https://openalex.org/W3211953751","https://openalex.org/W4226382328","https://openalex.org/W4317796373","https://openalex.org/W4321780110","https://openalex.org/W4385268901","https://openalex.org/W4385825476","https://openalex.org/W4389890968","https://openalex.org/W4391528322","https://openalex.org/W4394862854","https://openalex.org/W6682864246","https://openalex.org/W6761423549","https://openalex.org/W6767457941","https://openalex.org/W6768851824","https://openalex.org/W6791353385","https://openalex.org/W6798195429","https://openalex.org/W6798784433"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"In":[0,124],"this":[1,125],"paper,":[2,126],"we":[3,127,156],"focus":[4,22],"on":[5,23,214],"diversifying":[6],"the":[7,31,37,41,51,57,85,89,101,110,138,142,150,167,173,177,183,192,201,221,234,248],"Video":[8],"Moment":[9],"Retrieval":[10],"(VMR)":[11],"model":[12,86,139,240],"into":[13,50],"more":[14],"scenes.":[15,71,93,229],"Most":[16],"existing":[17],"video":[18,25,132,174,216,237],"moment":[19,133,217,238],"retrieval":[20,134,218,239],"methods":[21,96],"aligning":[24],"moments":[26],"and":[27,152,171,185,195,223,251],"queries":[28,102],"by":[29,146,246],"capturing":[30,148,247],"cross-modal":[32,151,161,250],"relationship,":[33],"which":[34,83],"largely":[35],"ignores":[36],"cross-instance":[38,53,153,252],"relationship":[39,55],"behind":[40],"representation":[42],"learning.":[43,206],"Thus,":[44],"they":[45],"may":[46],"easily":[47],"get":[48],"trouble":[49],"inaccurate":[52],"contrastive":[54,205],"in":[56,99,204],"training":[58,222],"process:":[59],"1)":[60],"Existing":[61,95],"approaches":[62],"can":[63,241],"hardly":[64],"identify":[65],"similar":[66,117],"semantic":[67,122],"content":[68],"across":[69],"different":[70,121,228],"They":[72,106],"incorrectly":[73],"treat":[74],"such":[75],"instances":[76],"as":[77],"negative":[78,112,187,193],"samples":[79,113,188],"(termed":[80],"faulty":[81,184],"negatives),":[82],"forces":[84],"to":[87,108,116,200],"learn":[88],"features":[90,145],"from":[91,140,191,227],"query-irrelevant":[92,143],"2)":[94],"perform":[97],"unsatisfactorily":[98],"locating":[100],"with":[103],"subtle":[104],"differences.":[105],"neglect":[107],"mine":[109],"hard":[111,186],"that":[114,136,164,233],"belong":[115],"scenes":[118],"but":[119],"have":[120],"content.":[123],"propose":[128],"a":[129,159],"novel":[130],"robust":[131,236],"method":[135],"prevents":[137],"overfitting":[141],"scene":[144,169],"accurately":[147],"both":[149],"relationships.":[154,253],"Specifically,":[155],"first":[157],"develop":[158],"scene-independent":[160],"reasoning":[162],"module":[163],"filters":[165],"out":[166],"redundant":[168],"contents":[170],"infers":[172],"semantics":[175],"under":[176],"guidance":[178],"of":[179],"query":[180],"information.":[181],"Then,":[182],"are":[189,226],"mined":[190],"ones":[194],"calibrated":[196],"for":[197],"their":[198],"contribution":[199],"overall":[202],"loss":[203],"We":[207],"validate":[208],"our":[209],"contributions":[210],"through":[211],"extensive":[212],"experiments":[213],"cross-scene":[215],"settings,":[219],"where":[220],"test":[224],"data":[225],"Experimental":[230],"results":[231],"show":[232],"proposed":[235],"effectively":[242],"retrieve":[243],"target":[244],"videos":[245],"real":[249]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
