{"id":"https://openalex.org/W4396612943","doi":"https://doi.org/10.1145/3663571","title":"Exploiting Instance-level Relationships in Weakly Supervised Text-to-Video Retrieval","display_name":"Exploiting Instance-level Relationships in Weakly Supervised Text-to-Video Retrieval","publication_year":2024,"publication_date":"2024-05-03","ids":{"openalex":"https://openalex.org/W4396612943","doi":"https://doi.org/10.1145/3663571"},"language":"en","primary_location":{"id":"doi:10.1145/3663571","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3663571","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3663571","source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3663571","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073775343","display_name":"Shukang Yin","orcid":"https://orcid.org/0000-0002-5356-1800"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shukang Yin","raw_affiliation_strings":["School of Data Science, University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0002-5356-1800","affiliations":[{"raw_affiliation_string":"School of Data Science, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090369859","display_name":"Sirui Zhao","orcid":"https://orcid.org/0000-0001-8103-0321"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]},{"id":"https://openalex.org/I1297991670","display_name":"Southwest University of Science and Technology","ror":"https://ror.org/04d996474","country_code":"CN","type":"education","lineage":["https://openalex.org/I1297991670"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Sirui Zhao","raw_affiliation_strings":["School of Computer Science and Technology, University of Science and Technology of China, Hefei, China and School of Computer Science and Technology, Southwest University of Science and Technology, Mianyang, China"],"raw_orcid":"https://orcid.org/0000-0001-8103-0321","affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, University of Science and Technology of China, Hefei, China and School of Computer Science and Technology, Southwest University of Science and Technology, Mianyang, China","institution_ids":["https://openalex.org/I1297991670","https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100446071","display_name":"Hao Wang","orcid":"https://orcid.org/0000-0001-9921-2078"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Wang","raw_affiliation_strings":["School of Data Science, University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0001-9921-2078","affiliations":[{"raw_affiliation_string":"School of Data Science, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025292786","display_name":"Tong Xu","orcid":"https://orcid.org/0000-0003-4246-5386"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tong Xu","raw_affiliation_strings":["School of Data Science, University of Science and Technology of China, Hefei, China"],"raw_orcid":"https://orcid.org/0000-0003-4246-5386","affiliations":[{"raw_affiliation_string":"School of Data Science, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5048237545","display_name":"Enhong Chen","orcid":"https://orcid.org/0000-0002-4835-4102"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Enhong Chen","raw_affiliation_strings":["School of Data Science, University of Science and Technology of China, Hefei China"],"raw_orcid":"https://orcid.org/0000-0002-4835-4102","affiliations":[{"raw_affiliation_string":"School of Data Science, University of Science and Technology of China, Hefei China","institution_ids":["https://openalex.org/I126520041"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.0936,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.77517539,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"20","issue":"10","first_page":"1","last_page":"21"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8878614902496338},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.49288463592529297},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3936781883239746}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8878614902496338},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.49288463592529297},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3936781883239746}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3663571","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3663571","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3663571","source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3663571","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3663571","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3663571","source":{"id":"https://openalex.org/S19610489","display_name":"ACM Transactions on Multimedia Computing Communications and Applications","issn_l":"1551-6857","issn":["1551-6857","1551-6865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Multimedia Computing, Communications, and Applications","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6302681207","display_name":null,"funder_award_id":"62222213, U22B2059, U23A20319, 62072423, 61727809","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4396612943.pdf"},"referenced_works_count":87,"referenced_works":["https://openalex.org/W1945608308","https://openalex.org/W1975517671","https://openalex.org/W1994488211","https://openalex.org/W2009070933","https://openalex.org/W2036424610","https://openalex.org/W2074466695","https://openalex.org/W2074992691","https://openalex.org/W2086199304","https://openalex.org/W2096733369","https://openalex.org/W2109325554","https://openalex.org/W2110045159","https://openalex.org/W2110119381","https://openalex.org/W2133288557","https://openalex.org/W2133564696","https://openalex.org/W2154318594","https://openalex.org/W2163474322","https://openalex.org/W2168749806","https://openalex.org/W2194775991","https://openalex.org/W2222512263","https://openalex.org/W2425121537","https://openalex.org/W2549139847","https://openalex.org/W2560886373","https://openalex.org/W2593390416","https://openalex.org/W2753311918","https://openalex.org/W2805072236","https://openalex.org/W2949611920","https://openalex.org/W2963017553","https://openalex.org/W2963524571","https://openalex.org/W2963916161","https://openalex.org/W2964089981","https://openalex.org/W2964420626","https://openalex.org/W2965373594","https://openalex.org/W2965458216","https://openalex.org/W2975813532","https://openalex.org/W2979933490","https://openalex.org/W2981716253","https://openalex.org/W2984008963","https://openalex.org/W2997429269","https://openalex.org/W3016970897","https://openalex.org/W3028831795","https://openalex.org/W3035339529","https://openalex.org/W3035356601","https://openalex.org/W3043840704","https://openalex.org/W3092820619","https://openalex.org/W3099181346","https://openalex.org/W3102887392","https://openalex.org/W3103934428","https://openalex.org/W3104862079","https://openalex.org/W3105232955","https://openalex.org/W3108328693","https://openalex.org/W3127686331","https://openalex.org/W3130796238","https://openalex.org/W3155721152","https://openalex.org/W3168433561","https://openalex.org/W3168640669","https://openalex.org/W3176471072","https://openalex.org/W3176719058","https://openalex.org/W3204588463","https://openalex.org/W3207042189","https://openalex.org/W4205811793","https://openalex.org/W4211053420","https://openalex.org/W4212848270","https://openalex.org/W4214582399","https://openalex.org/W4225935504","https://openalex.org/W4249142012","https://openalex.org/W4281488254","https://openalex.org/W4285606530","https://openalex.org/W4293083879","https://openalex.org/W4293567872","https://openalex.org/W4293861233","https://openalex.org/W4295135076","https://openalex.org/W4297734170","https://openalex.org/W4297808394","https://openalex.org/W4304142044","https://openalex.org/W4309764765","https://openalex.org/W4315705014","https://openalex.org/W4385245566","https://openalex.org/W4386232130","https://openalex.org/W4387947626","https://openalex.org/W4393259344","https://openalex.org/W4404356490","https://openalex.org/W6676748427","https://openalex.org/W6683033130","https://openalex.org/W6739901393","https://openalex.org/W6763146608","https://openalex.org/W6811139122","https://openalex.org/W6852989508"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"Text-to-Video":[0],"Retrieval":[1,56],"is":[2,58,227],"a":[3,14,28,49,70,88,103,175,191],"typical":[4],"cross-modal":[5,197],"retrieval":[6,145,164],"task":[7,51,86],"that":[8,65,223],"has":[9],"been":[10],"studied":[11],"extensively":[12],"under":[13],"conventional":[15],"supervised":[16,30],"setting.":[17,233],"Recently,":[18],"some":[19],"works":[20],"have":[21,118,212],"sought":[22],"to":[23,27,62,69,156,162,195],"extend":[24],"the":[25,75,85,127,133,158,187,214,230],"problem":[26],"weakly":[29],"formulation,":[31],"which":[32,60,136],"can":[33],"be":[34,237],"more":[35,41],"consistent":[36],"with":[37,110],"real-life":[38],"scenarios":[39],"and":[40,108,130,142,182,189,219],"efficient":[42],"in":[43,139,151,186,229],"annotation":[44],"cost.":[45],"In":[46],"this":[47,149,152,168],"context,":[48],"new":[50,176,192],"called":[52],"Partially":[53],"Relevant":[54],"Video":[55],"(PRVR)":[57],"proposed,":[59],"aims":[61],"retrieve":[63],"videos":[64,76],"are":[66],"partially":[67],"relevant":[68,82],"given":[71],"textual":[72],"query,":[73],"i.e.,":[74],"containing":[77],"at":[78,240],"least":[79],"one":[80],"semantically":[81],"moment.":[83],"Formulating":[84],"as":[87,102],"Multiple":[89],"Instance":[90],"Learning":[91],"(MIL)":[92],"ranking":[93,232],"problem,":[94,150],"prior":[95],"arts":[96],"rely":[97],"on":[98,167,207],"heuristics":[99],"algorithms":[100],"such":[101],"simple":[104],"greedy":[105],"search":[106],"strategy":[107],"deal":[109],"each":[111],"query":[112],"independently.":[113],"Although":[114],"these":[115],"early":[116],"explorations":[117],"achieved":[119],"decent":[120],"performance,":[121],"they":[122],"may":[123],"not":[124],"fully":[125],"utilize":[126],"bag-level":[128],"label":[129],"only":[131],"consider":[132],"local":[134],"optimum,":[135],"could":[137],"result":[138],"suboptimal":[140],"solutions":[141],"inferior":[143],"final":[144],"performance.":[146,165],"To":[147],"address":[148],"paper,":[153],"we":[154,170],"propose":[155],"exploit":[157],"relationships":[159,226],"between":[160,199],"instances":[161],"boost":[163],"Based":[166],"idea,":[169],"creatively":[171],"put":[172],"forward:":[173],"(1)":[174],"matching":[177],"scheme":[178],"for":[179],"pairing":[180],"queries":[181],"their":[183],"related":[184],"moments":[185],"video;":[188],"(2)":[190],"loss":[193],"function":[194],"facilitate":[196],"alignment":[198],"two":[200],"views":[201],"of":[202,216],"an":[203],"instance.":[204],"Extensive":[205],"validations":[206],"three":[208],"publicly":[209,238],"available":[210,239],"datasets":[211],"demonstrated":[213],"effectiveness":[215],"our":[217,221],"solution":[218],"verified":[220],"hypothesis":[222],"modeling":[224],"instance-level":[225],"beneficial":[228],"MIL":[231],"Our":[234],"code":[235],"will":[236],"https://github.com/xjtupanda/BGM-Net":[241],".":[242]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":3}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
