{"id":"https://openalex.org/W4397026222","doi":"https://doi.org/10.1109/tmm.2024.3402613","title":"MAC: Masked Contrastive Pre-Training for Efficient Video-Text Retrieval","display_name":"MAC: Masked Contrastive Pre-Training for Efficient Video-Text Retrieval","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4397026222","doi":"https://doi.org/10.1109/tmm.2024.3402613"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2024.3402613","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2024.3402613","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052135698","display_name":"Fangxun Shu","orcid":null},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Fangxun Shu","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059047717","display_name":"Biaolong Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I45928872","display_name":"Alibaba Group (China)","ror":"https://ror.org/00k642b80","country_code":"CN","type":"company","lineage":["https://openalex.org/I45928872"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Biaolong Chen","raw_affiliation_strings":["Alibaba Group, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Alibaba Group, Beijing, China","institution_ids":["https://openalex.org/I45928872"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002061412","display_name":"Yue Liao","orcid":"https://orcid.org/0000-0002-2671-0655"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yue Liao","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058420913","display_name":"Jinqiao Wang","orcid":"https://orcid.org/0000-0002-9118-2780"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]},{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinqiao Wang","raw_affiliation_strings":["National Laboratory of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences, Beijing, China","School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Laboratory of Pattern Recognition, Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210100255","https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100330138","display_name":"Si Liu","orcid":"https://orcid.org/0000-0002-9180-2935"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Si Liu","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5052135698"],"corresponding_institution_ids":["https://openalex.org/I45928872"],"apc_list":null,"apc_paid":null,"fwci":1.2249,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.79565626,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":"26","issue":null,"first_page":"9962","last_page":"9972"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8737857937812805},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5174277424812317},{"id":"https://openalex.org/keywords/video-retrieval","display_name":"Video retrieval","score":0.4909262955188751},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4570349454879761},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.443244069814682},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.41816315054893494},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.405538409948349},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.3626976013183594}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8737857937812805},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5174277424812317},{"id":"https://openalex.org/C2983174267","wikidata":"https://www.wikidata.org/wiki/Q3775098","display_name":"Video retrieval","level":2,"score":0.4909262955188751},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4570349454879761},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.443244069814682},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.41816315054893494},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.405538409948349},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.3626976013183594},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2024.3402613","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2024.3402613","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2558812161","display_name":null,"funder_award_id":"U23B2010","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3030772475","display_name":null,"funder_award_id":"2022C01082","funder_id":"https://openalex.org/F8142712028","funder_display_name":"Key Research and Development Program of Zhejiang Province"},{"id":"https://openalex.org/G5696407354","display_name":null,"funder_award_id":"62122010","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F8142712028","display_name":"Key Research and Development Program of Zhejiang Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":90,"referenced_works":["https://openalex.org/W1927052826","https://openalex.org/W2185175083","https://openalex.org/W2194775991","https://openalex.org/W2425121537","https://openalex.org/W2507009361","https://openalex.org/W2618530766","https://openalex.org/W2746314669","https://openalex.org/W2752796333","https://openalex.org/W2808399042","https://openalex.org/W2883429621","https://openalex.org/W2886641317","https://openalex.org/W2896457183","https://openalex.org/W2952370363","https://openalex.org/W2956367483","https://openalex.org/W2963017553","https://openalex.org/W2978017171","https://openalex.org/W2981851019","https://openalex.org/W2984008963","https://openalex.org/W2990503944","https://openalex.org/W3035265375","https://openalex.org/W3035356601","https://openalex.org/W3035682985","https://openalex.org/W3043840704","https://openalex.org/W3090449556","https://openalex.org/W3094502228","https://openalex.org/W3105232955","https://openalex.org/W3118694826","https://openalex.org/W3126721948","https://openalex.org/W3128990302","https://openalex.org/W3138516171","https://openalex.org/W3145807616","https://openalex.org/W3168640669","https://openalex.org/W3173948887","https://openalex.org/W3204588463","https://openalex.org/W3204670646","https://openalex.org/W3207042189","https://openalex.org/W3216270236","https://openalex.org/W3217059257","https://openalex.org/W3217102353","https://openalex.org/W4210900713","https://openalex.org/W4214612132","https://openalex.org/W4221142658","https://openalex.org/W4225414521","https://openalex.org/W4226340378","https://openalex.org/W4281623693","https://openalex.org/W4281899128","https://openalex.org/W4283029876","https://openalex.org/W4285606530","https://openalex.org/W4286540937","https://openalex.org/W4292754598","https://openalex.org/W4294691145","https://openalex.org/W4297808394","https://openalex.org/W4304014690","https://openalex.org/W4312312750","https://openalex.org/W4312538879","https://openalex.org/W4312560592","https://openalex.org/W4312634508","https://openalex.org/W4312655527","https://openalex.org/W4312685069","https://openalex.org/W4312804044","https://openalex.org/W4313156423","https://openalex.org/W4313186260","https://openalex.org/W4323065192","https://openalex.org/W4379662646","https://openalex.org/W4385572645","https://openalex.org/W4386071687","https://openalex.org/W4386076084","https://openalex.org/W4386076661","https://openalex.org/W4387885937","https://openalex.org/W4394659899","https://openalex.org/W6631190155","https://openalex.org/W6637373629","https://openalex.org/W6684090549","https://openalex.org/W6743428213","https://openalex.org/W6766582784","https://openalex.org/W6767211374","https://openalex.org/W6768851824","https://openalex.org/W6784184991","https://openalex.org/W6789753369","https://openalex.org/W6796761347","https://openalex.org/W6797109355","https://openalex.org/W6797236868","https://openalex.org/W6805349323","https://openalex.org/W6810265253","https://openalex.org/W6838540985","https://openalex.org/W6838580846","https://openalex.org/W6838789689","https://openalex.org/W6842514839","https://openalex.org/W6844194202","https://openalex.org/W6864544085"],"related_works":["https://openalex.org/W230091440","https://openalex.org/W2233261550","https://openalex.org/W2810751659","https://openalex.org/W258997015","https://openalex.org/W2997094352","https://openalex.org/W3216976533","https://openalex.org/W100620283","https://openalex.org/W2495260952","https://openalex.org/W655728004","https://openalex.org/W2046272293"],"abstract_inverted_index":{"We":[0],"present":[1],"a":[2,36,54,95,128],"simple":[3],"yet":[4],"effective":[5],"end-to-end":[6,144],"Video-language":[7,13],"Pre-training":[8,14],"(VidLP)":[9],"framework,":[10],"Masked":[11],"Contrastive":[12],"(MAC),":[15],"for":[16,79,82,98],"video-text":[17,100,106,163],"retrieval":[18,107,164,187],"tasks.":[19,188],"Our":[20,156,171],"MAC":[21,157],"aims":[22],"to":[23,40,51,126,175],"reduce":[24],"video":[25],"representation's":[26],"spatial":[27,58,70],"and":[28,60,117,130,136,152,169],"temporal":[29,46],"redundancy":[30],"in":[31],"the":[32,66,75,88,124],"VidLP":[33],"model":[34,125],"by":[35],"mask":[37,53,76],"sampling":[38,77],"mechanism":[39],"improve":[41],"pre-training":[42],"efficiency.":[43],"Comparing":[44],"conventional":[45],"sparse":[47,69],"sampling,":[48],"we":[49,73,93,181],"propose":[50,94],"randomly":[52],"high":[55],"ratio":[56],"of":[57,85],"regions":[59,64],"only":[61],"take":[62],"visible":[63],"into":[65],"encoder":[67],"as":[68],"sampling.":[71],"Similarly,":[72],"adopt":[74],"technique":[78],"text":[80],"inputs":[81],"consistency.":[83],"Instead":[84],"blindly":[86],"applying":[87],"mask-then-prediction":[89],"paradigm":[90,97],"from":[91,134],"MAE,":[92],"masked-then-alignment":[96],"efficient":[99,143],"alignment.":[101],"The":[102],"motivation":[103],"is":[104,173],"that":[105],"tasks":[108],"rely":[109],"on":[110,161,185],"high-level":[111],"alignment":[112,119],"rather":[113],"than":[114],"low-level":[115],"reconstruction,":[116],"multimodal":[118,132],"with":[120],"masked":[121],"modeling":[122],"encourages":[123],"learn":[127],"robust":[129],"general":[131],"representation":[133],"incomplete":[135],"unstable":[137],"inputs.":[138],"Coupling":[139],"these":[140],"designs":[141],"enables":[142],"pre-training:":[145],"3\u00d7":[146],"speed":[147],"up,":[148],"60%+":[149],"computation":[150],"reduction,":[151],"4%+":[153],"performance":[154],"improvement.":[155],"achieves":[158],"state-of-the-art":[159],"results":[160,184],"various":[162],"datasets":[165],"including":[166],"MSR-VTT,":[167],"DiDeMo,":[168],"ActivityNet.":[170],"approach":[172],"omnivorous":[174],"input":[176],"modalities.":[177],"With":[178],"minimal":[179],"modifications,":[180],"achieve":[182],"competitive":[183],"image-text":[186]},"counts_by_year":[{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
