{"id":"https://openalex.org/W3211032667","doi":"https://doi.org/10.1145/3459637.3481937","title":"Multi-modal Dictionary BERT for Cross-modal Video Search in Baidu Advertising","display_name":"Multi-modal Dictionary BERT for Cross-modal Video Search in Baidu Advertising","publication_year":2021,"publication_date":"2021-10-26","ids":{"openalex":"https://openalex.org/W3211032667","doi":"https://doi.org/10.1145/3459637.3481937","mag":"3211032667"},"language":"en","primary_location":{"id":"doi:10.1145/3459637.3481937","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3459637.3481937","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018887598","display_name":"Tan Yu","orcid":"https://orcid.org/0000-0001-6071-0395"},"institutions":[{"id":"https://openalex.org/I4210108985","display_name":"Bellevue Hospital Center","ror":"https://ror.org/01ky34z31","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1283621791","https://openalex.org/I4210086933","https://openalex.org/I4210108985"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Tan Yu","raw_affiliation_strings":["Baidu Research, Bellevue, WA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Baidu Research, Bellevue, WA, USA","institution_ids":["https://openalex.org/I4210108985"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100747784","display_name":"Yi Yang","orcid":"https://orcid.org/0000-0001-5077-4782"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Yang","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100421473","display_name":"Yi Li","orcid":"https://orcid.org/0000-0002-2856-7290"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Li","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100383322","display_name":"Lin Liu","orcid":"https://orcid.org/0000-0002-8919-3173"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Liu","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103150619","display_name":"Mingming Sun","orcid":"https://orcid.org/0000-0002-6199-4905"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingming Sun","raw_affiliation_strings":["Baidu Research, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Baidu Research, Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100435527","display_name":"Ping Li","orcid":"https://orcid.org/0000-0002-5979-8868"},"institutions":[{"id":"https://openalex.org/I4210108985","display_name":"Bellevue Hospital Center","ror":"https://ror.org/01ky34z31","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1283621791","https://openalex.org/I4210086933","https://openalex.org/I4210108985"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ping Li","raw_affiliation_strings":["Baidu Research, Bellevue, WA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Baidu Research, Bellevue, WA, USA","institution_ids":["https://openalex.org/I4210108985"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.1643,"has_fulltext":false,"cited_by_count":13,"citation_normalized_percentile":{"value":0.81039015,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"4341","last_page":"4351"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9952999949455261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7868590354919434},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.6154747605323792},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5643545389175415},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.47054818272590637},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.41617411375045776},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39114290475845337},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.32339656352996826}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7868590354919434},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.6154747605323792},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5643545389175415},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.47054818272590637},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.41617411375045776},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39114290475845337},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.32339656352996826},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3459637.3481937","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3459637.3481937","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W1905882502","https://openalex.org/W1995609428","https://openalex.org/W2070753207","https://openalex.org/W2077815765","https://openalex.org/W2100235303","https://openalex.org/W2106277773","https://openalex.org/W2124509324","https://openalex.org/W2194775991","https://openalex.org/W2388114291","https://openalex.org/W2546696630","https://openalex.org/W2552579943","https://openalex.org/W2560835477","https://openalex.org/W2778940641","https://openalex.org/W2786148882","https://openalex.org/W2950960796","https://openalex.org/W2970231061","https://openalex.org/W2981851019","https://openalex.org/W2984020950","https://openalex.org/W2989550455","https://openalex.org/W2997591391","https://openalex.org/W2998356391","https://openalex.org/W3028864969","https://openalex.org/W3034709327","https://openalex.org/W3034727271","https://openalex.org/W3035265375","https://openalex.org/W3043840704","https://openalex.org/W3080510735","https://openalex.org/W3090449556","https://openalex.org/W3091588028","https://openalex.org/W3093559962","https://openalex.org/W3102995547","https://openalex.org/W3105232955","https://openalex.org/W3154430790","https://openalex.org/W3164904666","https://openalex.org/W3166304536","https://openalex.org/W3168851777","https://openalex.org/W3171668871","https://openalex.org/W3171927989","https://openalex.org/W3173220247","https://openalex.org/W3173789715","https://openalex.org/W3173839890","https://openalex.org/W3174010726","https://openalex.org/W3177155667","https://openalex.org/W3209275363"],"related_works":["https://openalex.org/W2384888906","https://openalex.org/W2144190808","https://openalex.org/W2376314740","https://openalex.org/W2366644548","https://openalex.org/W2357241418","https://openalex.org/W2115485936","https://openalex.org/W3137057511","https://openalex.org/W4285224442","https://openalex.org/W3162363894","https://openalex.org/W2500366714"],"abstract_inverted_index":{"Due":[0],"to":[1,55,190,196,206],"their":[2],"attractiveness,":[3],"video":[4,28,35,113,135,160,172,221],"advertisements":[5,29],"are":[6],"adored":[7],"by":[8,81,86,229],"advertisers.":[9],"Baidu,":[10],"as":[11,71,74],"one":[12],"of":[13,58],"the":[14,56,82,122,167,175,192,198,203,224],"leading":[15],"search":[16],"advertisement":[17,32,36,114,136],"platforms":[18],"in":[19,39,88,100,112,219,238],"China,":[20],"is":[21,46,157],"putting":[22],"more":[23,25],"and":[24,63,96,116,146,162,171,178],"effort":[26],"into":[27,174],"for":[30,134,236],"its":[31,75],"customers.":[33],"Search-based":[34],"display":[37],"is,":[38],"essence,":[40],"a":[41,108,153,213,232],"cross-modal":[42,92,101,109,148,182],"retrieval":[43],"problem,":[44],"which":[45,156],"normally":[47],"tackled":[48],"through":[49],"joint":[50,66,154],"embedding":[51,67],"methods.":[52],"Nevertheless,":[53],"due":[54],"lack":[57],"interactions":[59],"between":[60],"text":[61],"features":[62,161,170,173],"image":[64],"features,":[65],"methods":[68],"cannot":[69],"achieve":[70,97,207],"high":[72],"accuracy":[73],"counterpart":[76],"based":[77],"on":[78],"attention.":[79,183],"Inspired":[80],"great":[83],"success":[84],"achieved":[85,117],"BERT":[87,93,140,149],"NLP":[89],"tasks,":[90],"many":[91],"models":[94],"emerge":[95],"excellent":[98],"performance":[99,120],"retrieval.":[102],"Last":[103],"year,":[104],"Baidu":[105,220],"also":[106],"launched":[107],"BERT,":[110],"CAN,":[111],"platform,":[115,223],"considerably":[118],"better":[119],"than":[121],"previous":[123],"joint-embedding":[124],"model.":[125,142],"In":[126],"this":[127],"paper,":[128],"we":[129,188,201],"present":[130],"our":[131],"recent":[132],"work":[133],"retrieval,":[137],"Multi-modal":[138],"Dictionary":[139],"(MDBERT)":[141],"Compared":[143],"with":[144],"CAN":[145],"other":[147],"models,":[150],"MDBERT":[151,218],"integrates":[152],"dictionary,":[155],"shared":[158],"among":[159],"word":[163,169],"features.":[164],"It":[165],"maps":[166],"relevant":[168],"same":[176],"codeword":[177,193],"thus":[179],"fosters":[180],"effective":[181],"To":[184],"support":[185],"end-to-end":[186],"training,":[187],"propose":[189],"soften":[191],"assignment.":[194],"Meanwhile,":[195],"enhance":[197],"inference":[199],"efficiency,":[200],"adopt":[202],"product":[204],"quantization":[205],"fine-level":[208],"feature":[209],"space":[210],"partition":[211],"at":[212],"low":[214],"cost.":[215],"After":[216],"launching":[217],"advertising":[222],"conversion":[225],"ratio":[226],"(CVR)":[227],"increases":[228],"3.34%,":[230],"bringing":[231],"considerable":[233],"revenue":[234],"boost":[235],"advertisers":[237],"Baidu.":[239]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
