{"id":"https://openalex.org/W4409158187","doi":"https://doi.org/10.1145/3690624.3709401","title":"Large Vison-Language Foundation Model in Baidu AIGC Image Advertising","display_name":"Large Vison-Language Foundation Model in Baidu AIGC Image Advertising","publication_year":2025,"publication_date":"2025-04-04","ids":{"openalex":"https://openalex.org/W4409158187","doi":"https://doi.org/10.1145/3690624.3709401"},"language":"en","primary_location":{"id":"doi:10.1145/3690624.3709401","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3690624.3709401","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining V.1","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101725735","display_name":"Zhipeng Jin","orcid":"https://orcid.org/0009-0003-0863-2539"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhipeng Jin","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103325818","display_name":"Wen Tao","orcid":null},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wen Tao","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040477695","display_name":"Yafei Li","orcid":null},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yafei Li","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100747784","display_name":"Yi Yang","orcid":"https://orcid.org/0000-0001-5077-4782"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Yang","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011745550","display_name":"Cong Han","orcid":"https://orcid.org/0009-0003-6516-1139"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cong Han","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086810479","display_name":"Shuanglong Li","orcid":"https://orcid.org/0009-0002-7346-5258"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuanglong Li","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5034880019","display_name":"Lin Liu","orcid":"https://orcid.org/0009-0003-7305-8940"},"institutions":[{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Liu","raw_affiliation_strings":["Baidu Inc., Beijing, China"],"affiliations":[{"raw_affiliation_string":"Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I98301712"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5101725735"],"corresponding_institution_ids":["https://openalex.org/I98301712"],"apc_list":null,"apc_paid":null,"fwci":1.3104,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.78783417,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"2303","last_page":"2312"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6871321797370911},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.6498763561248779},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4710127115249634},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.43352681398391724},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3870498538017273},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37694719433784485},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.3606170117855072},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.35794901847839355},{"id":"https://openalex.org/keywords/advertising","display_name":"Advertising","score":0.32796987891197205},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.325023889541626},{"id":"https://openalex.org/keywords/political-science","display_name":"Political science","score":0.09572085738182068},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.08136159181594849}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6871321797370911},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.6498763561248779},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4710127115249634},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.43352681398391724},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3870498538017273},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37694719433784485},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.3606170117855072},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.35794901847839355},{"id":"https://openalex.org/C112698675","wikidata":"https://www.wikidata.org/wiki/Q37038","display_name":"Advertising","level":1,"score":0.32796987891197205},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.325023889541626},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.09572085738182068},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.08136159181594849},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3690624.3709401","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3690624.3709401","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining V.1","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.41999998688697815,"display_name":"Decent work and economic growth","id":"https://metadata.un.org/sdg/8"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":62,"referenced_works":["https://openalex.org/W146900863","https://openalex.org/W2117340018","https://openalex.org/W2512971201","https://openalex.org/W2525579820","https://openalex.org/W2749708282","https://openalex.org/W2963527096","https://openalex.org/W2968880719","https://openalex.org/W2993466051","https://openalex.org/W3020257313","https://openalex.org/W3091588028","https://openalex.org/W3102566412","https://openalex.org/W3126337491","https://openalex.org/W3126792443","https://openalex.org/W3135367836","https://openalex.org/W3139669840","https://openalex.org/W3154430790","https://openalex.org/W3165938948","https://openalex.org/W3170767867","https://openalex.org/W3173789715","https://openalex.org/W3184735396","https://openalex.org/W3193402170","https://openalex.org/W3208314443","https://openalex.org/W4206238894","https://openalex.org/W4211015534","https://openalex.org/W4214708455","https://openalex.org/W4221167912","https://openalex.org/W4226182655","https://openalex.org/W4229042118","https://openalex.org/W4242655467","https://openalex.org/W4249736682","https://openalex.org/W4283388932","https://openalex.org/W4290877962","https://openalex.org/W4291125268","https://openalex.org/W4293342478","https://openalex.org/W4304014690","https://openalex.org/W4306316995","https://openalex.org/W4306820534","https://openalex.org/W4308241978","https://openalex.org/W4309130331","https://openalex.org/W4312057601","https://openalex.org/W4312747027","https://openalex.org/W4313484371","https://openalex.org/W4318147416","https://openalex.org/W4318211321","https://openalex.org/W4318718936","https://openalex.org/W4320495974","https://openalex.org/W4366344047","https://openalex.org/W4366850747","https://openalex.org/W4383472654","https://openalex.org/W4384652685","https://openalex.org/W4385570133","https://openalex.org/W4385970122","https://openalex.org/W4386066596","https://openalex.org/W4387195417","https://openalex.org/W4390873054","https://openalex.org/W4391335164","https://openalex.org/W4391602018","https://openalex.org/W4400529471","https://openalex.org/W6741832134","https://openalex.org/W6790978476","https://openalex.org/W6843350042","https://openalex.org/W6851592950"],"related_works":["https://openalex.org/W2381393187","https://openalex.org/W2332779545","https://openalex.org/W2358060160","https://openalex.org/W2035483685","https://openalex.org/W1969764885","https://openalex.org/W596947562","https://openalex.org/W2793937822","https://openalex.org/W2790817834","https://openalex.org/W2777605427","https://openalex.org/W2501983714"],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,103,195,221],"generative":[3],"artificial":[4],"intelligence":[5],"have":[6,212],"revolutionized":[7],"information":[8],"retrieval":[9],"and":[10,26,48,77,145,150,156,181],"content":[11],"generation,":[12],"opening":[13],"up":[14],"new":[15],"opportunities":[16],"for":[17,53,73,89,148],"the":[18,118,125,138,157,160,165],"e-commerce":[19],"industry.":[20],"Alignment":[21],"learning":[22,82],"between":[23],"small":[24],"models":[25,40,95],"parallel":[27],"corpora":[28,52],"cannot":[29],"meet":[30],"current":[31],"needs.":[32],"The":[33,170,190],"success":[34],"of":[35,121,159,167,173,192,225],"ChatGPT":[36],"demonstrates":[37,142],"that":[38,116],"large":[39,57],"need":[41],"to":[42,98,101,133,201],"first":[43],"establish":[44,66],"a":[45,56,67,79,214,222],"fundamental":[46,68],"understanding,":[47],"then":[49],"utilize":[50,110],"high-quality":[51],"generation.":[54],"Having":[55],"model":[58,71],"foundation":[59,72,140],"is":[60],"indispensable.":[61],"In":[62],"this":[63],"paper,":[64],"we":[65,109],"10B":[69],"multimodal":[70,74,139],"generation":[75,91],"tasks":[76],"propose":[78],"scene-based":[80],"alignment":[81,144],"approach":[83],"called":[84],"conditional":[85,154],"sample":[86],"supervised":[87],"fine-tuning":[88,155],"downstream":[90],"tasks.":[92],"Meanwhile,":[93],"diffusion":[94,113],"are":[96],"known":[97],"be":[99],"vulnerable":[100],"outliers":[102],"training":[104],"data.":[105],"To":[106],"address":[107],"this,":[108],"an":[111],"alternative":[112],"loss":[114,129,161],"function":[115,162],"preserves":[117],"high":[119],"quality":[120,166,171],"generated":[122,168,209],"data":[123],"like":[124],"original":[126],"squared":[127],"L2":[128],"while":[130],"being":[131],"robust":[132],"outliers.In":[134],"practical":[135],"test":[136],"sets,":[137],"fully":[141],"its":[143],"comprehension":[146],"abilities":[147],"graphic":[149],"textual":[151],"content.":[152,169],"Additionally,":[153],"design":[158],"significantly":[163],"enhance":[164],"rate":[172,218],"images":[174],"has":[175,184,199],"increased":[176],"by":[177,186],"34.3":[178],"percentage":[179,188],"points,":[180],"prompt":[182],"control":[183],"improved":[185],"19.8":[187],"points.":[189],"application":[191],"our":[193],"framework":[194],"Baidu":[196],"Search":[197],"Ads":[198],"led":[200],"significant":[202],"revenue":[203],"growth.":[204],"For":[205],"instance,":[206],"ads":[207],"with":[208],"image":[210],"creatives":[211],"achieved":[213],"29%":[215],"higher":[216],"click-through":[217],"(CTR),":[219],"resulting":[220],"daily":[223],"consumption":[224],"3":[226],"million":[227],"yuan.":[228]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
