{"id":"https://openalex.org/W4404526287","doi":"https://doi.org/10.1145/3687975","title":"StyleCrafter: Taming Artistic Video Diffusion with Reference-Augmented Adapter Learning","display_name":"StyleCrafter: Taming Artistic Video Diffusion with Reference-Augmented Adapter Learning","publication_year":2024,"publication_date":"2024-11-19","ids":{"openalex":"https://openalex.org/W4404526287","doi":"https://doi.org/10.1145/3687975"},"language":"en","primary_location":{"id":"doi:10.1145/3687975","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3687975","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3687975","source":{"id":"https://openalex.org/S185367456","display_name":"ACM Transactions on Graphics","issn_l":"0730-0301","issn":["0730-0301","1557-7368"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Graphics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3687975","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039191938","display_name":"Gongye Liu","orcid":"https://orcid.org/0009-0003-6536-282X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Gongye Liu","raw_affiliation_strings":["Tsinghua University, shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, shenzhen, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046222739","display_name":"Menghan Xia","orcid":"https://orcid.org/0000-0001-9664-4967"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Menghan Xia","raw_affiliation_strings":["Tencent AI lab, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent AI lab, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100419834","display_name":"Yong Zhang","orcid":"https://orcid.org/0000-0003-0066-3448"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Zhang","raw_affiliation_strings":["Tencent AI lab, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent AI lab, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024800495","display_name":"Haoxin Chen","orcid":"https://orcid.org/0009-0000-6085-2107"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoxin Chen","raw_affiliation_strings":["Tencent AI lab, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent AI lab, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5066086464","display_name":"Jinbo Xing","orcid":"https://orcid.org/0000-0002-2181-1879"},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"HK","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jinbo Xing","raw_affiliation_strings":["The Chinese University of Hong Kong, HongKong, China"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong, HongKong, China","institution_ids":["https://openalex.org/I177725633"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100354968","display_name":"Yibo Wang","orcid":"https://orcid.org/0000-0002-2829-0156"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yibo Wang","raw_affiliation_strings":["Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101538534","display_name":"Xintao Wang","orcid":"https://orcid.org/0000-0001-6585-8604"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xintao Wang","raw_affiliation_strings":["Tencent AI lab, ShenZhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent AI lab, ShenZhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102004349","display_name":"Ying Shan","orcid":"https://orcid.org/0000-0001-7673-8325"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ying Shan","raw_affiliation_strings":["Tencent AI lab, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tencent AI lab, Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5020953714","display_name":"Yujiu Yang","orcid":"https://orcid.org/0000-0002-6427-1024"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yujiu Yang","raw_affiliation_strings":["Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5039191938"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":1.9943,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.88203924,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"43","issue":"6","first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11105","display_name":"Advanced Image Processing Techniques","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9878000020980835,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adapter","display_name":"Adapter (computing)","score":0.7745981812477112},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6471819877624512},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.5473870635032654},{"id":"https://openalex.org/keywords/augmented-reality","display_name":"Augmented reality","score":0.526104748249054},{"id":"https://openalex.org/keywords/diffusion","display_name":"Diffusion","score":0.43567055463790894},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3691067695617676},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.36354076862335205},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.06383487582206726},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.061592429876327515}],"concepts":[{"id":"https://openalex.org/C177284502","wikidata":"https://www.wikidata.org/wiki/Q1005390","display_name":"Adapter (computing)","level":2,"score":0.7745981812477112},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6471819877624512},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.5473870635032654},{"id":"https://openalex.org/C153715457","wikidata":"https://www.wikidata.org/wiki/Q254183","display_name":"Augmented reality","level":2,"score":0.526104748249054},{"id":"https://openalex.org/C69357855","wikidata":"https://www.wikidata.org/wiki/Q163214","display_name":"Diffusion","level":2,"score":0.43567055463790894},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3691067695617676},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.36354076862335205},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.06383487582206726},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.061592429876327515},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3687975","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3687975","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3687975","source":{"id":"https://openalex.org/S185367456","display_name":"ACM Transactions on Graphics","issn_l":"0730-0301","issn":["0730-0301","1557-7368"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Graphics","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3687975","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3687975","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3687975","source":{"id":"https://openalex.org/S185367456","display_name":"ACM Transactions on Graphics","issn_l":"0730-0301","issn":["0730-0301","1557-7368"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Graphics","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.5899999737739563,"id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G712080188","display_name":null,"funder_award_id":"61991451","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4404526287.pdf"},"referenced_works_count":45,"referenced_works":["https://openalex.org/W398859631","https://openalex.org/W569478347","https://openalex.org/W1987474052","https://openalex.org/W2102154096","https://openalex.org/W2125879936","https://openalex.org/W2292976057","https://openalex.org/W2344328033","https://openalex.org/W2475287302","https://openalex.org/W2603351312","https://openalex.org/W2603777577","https://openalex.org/W2956900569","https://openalex.org/W2969803502","https://openalex.org/W3003483634","https://openalex.org/W3024643182","https://openalex.org/W3027723803","https://openalex.org/W3036167779","https://openalex.org/W3048537404","https://openalex.org/W3086415202","https://openalex.org/W3102542372","https://openalex.org/W3137692012","https://openalex.org/W3159481202","https://openalex.org/W3177457352","https://openalex.org/W3202767484","https://openalex.org/W3204588463","https://openalex.org/W4225307095","https://openalex.org/W4281253515","https://openalex.org/W4306820534","https://openalex.org/W4312933868","https://openalex.org/W4313029666","https://openalex.org/W4386071613","https://openalex.org/W4386072096","https://openalex.org/W4386076027","https://openalex.org/W4386076425","https://openalex.org/W4386721758","https://openalex.org/W4389334985","https://openalex.org/W4390871782","https://openalex.org/W4390873135","https://openalex.org/W4390874393","https://openalex.org/W4402716124","https://openalex.org/W6600060591","https://openalex.org/W6600339963","https://openalex.org/W6600688380","https://openalex.org/W6602344735","https://openalex.org/W6693853403","https://openalex.org/W6779823529"],"related_works":["https://openalex.org/W2133028525","https://openalex.org/W4229060448","https://openalex.org/W4306381730","https://openalex.org/W2981692913","https://openalex.org/W3044188621","https://openalex.org/W3184035966","https://openalex.org/W2172197285","https://openalex.org/W2991048842","https://openalex.org/W2750280393","https://openalex.org/W2355696739"],"abstract_inverted_index":{"Text-to-video":[0],"(T2V)":[1],"models":[2,50],"have":[3],"shown":[4],"remarkable":[5],"capabilities":[6],"in":[7,25,59],"generating":[8],"diverse":[9],"videos.":[10],"However,":[11],"they":[12],"struggle":[13],"to":[14,20,76,93,112,123],"produce":[15],"user-desired":[16],"artistic":[17,71],"videos":[18,149],"due":[19],"(i)":[21],"text's":[22],"inherent":[23],"clumsiness":[24],"expressing":[26],"specific":[27],"styles":[28],"and":[29,131,141,158,174],"(ii)":[30],"the":[31,68,89,125,153,156,160,163],"generally":[32],"degraded":[33],"style":[34,53,61,80,133,142,161],"fidelity.":[35],"To":[36,101],"address":[37],"these":[38],"challenges,":[39],"we":[40,74,105,117],"introduce":[41],"StyleCrafter,":[42],"a":[43,52,64,79,97,119],"generic":[44],"method":[45],"that":[46,150,168],"enhances":[47],"pretrained":[48],"T2V":[49],"with":[51,152],"control":[54,81],"adapter,":[55],"allowing":[56],"video":[57,72,94],"generation":[58,95],"any":[60],"by":[62],"feeding":[63],"reference":[65,164],"image.":[66],"Considering":[67],"scarcity":[69],"of":[70,127,155,162],"data,":[73],"propose":[75,118],"first":[77],"train":[78],"adapter":[82],"using":[83],"style-rich":[84],"image":[85],"datasets,":[86],"then":[87],"transfer":[88],"learned":[90],"stylization":[91],"ability":[92],"through":[96],"tailor-made":[98],"finetuning":[99],"paradigm.":[100],"promote":[102],"content-style":[103],"disentanglement,":[104],"employ":[106],"carefully":[107],"designed":[108],"data":[109],"augmentation":[110],"strategies":[111],"enhance":[113],"decoupled":[114],"learning.":[115],"Additionally,":[116],"scale-adaptive":[120],"fusion":[121],"module":[122],"balance":[124],"influences":[126],"text-based":[128],"content":[129,154],"features":[130],"image-based":[132],"features,":[134],"which":[135],"helps":[136],"generalization":[137],"across":[138],"various":[139],"text":[140],"combinations.":[143],"StyleCrafter":[144],"efficiently":[145],"generates":[146],"high-quality":[147],"stylized":[148],"align":[151],"texts":[157],"resemble":[159],"images.":[165],"Experiments":[166],"demonstrate":[167],"our":[169],"approach":[170],"is":[171],"more":[172],"flexible":[173],"efficient":[175],"than":[176],"existing":[177],"competitors.":[178],"Project":[179],"page:":[180],"https://gongyeliu.github.io/StyleCrafter.github.io/":[181]},"counts_by_year":[{"year":2025,"cited_by_count":8}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
