{"id":"https://openalex.org/W4417125247","doi":"https://doi.org/10.1145/3757377.3764007","title":"FairyGen: Storied Cartoon Video from a Single Child-Drawn Character","display_name":"FairyGen: Storied Cartoon Video from a Single Child-Drawn Character","publication_year":2025,"publication_date":"2025-12-08","ids":{"openalex":"https://openalex.org/W4417125247","doi":"https://doi.org/10.1145/3757377.3764007"},"language":null,"primary_location":{"id":"doi:10.1145/3757377.3764007","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3757377.3764007","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SIGGRAPH Asia 2025 Conference Papers","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036864992","display_name":"Jiayi Zheng","orcid":"https://orcid.org/0009-0001-9573-479X"},"institutions":[{"id":"https://openalex.org/I2799850029","display_name":"Dongguan University of Technology","ror":"https://ror.org/01m8p7q42","country_code":"CN","type":"education","lineage":["https://openalex.org/I2799850029"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiayi Zheng","raw_affiliation_strings":["GVC Lab, Great Bay University, Dongguan, China"],"affiliations":[{"raw_affiliation_string":"GVC Lab, Great Bay University, Dongguan, China","institution_ids":["https://openalex.org/I2799850029"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5058799911","display_name":"Xiaodong Cun","orcid":"https://orcid.org/0000-0003-3607-2236"},"institutions":[{"id":"https://openalex.org/I2799850029","display_name":"Dongguan University of Technology","ror":"https://ror.org/01m8p7q42","country_code":"CN","type":"education","lineage":["https://openalex.org/I2799850029"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaodong Cun","raw_affiliation_strings":["GVC Lab, Great Bay University, Dongguan, China"],"affiliations":[{"raw_affiliation_string":"GVC Lab, Great Bay University, Dongguan, China","institution_ids":["https://openalex.org/I2799850029"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5036864992"],"corresponding_institution_ids":["https://openalex.org/I2799850029"],"apc_list":null,"apc_paid":null,"fwci":1.2158,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.85290581,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"11"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.4553000032901764,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.4553000032901764,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.30730000138282776,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.05400000140070915,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/character","display_name":"Character (mathematics)","score":0.5547999739646912},{"id":"https://openalex.org/keywords/animation","display_name":"Animation","score":0.4625000059604645},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.42260000109672546},{"id":"https://openalex.org/keywords/storytelling","display_name":"Storytelling","score":0.414000004529953},{"id":"https://openalex.org/keywords/style","display_name":"Style (visual arts)","score":0.3885999917984009},{"id":"https://openalex.org/keywords/natural","display_name":"Natural (archaeology)","score":0.3799999952316284},{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.37700000405311584},{"id":"https://openalex.org/keywords/adapter","display_name":"Adapter (computing)","score":0.35429999232292175}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6930999755859375},{"id":"https://openalex.org/C2780861071","wikidata":"https://www.wikidata.org/wiki/Q1062934","display_name":"Character (mathematics)","level":2,"score":0.5547999739646912},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5322999954223633},{"id":"https://openalex.org/C502989409","wikidata":"https://www.wikidata.org/wiki/Q11425","display_name":"Animation","level":2,"score":0.4625000059604645},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.42260000109672546},{"id":"https://openalex.org/C2776538412","wikidata":"https://www.wikidata.org/wiki/Q989963","display_name":"Storytelling","level":3,"score":0.414000004529953},{"id":"https://openalex.org/C2776445246","wikidata":"https://www.wikidata.org/wiki/Q1792644","display_name":"Style (visual arts)","level":2,"score":0.3885999917984009},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.3799999952316284},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3799000084400177},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.37700000405311584},{"id":"https://openalex.org/C177284502","wikidata":"https://www.wikidata.org/wiki/Q1005390","display_name":"Adapter (computing)","level":2,"score":0.35429999232292175},{"id":"https://openalex.org/C90697248","wikidata":"https://www.wikidata.org/wiki/Q1062896","display_name":"Character animation","level":4,"score":0.3352000117301941},{"id":"https://openalex.org/C2777855551","wikidata":"https://www.wikidata.org/wiki/Q12310021","display_name":"Subject (documents)","level":2,"score":0.31769999861717224},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.3086000084877014},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.305400013923645},{"id":"https://openalex.org/C183003079","wikidata":"https://www.wikidata.org/wiki/Q1000371","display_name":"Personalization","level":2,"score":0.3027999997138977},{"id":"https://openalex.org/C126057942","wikidata":"https://www.wikidata.org/wiki/Q35158","display_name":"Stereoscopy","level":2,"score":0.2872999906539917},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.28519999980926514},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2824000120162964},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.2773999869823456},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.2669999897480011},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.2637999951839447},{"id":"https://openalex.org/C11727466","wikidata":"https://www.wikidata.org/wiki/Q1628157","display_name":"Inpainting","level":3,"score":0.262800008058548},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.2574999928474426}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3757377.3764007","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3757377.3764007","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the SIGGRAPH Asia 2025 Conference Papers","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":27,"referenced_works":["https://openalex.org/W2963047368","https://openalex.org/W4312697499","https://openalex.org/W4312721788","https://openalex.org/W4312933868","https://openalex.org/W4313041141","https://openalex.org/W4366407873","https://openalex.org/W4385573943","https://openalex.org/W4386072096","https://openalex.org/W4386075924","https://openalex.org/W4386076425","https://openalex.org/W4386076676","https://openalex.org/W4389574988","https://openalex.org/W4390873054","https://openalex.org/W4394593186","https://openalex.org/W4402660110","https://openalex.org/W4402726937","https://openalex.org/W4402727496","https://openalex.org/W4402727699","https://openalex.org/W4402727736","https://openalex.org/W4402774246","https://openalex.org/W4403601997","https://openalex.org/W4403878131","https://openalex.org/W4403998619","https://openalex.org/W4404968242","https://openalex.org/W4409366101","https://openalex.org/W4412587771","https://openalex.org/W4415798001"],"related_works":[],"abstract_inverted_index":{"We":[0],"propose":[1],"FairyGen,":[2],"an":[3,130],"automatic":[4],"system":[5,167],"for":[6,77,185],"generating":[7,28],"story-driven":[8],"videos":[9],"from":[10],"a":[11,58,65,73,83,100,114,140,145],"single":[12,59],"child\u2019s":[13],"drawing,":[14],"while":[15],"faithfully":[16],"preserving":[17],"its":[18,183],"unique":[19],"artistic":[20],"style,":[21],"maintaining":[22],"consistent":[23],"identity":[24],"across":[25,49],"shots,":[26],"and":[27,54,93,154,176,187],"natural":[29,180],"anthropomorphic":[30],"motion.":[31],"Unlike":[32],"previous":[33],"works":[34],"focusing":[35],"solely":[36],"on":[37],"subject":[38],"or":[39],"motion,":[40,181],"we":[41,62,81,112],"treat":[42],"the":[43,89,97,109,160],"entire":[44],"storytelling":[45],"process":[46],"as":[47],"layered":[48],"character":[50,116],"modeling,":[51],"environment":[52],"generation,":[53,80],"shot":[55],"design.":[56],"Given":[57],"hand-drawn":[60],"image,":[61],"first":[63],"employ":[64],"Multimodal":[66],"Large":[67],"Language":[68],"Model":[69],"(MLLM)":[70],"to":[71,96,107,118,128],"generate":[72],"structured":[74],"storyboard.":[75,161],"Subsequently,":[76],"style-consistent":[78],"background":[79,102],"introduce":[82],"style":[84,92],"propagation":[85],"adapter":[86,143],"that":[87,165,170],"captures":[88],"character\u2019s":[90],"visual":[91],"propagates":[94],"it":[95],"background,":[98],"via":[99],"pre-trained":[101],"inpainting":[103],"diffusion":[104,133],"model.":[105],"Furthermore,":[106],"animate":[108],"generated":[110],"scenes,":[111],"reconstruct":[113],"3D":[115],"proxy":[117],"derive":[119],"plausible":[120],"motion":[121,138,141],"sequences.":[122],"These":[123],"sequences":[124],"are":[125,171],"then":[126],"used":[127],"fine-tune":[129],"MMDiT-based":[131],"image-to-video":[132],"model,":[134],"which":[135],"learns":[136],"complex":[137],"through":[139],"customization":[142],"with":[144,159],"timestep-shift":[146],"strategy.":[147],"Once":[148],"trained,":[149],"FairyGen":[150],"directly":[151],"renders":[152],"diverse":[153],"coherent":[155],"video":[156],"scenes":[157],"aligned":[158],"Extensive":[162],"experiments":[163],"demonstrate":[164],"our":[166],"produces":[168],"animations":[169],"stylistically":[172],"faithful,":[173],"narratively":[174],"structured,":[175],"rich":[177],"in":[178],"smooth,":[179],"highlighting":[182],"potential":[184],"personalized":[186],"engaging":[188],"story":[189],"animation.":[190]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-12-08T00:00:00"}
