{"id":"https://openalex.org/W7138230452","doi":"https://doi.org/10.48550/arxiv.2603.13506","title":"LibraGen: Playing a Balance Game in Subject-Driven Video Generation","display_name":"LibraGen: Playing a Balance Game in Subject-Driven Video Generation","publication_year":2026,"publication_date":"2026-03-13","ids":{"openalex":"https://openalex.org/W7138230452","doi":"https://doi.org/10.48550/arxiv.2603.13506"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.13506","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.13506","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.13506","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5129750939","display_name":"Jiahao Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhu, Jiahao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086678836","display_name":"Shanshan Lao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lao, Shanshan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129736793","display_name":"Lijie Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Lijie","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129712667","display_name":"Gen Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Gen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041901127","display_name":"T. F. Qi","orcid":"https://orcid.org/0000-0003-3649-5263"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qi, Tianhao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129750103","display_name":"Wei Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Wei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129752426","display_name":"Bingchuan Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Bingchuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Liu, Fangfang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Fangfang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101970062","display_name":"Zehao Chen","orcid":"https://orcid.org/0009-0005-3247-8417"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Zhuowei","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129705580","display_name":"Tianxiang Ma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Tianxiang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129694545","display_name":"Qian HE","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"HE, Qian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129750839","display_name":"Yi Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Yi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129661719","display_name":"Xiaohua Xie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xie, Xiaohua","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5129750939"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.6669999957084656,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.6669999957084656,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.11190000176429749,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.07190000265836716,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.6287999749183655},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5964000225067139},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5041000247001648},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.44020000100135803},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.41190001368522644},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4027000069618225},{"id":"https://openalex.org/keywords/core","display_name":"Core (optical fiber)","score":0.38760000467300415},{"id":"https://openalex.org/keywords/video-game","display_name":"Video game","score":0.35359999537467957}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7817999720573425},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.6287999749183655},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5964000225067139},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5041000247001648},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4684999883174896},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.44020000100135803},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4251999855041504},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.41190001368522644},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4027000069618225},{"id":"https://openalex.org/C2164484","wikidata":"https://www.wikidata.org/wiki/Q5170150","display_name":"Core (optical fiber)","level":2,"score":0.38760000467300415},{"id":"https://openalex.org/C3018412434","wikidata":"https://www.wikidata.org/wiki/Q7889","display_name":"Video game","level":2,"score":0.35359999537467957},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.3334999978542328},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.32679998874664307},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.32519999146461487},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.2930999994277954},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.28380000591278076},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.26809999346733093},{"id":"https://openalex.org/C2781249084","wikidata":"https://www.wikidata.org/wiki/Q908656","display_name":"Preference","level":2,"score":0.2628999948501587},{"id":"https://openalex.org/C168031717","wikidata":"https://www.wikidata.org/wiki/Q1530280","display_name":"Balance (ability)","level":2,"score":0.26159998774528503},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2540000081062317},{"id":"https://openalex.org/C105002631","wikidata":"https://www.wikidata.org/wiki/Q4833645","display_name":"Subject-matter expert","level":3,"score":0.25369998812675476},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.2515999972820282},{"id":"https://openalex.org/C24756922","wikidata":"https://www.wikidata.org/wiki/Q1757694","display_name":"Data quality","level":3,"score":0.250900000333786},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.2506999969482422}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.13506","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.13506","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.13506","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.13506","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,25,57,92,97,107,134],"advancement":[2],"of":[3,28,59,95],"video":[4],"generation":[5,77],"foundation":[6,73],"models":[7,74,216],"(VGFMs),":[8],"customized":[9],"generation,":[10],"particularly":[11],"subject-to-video":[12],"(S2V),":[13],"has":[14],"attracted":[15],"growing":[16],"attention.":[17],"However,":[18],"a":[19,29,67,79,111,116,144,193],"key":[20],"challenge":[21],"lies":[22],"in":[23],"balancing":[24],"intrinsic":[26,83],"priors":[27],"VGFM,":[30],"such":[31],"as":[32,78,106],"motion":[33],"coherence,":[34],"visual":[35],"aesthetics,":[36],"and":[37,86,109,122,153,158,178,183,202,213],"prompt":[38],"alignment,":[39],"with":[40,138],"its":[41,139],"newly":[42],"derived":[43],"S2V":[44,76,87,140,215],"capability.":[45,88],"Existing":[46],"methods":[47],"often":[48],"neglect":[49],"this":[50,187],"balance":[51,80],"by":[52,91],"enhancing":[53],"one":[54],"aspect":[55],"at":[56],"expense":[58],"others.":[60],"To":[61,131],"address":[62],"this,":[63],"we":[64,102,142,191],"propose":[65],"LibraGen,":[66],"novel":[68],"framework":[69],"that":[70,119,208],"views":[71],"extending":[72],"for":[75],"game":[81],"between":[82],"VGFM":[84],"strengths":[85],"Specifically,":[89],"guided":[90],"core":[93],"philosophy":[94],"\"Raising":[96],"Fulcrum,":[98],"Tuning":[99],"to":[100,126,163,185,199],"Balance,\"":[101],"identify":[103],"data":[104,124,129,155],"quality":[105],"fulcrum":[108],"advocate":[110],"quality-over-quantity":[112],"approach.":[113],"We":[114],"construct":[115],"hybrid":[117],"pipeline":[118],"combines":[120],"automated":[121],"manual":[123],"filtering":[125],"improve":[127],"overall":[128],"quality.":[130],"further":[132],"harmonize":[133],"VGFM's":[135],"native":[136],"capabilities":[137],"extension,":[141],"introduce":[143,192],"Tune-to-Balance":[145],"post-training":[146],"paradigm.":[147],"During":[148,189],"supervised":[149],"fine-tuning,":[150],"both":[151,211],"cross-pair":[152],"in-pair":[154],"are":[156,181],"incorporated,":[157],"model":[159],"merging":[160],"is":[161],"employed":[162],"achieve":[164],"an":[165],"effective":[166],"trade-off.":[167],"Subsequently,":[168],"two":[169],"tailored":[170],"direct":[171],"preference":[172],"optimization":[173],"(DPO)":[174],"pipelines,":[175],"namely":[176],"Consis-DPO":[177],"Real-Fake":[179],"DPO,":[180],"designed":[182],"merged":[184],"consolidate":[186],"balance.":[188],"inference,":[190],"time-dependent":[194],"dynamic":[195],"classifier-free":[196],"guidance":[197],"scheme":[198],"enable":[200],"flexible":[201],"fine-grained":[203],"control.":[204],"Experimental":[205],"results":[206],"demonstrate":[207],"LibraGen":[209],"outperforms":[210],"open-source":[212],"commercial":[214],"using":[217],"only":[218],"thousand-scale":[219],"training":[220],"data.":[221]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2026-03-18T00:00:00"}
