{"id":"https://openalex.org/W4408324833","doi":"https://doi.org/10.1109/icassp49660.2025.10890233","title":"Follow-Your-MultiPose: Tuning-Free Multi-Character Text-to-Video Generation via Pose Guidance","display_name":"Follow-Your-MultiPose: Tuning-Free Multi-Character Text-to-Video Generation via Pose Guidance","publication_year":2025,"publication_date":"2025-03-11","ids":{"openalex":"https://openalex.org/W4408324833","doi":"https://doi.org/10.1109/icassp49660.2025.10890233"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10890233","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890233","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Beiyuan Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Beiyuan Zhang","raw_affiliation_strings":["School of Big Data and Software Engineering, Chongqing University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"School of Big Data and Software Engineering, Chongqing University, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Yue Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I889458895","display_name":"University of Hong Kong","ror":"https://ror.org/02zhqgq86","country_code":"HK","type":"education","lineage":["https://openalex.org/I889458895"]},{"id":"https://openalex.org/I200769079","display_name":"Hong Kong University of Science and Technology","ror":"https://ror.org/00q4vv597","country_code":"HK","type":"education","lineage":["https://openalex.org/I200769079"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Yue Ma","raw_affiliation_strings":["Computer Science Engineer, The Hong Kong University of Science and Technology, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Computer Science Engineer, The Hong Kong University of Science and Technology, Hong Kong","institution_ids":["https://openalex.org/I200769079","https://openalex.org/I889458895"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Chunlei Fu","orcid":null},"institutions":[{"id":"https://openalex.org/I158842170","display_name":"Chongqing University","ror":"https://ror.org/023rhb549","country_code":"CN","type":"education","lineage":["https://openalex.org/I158842170"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunlei Fu","raw_affiliation_strings":["School of Big Data and Software Engineering, Chongqing University, Chongqing, China"],"affiliations":[{"raw_affiliation_string":"School of Big Data and Software Engineering, Chongqing University, Chongqing, China","institution_ids":["https://openalex.org/I158842170"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xinyang Song","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinyang Song","raw_affiliation_strings":["School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China;  New Laboratory of Pattern Recognition (NLPR), Institute of Automation, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China;  New Laboratory of Pattern Recognition (NLPR), Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zhenan Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhenan Sun","raw_affiliation_strings":["School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China\n4 New Laboratory of Pattern Recognition (NLPR), Institute of Automation, Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences, Beijing, China\n4 New Laboratory of Pattern Recognition (NLPR), Institute of Automation, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150"]}]},{"author_position":"last","author":{"id":null,"display_name":"Ziqiang Li","orcid":null},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziqiang Li","raw_affiliation_strings":["Department of Computer Science and Engineering, Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I158842170"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.08664353,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12667","display_name":"Economic and Technological Developments in Russia","score":0.1890999972820282,"subfield":{"id":"https://openalex.org/subfields/3303","display_name":"Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12667","display_name":"Economic and Technological Developments in Russia","score":0.1890999972820282,"subfield":{"id":"https://openalex.org/subfields/3303","display_name":"Development"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T14470","display_name":"Advanced Data Processing Techniques","score":0.1762000024318695,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/circuit-breaker","display_name":"Circuit breaker","score":0.8285095691680908},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.513496458530426},{"id":"https://openalex.org/keywords/electrical-engineering","display_name":"Electrical engineering","score":0.2556072473526001},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.2011183798313141}],"concepts":[{"id":"https://openalex.org/C61352017","wikidata":"https://www.wikidata.org/wiki/Q211058","display_name":"Circuit breaker","level":2,"score":0.8285095691680908},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.513496458530426},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.2556072473526001},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2011183798313141}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10890233","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10890233","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W2984529706","https://openalex.org/W3081727869","https://openalex.org/W3096831136","https://openalex.org/W3153469116","https://openalex.org/W4312881655","https://openalex.org/W4312933868","https://openalex.org/W4386076520","https://openalex.org/W4390190334","https://openalex.org/W4390871780","https://openalex.org/W4390872556","https://openalex.org/W4390872896","https://openalex.org/W4390873054","https://openalex.org/W4390873135","https://openalex.org/W4390873195","https://openalex.org/W4390874168","https://openalex.org/W4393148505","https://openalex.org/W4393148714","https://openalex.org/W4404965490","https://openalex.org/W4409262178","https://openalex.org/W4409369698","https://openalex.org/W6767264202","https://openalex.org/W6809885388","https://openalex.org/W6810940779","https://openalex.org/W6838639034","https://openalex.org/W6854463369","https://openalex.org/W6854866820","https://openalex.org/W6856518728","https://openalex.org/W6862585284","https://openalex.org/W6862589453","https://openalex.org/W6869101536","https://openalex.org/W6872690837","https://openalex.org/W6874599112"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2186957643","https://openalex.org/W4313289174","https://openalex.org/W2169296235","https://openalex.org/W2383147444","https://openalex.org/W2772771794","https://openalex.org/W2370462073","https://openalex.org/W2351129194"],"abstract_inverted_index":{"Text-editable":[0],"and":[1,60,81,101],"pose-controllable":[2],"character":[3,67,87],"video":[4,22,46,118],"generation":[5,23,47],"is":[6,54],"a":[7,36,43,50],"challenging":[8],"but":[9],"prevailing":[10],"topic":[11],"with":[12,24,90,157],"practical":[13],"applications.":[14],"However,":[15],"existing":[16],"approaches":[17],"mainly":[18],"focus":[19],"on":[20,56],"single-object":[21],"pose":[25,61,71],"guidance,":[26],"ignoring":[27],"the":[28,57,70,75,97,120,132,146],"realistic":[29],"situation":[30],"that":[31,150],"multi-character":[32,45,111],"appear":[33],"concurrently":[34],"in":[35,49],"scenario.":[37],"To":[38],"tackle":[39],"this,":[40],"we":[41,64],"propose":[42],"novel":[44],"framework":[48],"tuning-free":[51],"manner,":[52],"which":[53],"based":[55],"separated":[58],"text":[59,94],"guidance.":[62,95],"Specifically,":[63],"first":[65],"extract":[66],"masks":[68],"from":[69],"sequence":[72],"to":[73,107,140],"identify":[74],"spatial":[76],"position":[77],"for":[78,85,92,126],"each":[79,86],"character,":[80],"then":[82],"single":[83],"prompts":[84],"are":[88,105],"obtained":[89],"LLMs":[91],"precise":[93,121],"Moreover,":[96,145],"spatial-aligned":[98],"cross":[99],"attention":[100],"multi-branch":[102],"control":[103],"module":[104],"proposed":[106],"generate":[108],"fine-grained":[109],"controllable":[110],"video.":[112],"The":[113],"visualized":[114],"results":[115,148],"of":[116,123,134],"generating":[117],"demonstrate":[119],"controllability":[122],"our":[124,135,151],"method":[125,136],"multicharacter":[127],"generation.":[128],"We":[129],"also":[130],"verify":[131],"generality":[133],"by":[137],"applying":[138],"it":[139],"various":[141],"personalized":[142],"T2I":[143],"models.":[144],"quantitative":[147],"show":[149],"approach":[152],"achieves":[153],"superior":[154],"performance":[155],"compared":[156],"previous":[158],"works.":[159]},"counts_by_year":[],"updated_date":"2025-12-21T01:58:51.020947","created_date":"2025-03-12T00:00:00"}
