{"id":"https://openalex.org/W4409076630","doi":"https://doi.org/10.1109/tcsvt.2025.3556868","title":"Progressive Human Motion Generation Based on Text and Few Motion Frames","display_name":"Progressive Human Motion Generation Based on Text and Few Motion Frames","publication_year":2025,"publication_date":"2025-04-01","ids":{"openalex":"https://openalex.org/W4409076630","doi":"https://doi.org/10.1109/tcsvt.2025.3556868"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2025.3556868","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3556868","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2503.13300","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5079634733","display_name":"Ling-An Zeng","orcid":"https://orcid.org/0000-0002-8125-8024"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ling-An Zeng","raw_affiliation_strings":["School of Artificial Intelligence, Sun Yat-sen University, Zhuhai, Guangdong, China"],"raw_orcid":"https://orcid.org/0000-0002-8125-8024","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Sun Yat-sen University, Zhuhai, Guangdong, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101900911","display_name":"Gaojie Wu","orcid":"https://orcid.org/0000-0002-0752-8508"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Gaojie Wu","raw_affiliation_strings":["School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, Guangdong, China"],"raw_orcid":"https://orcid.org/0000-0002-0752-8508","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, Guangdong, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049519486","display_name":"Ancong Wu","orcid":"https://orcid.org/0000-0002-7969-3190"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ancong Wu","raw_affiliation_strings":["School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, Guangdong, China"],"raw_orcid":"https://orcid.org/0000-0002-7969-3190","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, Guangdong, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102336058","display_name":"Jian\u2013Fang Hu","orcid":"https://orcid.org/0009-0005-2678-5373"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian-Fang Hu","raw_affiliation_strings":["School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, Guangdong, China"],"raw_orcid":"https://orcid.org/0009-0005-2678-5373","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, Guangdong, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108050904","display_name":"Wei\u2010Shi Zheng","orcid":"https://orcid.org/0000-0001-8327-0003"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei-Shi Zheng","raw_affiliation_strings":["School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China","School of Computer Science and Engineering, Sun Yat-sen University, China"],"raw_orcid":"https://orcid.org/0000-0001-8327-0003","affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]},{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, China","institution_ids":["https://openalex.org/I157773358"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.8084,"has_fulltext":true,"cited_by_count":2,"citation_normalized_percentile":{"value":0.83725533,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"35","issue":"9","first_page":"9205","last_page":"9217"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9887999892234802,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6095041632652283},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5920031070709229},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5857704877853394},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5775144100189209},{"id":"https://openalex.org/keywords/motion-estimation","display_name":"Motion estimation","score":0.5131019353866577},{"id":"https://openalex.org/keywords/computer-graphics","display_name":"Computer graphics (images)","score":0.33987557888031006}],"concepts":[{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6095041632652283},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5920031070709229},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5857704877853394},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5775144100189209},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.5131019353866577},{"id":"https://openalex.org/C121684516","wikidata":"https://www.wikidata.org/wiki/Q7600677","display_name":"Computer graphics (images)","level":1,"score":0.33987557888031006}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tcsvt.2025.3556868","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3556868","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2503.13300","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.13300","pdf_url":"https://arxiv.org/pdf/2503.13300","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2503.13300","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.13300","pdf_url":"https://arxiv.org/pdf/2503.13300","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.41999998688697815,"display_name":"Gender equality","id":"https://metadata.un.org/sdg/5"}],"awards":[{"id":"https://openalex.org/G1702828313","display_name":null,"funder_award_id":"U21A20471","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1730722784","display_name":null,"funder_award_id":"2023B1515040025","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3581596628","display_name":null,"funder_award_id":"2023YFA1008503","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G8949795292","display_name":null,"funder_award_id":"92470202","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W2474702929","https://openalex.org/W2889227713","https://openalex.org/W2982625143","https://openalex.org/W3006410788","https://openalex.org/W3044275224","https://openalex.org/W3048474702","https://openalex.org/W3120595940","https://openalex.org/W3144253442","https://openalex.org/W4210375380","https://openalex.org/W4286611287","https://openalex.org/W4297981470","https://openalex.org/W4312936899","https://openalex.org/W4381713281","https://openalex.org/W4385245566","https://openalex.org/W4386065848","https://openalex.org/W4386076288","https://openalex.org/W4386076405","https://openalex.org/W4389575066","https://openalex.org/W4390730260","https://openalex.org/W4390872247","https://openalex.org/W4390874125","https://openalex.org/W4390874263","https://openalex.org/W4390874627","https://openalex.org/W4391305822","https://openalex.org/W4401210548","https://openalex.org/W4401507000","https://openalex.org/W4402716136","https://openalex.org/W4402727037","https://openalex.org/W4402727046","https://openalex.org/W4402754111","https://openalex.org/W4403562310","https://openalex.org/W4403808867","https://openalex.org/W4403842319","https://openalex.org/W4403878062","https://openalex.org/W4404600557","https://openalex.org/W4404725561","https://openalex.org/W4404879538","https://openalex.org/W4404893135","https://openalex.org/W4409366151"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Although":[0],"existing":[1,192],"text-to-motion":[2],"(T2M)":[3],"methods":[4,195],"can":[5],"produce":[6],"realistic":[7],"human":[8],"motion":[9,21,54,119],"from":[10,74,120],"text":[11,28,75],"description,":[12],"it":[13],"is":[14,30,45,86,98,212],"still":[15],"difficult":[16],"to":[17,46,50,71,87,115,126,162],"align":[18],"the":[19,23,48,82,91,93,121,151,164,206],"generated":[20,140,157,173],"with":[22,123,128,200],"desired":[24,58],"postures":[25],"since":[26],"using":[27],"alone":[29],"insufficient":[31],"for":[32,183],"precisely":[33],"describing":[34,56],"diverse":[35],"postures.":[36,59],"To":[37],"achieve":[38],"more":[39],"controllable":[40],"generation,":[41],"an":[42],"intuitive":[43],"way":[44],"allow":[47],"user":[49],"input":[51],"a":[52,63,84,88,108,118,142,179,197],"few":[53,78],"frames":[55,122,138,156,174],"precise":[57],"Thus,":[60],"we":[61,106,177],"explore":[62],"new":[64,137],"Text-Frame-to-Motion":[65],"(TF2M)":[66],"generation":[67,194],"task":[68],"that":[69,188],"aims":[70],"generate":[72,117],"motions":[73],"and":[76,155],"very":[77],"given":[79,89,103,153,203],"frames.":[80],"Intuitively,":[81],"closer":[83],"frame":[85,97],"frame,":[90,204],"lower":[92],"uncertainty":[94,125,130],"of":[95,150,171,208],"this":[96,102],"when":[99],"conditioned":[100,146],"on":[101,147],"frame.":[104],"Hence,":[105],"propose":[107,178],"novel":[109],"Progressive":[110],"Motion":[111],"Generation":[112],"(PMG)":[113],"method":[114],"progressively":[116],"low":[124],"those":[127],"high":[129],"in":[131,158],"multiple":[132],"stages.":[133,160],"During":[134],"each":[135],"stage,":[136],"are":[139],"by":[141,168,196],"Text-Frame":[143],"Guided":[144],"Generator":[145],"frame-aware":[148],"semantics":[149],"text,":[152],"frames,":[154],"previous":[159],"Additionally,":[161],"alleviate":[163],"train-test":[165],"gap":[166],"caused":[167],"multi-stage":[169],"accumulation":[170],"incorrectly":[172],"during":[175],"testing,":[176],"Pseudo-frame":[180],"Replacement":[181],"Strategy":[182],"training.":[184],"Experimental":[185],"results":[186],"show":[187],"our":[189,209],"PMG":[190],"outperforms":[191],"T2M":[193],"large":[198],"margin":[199],"even":[201],"one":[202],"validating":[205],"effectiveness":[207],"PMG.":[210],"Code":[211],"available":[213],"here.":[214]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
