{"id":"https://openalex.org/W4417159285","doi":"https://doi.org/10.1109/iccv51701.2025.01226","title":"Align Your Rhythm: Generating Highly Aligned Dance Poses with Gating-Enhanced Rhythm-Aware Feature Representation","display_name":"Align Your Rhythm: Generating Highly Aligned Dance Poses with Gating-Enhanced Rhythm-Aware Feature Representation","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4417159285","doi":"https://doi.org/10.1109/iccv51701.2025.01226"},"language":"en","primary_location":{"id":"doi:10.1109/iccv51701.2025.01226","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.01226","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2503.17340","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Congyi Fan","orcid":null},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Congyi Fan","raw_affiliation_strings":["College of Computer Science and Technology, Harbin Engineering University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Harbin Engineering University,China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101669069","display_name":"Jian Guan","orcid":"https://orcid.org/0000-0002-5069-240X"},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Guan","raw_affiliation_strings":["College of Computer Science and Technology, Harbin Engineering University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Harbin Engineering University,China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114125453","display_name":"Xuanjia Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuanjia Zhao","raw_affiliation_strings":["College of Computer Science and Technology, Harbin Engineering University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Harbin Engineering University,China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100778603","display_name":"Dan Xu","orcid":"https://orcid.org/0000-0003-4602-3550"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dongli Xu","raw_affiliation_strings":["Shanghai Academy of Artificial Intelligence for Science,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Shanghai Academy of Artificial Intelligence for Science,China","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056639653","display_name":"Youtian Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I36399199","display_name":"Nanjing University of Science and Technology","ror":"https://ror.org/00xp9wg62","country_code":"CN","type":"education","lineage":["https://openalex.org/I36399199"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Youtian Lin","raw_affiliation_strings":["School of Intelligence Science and Technology, Nanjing University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Intelligence Science and Technology, Nanjing University,China","institution_ids":["https://openalex.org/I36399199"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101446238","display_name":"Tong Ye","orcid":"https://orcid.org/0000-0003-3812-3105"},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tong Ye","raw_affiliation_strings":["College of Computer Science and Technology, Harbin Engineering University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Harbin Engineering University,China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041045446","display_name":"Pengming Feng","orcid":"https://orcid.org/0000-0001-5853-8100"},"institutions":[{"id":"https://openalex.org/I4210148107","display_name":"Space Engineering University","ror":"https://ror.org/04rj1td02","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210148107"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengming Feng","raw_affiliation_strings":["State Key Laboratory of Space-Ground Integrated Information Technology,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Space-Ground Integrated Information Technology,China","institution_ids":["https://openalex.org/I4210148107"]}]},{"author_position":"last","author":{"id":null,"display_name":"Haiwei Pan","orcid":null},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haiwei Pan","raw_affiliation_strings":["College of Computer Science and Technology, Harbin Engineering University,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Harbin Engineering University,China","institution_ids":["https://openalex.org/I151727225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I151727225"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.45175563,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"13193","last_page":"13202"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.91839998960495,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.91839998960495,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.022600000724196434,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.011699999682605267,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dance","display_name":"Dance","score":0.8953999876976013},{"id":"https://openalex.org/keywords/rhythm","display_name":"Rhythm","score":0.8216000199317932},{"id":"https://openalex.org/keywords/naturalness","display_name":"Naturalness","score":0.7318999767303467},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5315999984741211},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4959999918937683},{"id":"https://openalex.org/keywords/melody","display_name":"Melody","score":0.491100013256073},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.48019999265670776},{"id":"https://openalex.org/keywords/musical","display_name":"Musical","score":0.444599986076355}],"concepts":[{"id":"https://openalex.org/C147446459","wikidata":"https://www.wikidata.org/wiki/Q11639","display_name":"Dance","level":2,"score":0.8953999876976013},{"id":"https://openalex.org/C135343436","wikidata":"https://www.wikidata.org/wiki/Q170406","display_name":"Rhythm","level":2,"score":0.8216000199317932},{"id":"https://openalex.org/C134537474","wikidata":"https://www.wikidata.org/wiki/Q17144832","display_name":"Naturalness","level":2,"score":0.7318999767303467},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6492999792098999},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5422000288963318},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5315999984741211},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4959999918937683},{"id":"https://openalex.org/C43803900","wikidata":"https://www.wikidata.org/wiki/Q170412","display_name":"Melody","level":3,"score":0.491100013256073},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.48019999265670776},{"id":"https://openalex.org/C558565934","wikidata":"https://www.wikidata.org/wiki/Q2743","display_name":"Musical","level":2,"score":0.444599986076355},{"id":"https://openalex.org/C189809214","wikidata":"https://www.wikidata.org/wiki/Q829522","display_name":"Beat (acoustics)","level":2,"score":0.4415999948978424},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.44130000472068787},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4171999990940094},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4156999886035919},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3734000027179718},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.33489999175071716},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.33219999074935913},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.31380000710487366},{"id":"https://openalex.org/C89805583","wikidata":"https://www.wikidata.org/wiki/Q192940","display_name":"Accelerometer","level":2,"score":0.2937999963760376},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.28859999775886536},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.287200003862381},{"id":"https://openalex.org/C183920142","wikidata":"https://www.wikidata.org/wiki/Q180856","display_name":"Choreography","level":3,"score":0.2849000096321106},{"id":"https://openalex.org/C2777946086","wikidata":"https://www.wikidata.org/wiki/Q1163335","display_name":"Music information retrieval","level":3,"score":0.28360000252723694},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.272599995136261},{"id":"https://openalex.org/C542774811","wikidata":"https://www.wikidata.org/wiki/Q10880526","display_name":"Prosody","level":2,"score":0.26809999346733093},{"id":"https://openalex.org/C2780226923","wikidata":"https://www.wikidata.org/wiki/Q929848","display_name":"Movement (music)","level":2,"score":0.25110000371932983}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iccv51701.2025.01226","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.01226","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2503.17340","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.17340","pdf_url":"https://arxiv.org/pdf/2503.17340","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2503.17340","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2503.17340","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2503.17340","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2503.17340","pdf_url":"https://arxiv.org/pdf/2503.17340","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Automatically":[0],"generating":[1,21],"natural,":[2],"diverse":[3],"and":[4,17,37,95,135,147,166],"rhythmic":[5,72,84,111,164],"human":[6],"dance":[7,22,62,68,115,151],"movements":[8,116],"driven":[9],"by":[10],"music":[11,26],"is":[12],"vital":[13],"for":[14,60],"virtual":[15],"reality":[16],"film":[18],"industries.":[19],"However,":[20],"that":[23,51,114,156],"naturally":[24],"follows":[25],"remains":[27],"a":[28,48],"challenge,":[29],"as":[30],"existing":[31],"methods":[32],"lack":[33],"proper":[34],"beat":[35],"alignment":[36,165],"exhibit":[38],"unnatural":[39],"motion":[40,167],"dynamics.":[41],"In":[42],"this":[43],"paper,":[44],"we":[45,75,101],"propose":[46,102],"Danceba,":[47],"novel":[49],"framework":[50],"leverages":[52],"gating":[53],"mechanism":[54],"to":[55,81,107,131],"enhance":[56],"rhythm-aware":[57],"feature":[58],"representation":[59],"music-driven":[61],"generation,":[63],"which":[64],"achieves":[65],"highly":[66],"aligned":[67],"poses":[69],"with":[70,140],"enhanced":[71],"sensitivity.":[73],"Specifically,":[74],"introduce":[76,124],"Phase-Based":[77],"Rhythm":[78],"Extraction":[79],"(PRE)":[80],"precisely":[82],"extract":[83],"information":[85],"from":[86],"musical":[87,120,141],"phase":[88],"data,":[89],"capitalizing":[90],"on":[91,109],"the":[92,119,145],"intrinsic":[93],"periodicity":[94],"temporal":[96],"structures":[97],"of":[98,149],"music.":[99],"Additionally,":[100],"Temporal-Gated":[103],"Causal":[104],"Attention":[105],"(TGCA)":[106],"focus":[108],"global":[110],"features,":[112,142],"ensuring":[113],"closely":[117],"follow":[118],"rhythm.":[121],"We":[122],"also":[123],"Parallel":[125],"Mamba":[126],"Motion":[127],"Modeling":[128],"(PMMM)":[129],"architecture":[130],"separately":[132],"model":[133],"upper":[134],"lower":[136],"body":[137],"motions":[138],"along":[139],"thereby":[143],"improving":[144],"naturalness":[146],"diversity":[148],"generated":[150],"movements.":[152],"Extensive":[153],"experiments":[154],"confirm":[155],"Danceba":[157],"outperforms":[158],"state-of-the-art":[159],"methods,":[160],"achieving":[161],"significantly":[162],"better":[163],"diversity.":[168],"Project":[169],"page:":[170],"https://danceba.github.io/":[171],".":[172]},"counts_by_year":[],"updated_date":"2026-05-06T06:03:25.996018","created_date":"2025-10-10T00:00:00"}
