{"id":"https://openalex.org/W4392182697","doi":"https://doi.org/10.48550/arxiv.2402.15509","title":"Seamless Human Motion Composition with Blended Positional Encodings","display_name":"Seamless Human Motion Composition with Blended Positional Encodings","publication_year":2024,"publication_date":"2024-02-23","ids":{"openalex":"https://openalex.org/W4392182697","doi":"https://doi.org/10.48550/arxiv.2402.15509"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2402.15509","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.15509","pdf_url":"https://arxiv.org/pdf/2402.15509","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2402.15509","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030892971","display_name":"Germ\u00e1n Barquero","orcid":"https://orcid.org/0000-0001-8381-3549"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Barquero, German","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038228433","display_name":"S\u00e9rgio Escalera","orcid":"https://orcid.org/0000-0003-0617-8873"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Escalera, Sergio","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5056906303","display_name":"Cristina Palmero","orcid":"https://orcid.org/0000-0002-6085-6527"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Palmero, Cristina","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5030892971"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/composition","display_name":"Composition (language)","score":0.6353772878646851},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.6013182997703552},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.49408963322639465},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3590278923511505},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3455347418785095},{"id":"https://openalex.org/keywords/art","display_name":"Art","score":0.09460476040840149}],"concepts":[{"id":"https://openalex.org/C40231798","wikidata":"https://www.wikidata.org/wiki/Q1333743","display_name":"Composition (language)","level":2,"score":0.6353772878646851},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.6013182997703552},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.49408963322639465},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3590278923511505},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3455347418785095},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.09460476040840149},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2402.15509","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.15509","pdf_url":"https://arxiv.org/pdf/2402.15509","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"doi:10.48550/arxiv.2402.15509","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2402.15509","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2402.15509","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.15509","pdf_url":"https://arxiv.org/pdf/2402.15509","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4392182697.pdf","grobid_xml":"https://content.openalex.org/works/W4392182697.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2772917594","https://openalex.org/W2775347418","https://openalex.org/W1969923398","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2079911747","https://openalex.org/W2170022336"],"abstract_inverted_index":{"Conditional":[0],"human":[1],"motion":[2,24,107,156],"generation":[3,45],"is":[4,109],"an":[5],"important":[6],"topic":[7],"with":[8,150],"many":[9],"applications":[10],"in":[11,34,100,133],"virtual":[12],"reality,":[13],"gaming,":[14],"and":[15,96,117,138,143,191],"robotics.":[16],"While":[17],"prior":[18],"works":[19],"have":[20],"focused":[21],"on":[22,140],"generating":[23],"guided":[25,50],"by":[26,51],"text,":[27],"music,":[28],"or":[29,78],"scenes,":[30],"these":[31],"typically":[32],"result":[33],"isolated":[35],"motions":[36],"confined":[37],"to":[38,159,175,197],"short":[39],"durations.":[40],"Instead,":[41],"we":[42,61,84,129,183],"address":[43,176],"the":[44,64,86,101,112,123,141,177,188,192,195],"of":[46,54,135,179],"long,":[47],"continuous":[48],"sequences":[49],"a":[52,90,127,152],"series":[53],"varying":[55,168],"textual":[56],"descriptions.":[57],"In":[58],"this":[59],"context,":[60],"introduce":[62,85],"FlowMDM,":[63],"first":[65],"diffusion-based":[66],"model":[67],"that":[68,92],"generates":[69],"seamless":[70],"Human":[71],"Motion":[72],"Compositions":[73],"(HMC)":[74],"without":[75],"any":[76],"postprocessing":[77],"redundant":[79],"denoising":[80,102],"steps.":[81],"For":[82],"this,":[83],"Blended":[87],"Positional":[88],"Encodings,":[89],"technique":[91],"leverages":[93],"both":[94],"absolute":[95,113],"relative":[97,124],"positional":[98],"encodings":[99],"chain.":[103],"More":[104],"specifically,":[105],"global":[106],"coherence":[108],"recovered":[110],"at":[111,122,171],"stage,":[114],"whereas":[115],"smooth":[116],"realistic":[118],"transitions":[119],"are":[120],"built":[121],"stage.":[125],"As":[126],"result,":[128],"achieve":[130],"state-of-the-art":[131],"results":[132],"terms":[134],"accuracy,":[136],"realism,":[137],"smoothness":[139],"Babel":[142],"HumanML3D":[144],"datasets.":[145],"FlowMDM":[146],"excels":[147],"when":[148],"trained":[149],"only":[151],"single":[153],"description":[154],"per":[155],"sequence":[157],"thanks":[158],"its":[160],"Pose-Centric":[161],"Cross-ATtention,":[162],"which":[163],"makes":[164],"it":[165],"robust":[166],"against":[167],"text":[169],"descriptions":[170],"inference":[172],"time.":[173],"Finally,":[174],"limitations":[178],"existing":[180],"HMC":[181],"metrics,":[182],"propose":[184],"two":[185],"new":[186],"metrics:":[187],"Peak":[189],"Jerk":[190],"Area":[193],"Under":[194],"Jerk,":[196],"detect":[198],"abrupt":[199],"transitions.":[200]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-10T00:00:00"}
