{"id":"https://openalex.org/W4372260409","doi":"https://doi.org/10.1109/icassp49357.2023.10096666","title":"Retrieval-Based Natural 3D Human Motion Generation","display_name":"Retrieval-Based Natural 3D Human Motion Generation","publication_year":2023,"publication_date":"2023-05-05","ids":{"openalex":"https://openalex.org/W4372260409","doi":"https://doi.org/10.1109/icassp49357.2023.10096666"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49357.2023.10096666","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10096666","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035994850","display_name":"Zehan Tan","orcid":"https://orcid.org/0000-0002-0931-8985"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zehan Tan","raw_affiliation_strings":["Fudan University,School of Computer Science,Shanghai,China","School of Computer Science, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University,School of Computer Science,Shanghai,China","institution_ids":["https://openalex.org/I24943067"]},{"raw_affiliation_string":"School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101865874","display_name":"Weidong Yang","orcid":"https://orcid.org/0000-0002-6473-9272"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weidong Yang","raw_affiliation_strings":["Fudan University,School of Computer Science,Shanghai,China","School of Computer Science, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University,School of Computer Science,Shanghai,China","institution_ids":["https://openalex.org/I24943067"]},{"raw_affiliation_string":"School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101874714","display_name":"Shuai Wu","orcid":"https://orcid.org/0009-0007-5824-6846"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuai Wu","raw_affiliation_strings":["Fudan University,School of Computer Science,Shanghai,China","School of Computer Science, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University,School of Computer Science,Shanghai,China","institution_ids":["https://openalex.org/I24943067"]},{"raw_affiliation_string":"School of Computer Science, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5035994850"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.03663693,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9883999824523926,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8311477303504944},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.6991340517997742},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6554040908813477},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6445170640945435},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5710157155990601},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5611506700515747},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5276119709014893},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4599195718765259},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.43244582414627075}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8311477303504944},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.6991340517997742},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6554040908813477},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6445170640945435},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5710157155990601},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5611506700515747},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5276119709014893},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4599195718765259},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.43244582414627075},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49357.2023.10096666","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49357.2023.10096666","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2023 - 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W2101032778","https://openalex.org/W2152984213","https://openalex.org/W2474702929","https://openalex.org/W2614519765","https://openalex.org/W2780124704","https://openalex.org/W2862846329","https://openalex.org/W2897492344","https://openalex.org/W2982625143","https://openalex.org/W2997510589","https://openalex.org/W3090839706","https://openalex.org/W3102619627","https://openalex.org/W3124346429","https://openalex.org/W3125772723","https://openalex.org/W3153832461","https://openalex.org/W3176252609","https://openalex.org/W3181695292","https://openalex.org/W4206332913","https://openalex.org/W4288079574","https://openalex.org/W4312635677","https://openalex.org/W6770208262","https://openalex.org/W6912820848"],"related_works":["https://openalex.org/W2081900870","https://openalex.org/W4295532600","https://openalex.org/W2063823869","https://openalex.org/W2047973478","https://openalex.org/W2067569035","https://openalex.org/W4390516098","https://openalex.org/W2090985514","https://openalex.org/W2181948922","https://openalex.org/W2384362569","https://openalex.org/W2113666009"],"abstract_inverted_index":{"It":[0],"is":[1,126,165],"challenging":[2],"to":[3,41,141],"generate":[4],"3D":[5,78],"human":[6],"motions":[7,17,79,121],"automatically":[8],"from":[9,122],"text.":[10,62,134],"In":[11,63],"an":[12],"ideal":[13],"scenario,":[14],"the":[15,20,27,30,56,90,94,97,109,118,123,129,138,143,147,154,183],"generated":[16,149],"should":[18],"explore":[19],"text-grounded":[21],"motion":[22,59,73,104,140],"space":[23],"while":[24],"accurately":[25],"depicting":[26],"content":[28],"in":[29,45],"prescribed":[31],"text":[32],"descriptions.":[33],"Text2length":[34],"and":[35,61,75,160,172],"text2motion":[36],"training":[37,124],"have":[38],"been":[39],"used":[40],"address":[42],"this":[43,64],"problem":[44],"previous":[46,91,115],"research.":[47],"There":[48],"is,":[49],"however,":[50],"a":[51,84,101,133,168],"lack":[52],"of":[53,93,100,114,156],"knowledge":[54],"about":[55],"relationship":[57],"between":[58],"length":[60],"work,":[65],"context-aware":[66,85],"retrieval-based":[67],"approaches":[68],"are":[69],"proposed":[70],"for":[71,146],"predicting":[72],"lengths":[74],"generating":[76],"proper":[77],"(C-MO).":[80],"Specifically,":[81],"we":[82,136],"train":[83],"encoder-decoder":[86],"model":[87,110,131],"that":[88,108,177],"uses":[89],"output":[92],"decoder":[95],"or":[96],"embedding":[98],"vector":[99],"ground":[102],"truth":[103],"as":[105],"context":[106],"so":[107],"becomes":[111],"increasingly":[112],"aware":[113],"alignments.":[116],"Retrieving":[117],"most":[119],"similar":[120],"set":[125],"based":[127],"on":[128,167],"trained":[130],"given":[132],"Finally,":[135],"use":[137],"retrieval":[139,159],"guide":[142],"probability":[144],"distribution":[145],"final":[148],"motions.":[150],"Our":[151],"method":[152],"combines":[153],"advantages":[155],"both":[157],"information":[158],"neural":[161],"machine":[162],"translation.":[163],"C-MO":[164],"evaluated":[166],"large-scale":[169],"dataset,":[170],"KIT,":[171],"its":[173],"experimental":[174],"results":[175],"show":[176],"it":[178],"achieves":[179],"great":[180],"improvements":[181],"over":[182],"state-of-the-art.":[184]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
