{"id":"https://openalex.org/W2977816919","doi":"https://doi.org/10.1109/ijcnn.2019.8851872","title":"Weakly-Supervised Deep Recurrent Neural Networks for Basic Dance Step Generation","display_name":"Weakly-Supervised Deep Recurrent Neural Networks for Basic Dance Step Generation","publication_year":2019,"publication_date":"2019-07-01","ids":{"openalex":"https://openalex.org/W2977816919","doi":"https://doi.org/10.1109/ijcnn.2019.8851872","mag":"2977816919"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn.2019.8851872","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2019.8851872","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112575316","display_name":"Nelson Yalta","orcid":null},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Nelson Yalta","raw_affiliation_strings":["Department of Intermedia Art and Science, Waseda University, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Intermedia Art and Science, Waseda University, Tokyo, Japan","institution_ids":["https://openalex.org/I150744194"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001291873","display_name":"Shinji Watanabe","orcid":"https://orcid.org/0000-0002-5970-8631"},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shinji Watanabe","raw_affiliation_strings":["Johns Hopkins University, Baltimore, USA"],"affiliations":[{"raw_affiliation_string":"Johns Hopkins University, Baltimore, USA","institution_ids":["https://openalex.org/I145311948"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091708408","display_name":"Kazuhiro Nakadai","orcid":"https://orcid.org/0000-0002-6134-4558"},"institutions":[{"id":"https://openalex.org/I1283473643","display_name":"Honda (Japan)","ror":"https://ror.org/03jzay846","country_code":"JP","type":"company","lineage":["https://openalex.org/I1283473643"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kazuhiro Nakadai","raw_affiliation_strings":["Honda Research Institute Japan, Saitama, Japan"],"affiliations":[{"raw_affiliation_string":"Honda Research Institute Japan, Saitama, Japan","institution_ids":["https://openalex.org/I1283473643"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5055922202","display_name":"Tetsuya Ogata","orcid":"https://orcid.org/0000-0001-7015-0379"},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tetsuya Ogata","raw_affiliation_strings":["Department of Intermedia Art and Science, Waseda University, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Intermedia Art and Science, Waseda University, Tokyo, Japan","institution_ids":["https://openalex.org/I150744194"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5112575316"],"corresponding_institution_ids":["https://openalex.org/I150744194"],"apc_list":null,"apc_paid":null,"fwci":4.9895,"has_fulltext":false,"cited_by_count":55,"citation_normalized_percentile":{"value":0.95838762,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.766571581363678},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.620612382888794},{"id":"https://openalex.org/keywords/dance","display_name":"Dance","score":0.5699914693832397},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5342273712158203},{"id":"https://openalex.org/keywords/motion-capture","display_name":"Motion capture","score":0.4905768930912018},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.49051350355148315},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4803948998451233},{"id":"https://openalex.org/keywords/beat","display_name":"Beat (acoustics)","score":0.4707534909248352},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.4441211521625519},{"id":"https://openalex.org/keywords/decodes","display_name":"Decodes","score":0.42428573966026306},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3899487257003784},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.351318895816803},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.30949532985687256},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.1064644455909729},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.104768306016922}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.766571581363678},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.620612382888794},{"id":"https://openalex.org/C147446459","wikidata":"https://www.wikidata.org/wiki/Q11639","display_name":"Dance","level":2,"score":0.5699914693832397},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5342273712158203},{"id":"https://openalex.org/C48007421","wikidata":"https://www.wikidata.org/wiki/Q676252","display_name":"Motion capture","level":3,"score":0.4905768930912018},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.49051350355148315},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4803948998451233},{"id":"https://openalex.org/C189809214","wikidata":"https://www.wikidata.org/wiki/Q829522","display_name":"Beat (acoustics)","level":2,"score":0.4707534909248352},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.4441211521625519},{"id":"https://openalex.org/C2778858076","wikidata":"https://www.wikidata.org/wiki/Q5249539","display_name":"Decodes","level":3,"score":0.42428573966026306},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3899487257003784},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.351318895816803},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.30949532985687256},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.1064644455909729},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.104768306016922},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn.2019.8851872","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn.2019.8851872","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":38,"referenced_works":["https://openalex.org/W75292264","https://openalex.org/W1483977290","https://openalex.org/W1522301498","https://openalex.org/W1600744878","https://openalex.org/W1836465849","https://openalex.org/W2003996974","https://openalex.org/W2054459540","https://openalex.org/W2068357230","https://openalex.org/W2100907900","https://openalex.org/W2112949182","https://openalex.org/W2130942839","https://openalex.org/W2140013053","https://openalex.org/W2157364932","https://openalex.org/W2185758820","https://openalex.org/W2354870669","https://openalex.org/W2402172128","https://openalex.org/W2405656250","https://openalex.org/W2737749690","https://openalex.org/W2897492344","https://openalex.org/W2903908313","https://openalex.org/W2963285578","https://openalex.org/W2963413667","https://openalex.org/W2963952344","https://openalex.org/W2964051853","https://openalex.org/W2964121744","https://openalex.org/W3103314642","https://openalex.org/W4294621855","https://openalex.org/W6603166286","https://openalex.org/W6631190155","https://openalex.org/W6638667902","https://openalex.org/W6679436768","https://openalex.org/W6680873201","https://openalex.org/W6685562342","https://openalex.org/W6686368241","https://openalex.org/W6741681139","https://openalex.org/W6741698137","https://openalex.org/W6756941398","https://openalex.org/W6894076085"],"related_works":["https://openalex.org/W597595235","https://openalex.org/W3200585538","https://openalex.org/W2357651146","https://openalex.org/W1574267311","https://openalex.org/W2501127304","https://openalex.org/W3209785493","https://openalex.org/W3120492113","https://openalex.org/W2299690913","https://openalex.org/W2762501427","https://openalex.org/W2039848376"],"abstract_inverted_index":{"Synthesizing":[0],"human's":[1],"movements":[2],"such":[3],"as":[4,114],"dancing":[5],"is":[6,55],"a":[7,51,88,99,123,166,215,243,265],"flourishing":[8],"research":[9],"field":[10],"which":[11],"has":[12,148],"several":[13],"applications":[14],"in":[15,33],"computer":[16],"graphics.":[17],"Recent":[18],"studies":[19],"have":[20],"demonstrated":[21],"the":[22,69,73,78,82,131,140,172,175,188,192,199,205,210,228,246],"advantages":[23],"of":[24,53,59,91,157,160,194,264],"deep":[25,102,136],"neural":[26],"networks":[27],"(DNNs)":[28],"for":[29,41,47,105,219],"achieving":[30],"remarkable":[31],"performance":[32],"motion":[34,79,178,189,213,231],"and":[35,84,122,177,180,209,223,230,256],"music":[36,54,70,176,229],"tasks":[37],"with":[38,110,183,214,233,252],"little":[39],"effort":[40],"feature":[42],"pre-processing.":[43],"However,":[44],"applying":[45],"DNNs":[46,61,86],"generating":[48],"dance":[49,108,142,162,221,250],"to":[50,63,76,81,129,170,262],"piece":[52],"nevertheless":[56],"challenging,":[57],"because":[58],"1)":[60,149],"need":[62],"generate":[64],"large":[65,161,220],"sequences":[66],"while":[67],"mapping":[68,173],"input,":[71],"2)":[72,164],"DNN":[74],"needs":[75],"constraint":[77],"beat":[80,232],"music,":[83],"3)":[85,181],"require":[87],"considerable":[89],"amount":[90,193],"hand-crafted":[92,195],"data.":[93,196],"In":[94],"this":[95,145],"study,":[96],"we":[97],"propose":[98],"weakly":[100],"supervised":[101],"recurrent":[103],"method":[104],"real-time":[106],"basic":[107,249],"generation":[109],"audio":[111,132],"power":[112],"spectrum":[113],"input.":[115,133],"The":[116],"proposed":[117,200],"model":[118,247],"employs":[119],"convolutional":[120],"layers":[121],"multilayered":[124],"Long":[125],"Short-Term":[126],"memory":[127],"(LSTM)":[128],"process":[130],"Then,":[134],"another":[135],"LSTM":[137],"layer":[138],"decodes":[139],"target":[141],"sequence.":[143],"Notably,":[144],"end-to-end":[146],"approach":[147],"an":[150,234,258],"auto-conditioned":[151],"decode":[152],"configuration":[153],"that":[154,263],"reduces":[155],"accumulation":[156],"feedback":[158],"error":[159],"sequence,":[163],"uses":[165],"contrastive":[167],"cost":[168],"function":[169],"regulate":[171],"between":[174,207,227],"beat,":[179,190],"trains":[182],"weak":[184],"labels":[185],"generated":[186,208],"from":[187],"reducing":[191],"We":[197],"evaluate":[198],"network":[201],"based":[202],"on":[203],"i)":[204],"similarities":[206],"baseline":[211,266],"dancer":[212],"cross":[216,254],"entropy":[217,255],"measure":[218],"sequences,":[222],"ii)":[224],"accurate":[225],"timing":[226],"F-measure.":[235],"Experimental":[236],"results":[237],"revealed":[238],"that,":[239],"after":[240],"training":[241],"using":[242],"small":[244],"dataset,":[245],"generates":[248],"steps":[251],"low":[253],"maintains":[257],"F-measure":[259],"score":[260],"similar":[261],"dancer.":[267]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":10},{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":7},{"year":2021,"cited_by_count":11},{"year":2020,"cited_by_count":11},{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
