{"id":"https://openalex.org/W4387421802","doi":"https://doi.org/10.1145/3577190.3614175","title":"Frame-Level Event Representation Learning for Semantic-Level Generation and Editing of Avatar Motion","display_name":"Frame-Level Event Representation Learning for Semantic-Level Generation and Editing of Avatar Motion","publication_year":2023,"publication_date":"2023-10-07","ids":{"openalex":"https://openalex.org/W4387421802","doi":"https://doi.org/10.1145/3577190.3614175"},"language":"en","primary_location":{"id":"doi:10.1145/3577190.3614175","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1145/3577190.3614175","pdf_url":null,"source":{"id":"https://openalex.org/S4363608440","display_name":"INTERNATIONAL CONFERENCE ON MULTIMODAL INTERACTION","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"INTERNATIONAL CONFERENCE ON MULTIMODAL INTERACTION","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"http://dx.doi.org/10.1145/3577190.3614175","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088959789","display_name":"Ayaka Ideno","orcid":"https://orcid.org/0009-0000-0973-9993"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Ayaka Ideno","raw_affiliation_strings":["The University of Tokyo, Japan"],"raw_orcid":"https://orcid.org/0009-0000-0973-9993","affiliations":[{"raw_affiliation_string":"The University of Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020693766","display_name":"Takuhiro Kaneko","orcid":"https://orcid.org/0009-0000-8016-5144"},"institutions":[{"id":"https://openalex.org/I2251713219","display_name":"NTT (Japan)","ror":"https://ror.org/00berct97","country_code":"JP","type":"company","lineage":["https://openalex.org/I2251713219"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Takuhiro Kaneko","raw_affiliation_strings":["NTT Corporation, Japan"],"raw_orcid":"https://orcid.org/0009-0000-8016-5144","affiliations":[{"raw_affiliation_string":"NTT Corporation, Japan","institution_ids":["https://openalex.org/I2251713219"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042711470","display_name":"Tatsuya Harada","orcid":"https://orcid.org/0000-0002-3712-3691"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tatsuya Harada","raw_affiliation_strings":["The University of Tokyo, Japan and RIKEN, Japan"],"raw_orcid":"https://orcid.org/0000-0002-3712-3691","affiliations":[{"raw_affiliation_string":"The University of Tokyo, Japan and RIKEN, Japan","institution_ids":["https://openalex.org/I74801974"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5088959789"],"corresponding_institution_ids":["https://openalex.org/I74801974"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.25974026,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"903","issue":null,"first_page":"292","last_page":"300"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12290","display_name":"Human Motion and Animation","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7897416353225708},{"id":"https://openalex.org/keywords/avatar","display_name":"Avatar","score":0.7158094644546509},{"id":"https://openalex.org/keywords/frame","display_name":"Frame (networking)","score":0.6145460605621338},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5247802138328552},{"id":"https://openalex.org/keywords/event","display_name":"Event (particle physics)","score":0.4878706932067871},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46524178981781006},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.4561637043952942},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.39194607734680176},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.35967355966567993}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7897416353225708},{"id":"https://openalex.org/C2777365542","wikidata":"https://www.wikidata.org/wiki/Q83090","display_name":"Avatar","level":2,"score":0.7158094644546509},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.6145460605621338},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5247802138328552},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.4878706932067871},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46524178981781006},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.4561637043952942},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.39194607734680176},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.35967355966567993},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3577190.3614175","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1145/3577190.3614175","pdf_url":null,"source":{"id":"https://openalex.org/S4363608440","display_name":"INTERNATIONAL CONFERENCE ON MULTIMODAL INTERACTION","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"INTERNATIONAL CONFERENCE ON MULTIMODAL INTERACTION","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3577190.3614175","is_oa":true,"landing_page_url":"http://dx.doi.org/10.1145/3577190.3614175","pdf_url":null,"source":{"id":"https://openalex.org/S4363608440","display_name":"INTERNATIONAL CONFERENCE ON MULTIMODAL INTERACTION","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"INTERNATIONAL CONFERENCE ON MULTIMODAL INTERACTION","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W120317145","https://openalex.org/W2005958977","https://openalex.org/W2064675550","https://openalex.org/W2248685949","https://openalex.org/W2250539671","https://openalex.org/W2469134594","https://openalex.org/W2543074387","https://openalex.org/W2614519765","https://openalex.org/W2862846329","https://openalex.org/W2913668833","https://openalex.org/W2964076328","https://openalex.org/W3045038252","https://openalex.org/W3144253442","https://openalex.org/W4297981470","https://openalex.org/W4297989763","https://openalex.org/W4312429630","https://openalex.org/W4312635677","https://openalex.org/W4312936899"],"related_works":["https://openalex.org/W3138471234","https://openalex.org/W4247958311","https://openalex.org/W4396832849","https://openalex.org/W2785089443","https://openalex.org/W2265117524","https://openalex.org/W1467576422","https://openalex.org/W4220730560","https://openalex.org/W4224273434","https://openalex.org/W3183783168","https://openalex.org/W170056888"],"abstract_inverted_index":{"Understanding":[0],"an":[1,75],"avatar\u2019s":[2,24,64,72,176],"motion":[3,25,73,85,102,105,128,149,159,162,177,198,208,222,245,251],"and":[4,13,21,33,93,99,103,123,150,152,160,238,266],"controlling":[5],"its":[6],"content":[7,11,126],"is":[8,55,113,210],"important":[9,56],"for":[10],"creation":[12],"has":[14],"been":[15],"actively":[16],"studied":[17],"in":[18,83,158,221],"computer":[19],"vision":[20],"graphics.":[22],"An":[23],"consists":[26],"of":[27,36,52,62,71,95,127,148,257,262,269],"frames":[28,37,92],"representing":[29],"poses":[30],"each":[31,207],"time,":[32],"a":[34,42,68,169],"subsequence":[35],"can":[38,196,218,243],"be":[39,87],"grouped":[40],"into":[41],"segment":[43],"based":[44,108,129],"on":[45,109,130,234],"semantic":[46,60,69],"meaning.":[47],"To":[48,135],"enable":[49],"semantic-level":[50],"control":[51,124],"motion,":[53],"it":[54,112,154],"to":[57,118,155],"understand":[58],"the":[59,63,81,84,90,96,120,125,131,146,164,175,179,187,190,200,204,213,225,235,247,255,258,263,267],"division":[61,70],"motion.":[65],"We":[66,230],"define":[67],"as":[74],"\u201cevent\u201d,":[76],"which":[77],"switches":[78],"only":[79],"when":[80],"frame":[82,209],"cannot":[86],"predicted":[88],"from":[89,106,145,163,178,189,199,246],"previous":[91],"information":[94],"last":[97],"event,":[98],"tackled":[100],"editing":[101,224,250],"inferring":[104,186],"text":[107,151,248],"events.":[110],"However,":[111],"challenging":[114],"because":[115],"we":[116,139,167,195,217],"need":[117],"obtain":[119],"event":[121,133,143,171,182,205,215,227,259,264],"information,":[122],"obtained":[132],"information.":[134],"overcome":[136],"this":[137],"challenge,":[138],"propose":[140],"obtaining":[141],"frame-level":[142,170,181],"representation":[144,172,183,228],"pair":[147],"using":[153],"edit":[156,219],"events":[157,220],"predict":[161,197],"text.":[165,191,201],"Specifically,":[166],"learn":[168],"by":[173,223],"reconstructing":[174],"corresponding":[180,214,226],"sequence":[184,188],"while":[185,249],"By":[192],"doing":[193],"so,":[194],"Also,":[202],"since":[203],"at":[206],"represented":[211],"with":[212],"representation,":[216],"sequence.":[229],"evaluated":[231],"our":[232,241],"method":[233],"HumanML3D":[236],"dataset":[237],"demonstrated":[239],"that":[240],"model":[242],"generate":[244],"flexibly":[252],"(e.g.,":[253],"allowing":[254],"change":[256],"duration,":[260],"modification":[261],"characteristics,":[265],"addition":[268],"new":[270],"events).":[271]},"counts_by_year":[],"updated_date":"2025-12-22T23:10:17.713674","created_date":"2025-10-10T00:00:00"}
