{"id":"https://openalex.org/W2914050240","doi":"https://doi.org/10.23919/mva.2019.8757943","title":"Visual Rhythm Prediction with Feature-Aligning Network","display_name":"Visual Rhythm Prediction with Feature-Aligning Network","publication_year":2019,"publication_date":"2019-05-01","ids":{"openalex":"https://openalex.org/W2914050240","doi":"https://doi.org/10.23919/mva.2019.8757943","mag":"2914050240"},"language":"en","primary_location":{"id":"doi:10.23919/mva.2019.8757943","is_oa":false,"landing_page_url":"https://doi.org/10.23919/mva.2019.8757943","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 16th International Conference on Machine Vision Applications (MVA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011835422","display_name":"Yutong Xie","orcid":"https://orcid.org/0000-0002-6644-1250"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yutong Xie","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100438290","display_name":"Haiyang Wang","orcid":"https://orcid.org/0009-0004-4283-1950"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haiyang Wang","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100708037","display_name":"Hao Yan","orcid":"https://orcid.org/0000-0003-0796-8076"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yan Hao","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108050757","display_name":"Zihao Xu","orcid":"https://orcid.org/0000-0003-4753-2664"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zihao Xu","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5011835422"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.00957408,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7847773432731628},{"id":"https://openalex.org/keywords/timeline","display_name":"Timeline","score":0.7828654646873474},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6804090738296509},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5995272397994995},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.591765820980072},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5836488008499146},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.524231493473053},{"id":"https://openalex.org/keywords/rhythm","display_name":"Rhythm","score":0.5110834836959839},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.47483116388320923},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.45850425958633423},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.4527400732040405},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.43750712275505066},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.43162840604782104},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4140670597553253}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7847773432731628},{"id":"https://openalex.org/C4438859","wikidata":"https://www.wikidata.org/wiki/Q186117","display_name":"Timeline","level":2,"score":0.7828654646873474},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6804090738296509},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5995272397994995},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.591765820980072},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5836488008499146},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.524231493473053},{"id":"https://openalex.org/C135343436","wikidata":"https://www.wikidata.org/wiki/Q170406","display_name":"Rhythm","level":2,"score":0.5110834836959839},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.47483116388320923},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.45850425958633423},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.4527400732040405},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.43750712275505066},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.43162840604782104},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4140670597553253},{"id":"https://openalex.org/C107038049","wikidata":"https://www.wikidata.org/wiki/Q35986","display_name":"Aesthetics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.23919/mva.2019.8757943","is_oa":false,"landing_page_url":"https://doi.org/10.23919/mva.2019.8757943","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 16th International Conference on Machine Vision Applications (MVA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1565206031","https://openalex.org/W1992941345","https://openalex.org/W2042390666","https://openalex.org/W2054459540","https://openalex.org/W2076849475","https://openalex.org/W2079735306","https://openalex.org/W2139238328","https://openalex.org/W2194775991","https://openalex.org/W2293202270","https://openalex.org/W2497406591","https://openalex.org/W2808040094","https://openalex.org/W2811167645","https://openalex.org/W2962902328","https://openalex.org/W2963403868","https://openalex.org/W2963781481","https://openalex.org/W3113172960","https://openalex.org/W4385245566","https://openalex.org/W6669731727","https://openalex.org/W6687483927","https://openalex.org/W6697154816","https://openalex.org/W6697171384","https://openalex.org/W6730734845","https://openalex.org/W6739901393"],"related_works":["https://openalex.org/W1858249912","https://openalex.org/W2114034199","https://openalex.org/W2317428717","https://openalex.org/W2734259032","https://openalex.org/W4385261515","https://openalex.org/W3094038556","https://openalex.org/W4296345146","https://openalex.org/W2014772881","https://openalex.org/W4254228154","https://openalex.org/W3049477255"],"abstract_inverted_index":{"In":[0,26],"this":[1,77,91],"paper,":[2],"we":[3,29,61,150],"propose":[4],"a":[5,153],"data-driven":[6],"visual":[7,47],"rhythm":[8],"prediction":[9],"method,":[10],"which":[11,103],"overcomes":[12],"the":[13,72,81,93,137,141,166],"previous":[14],"works'":[15],"deficiency":[16],"that":[17,63,76],"predictions":[18],"are":[19,65,87,96,122],"made":[20],"primarily":[21],"by":[22,98,156],"human-crafted":[23],"hard":[24],"rules.":[25],"our":[27,170],"approach,":[28],"first":[30],"extract":[31],"features":[32,48,70,86,95,121],"including":[33],"original":[34],"frames":[35],"and":[36,43,74,115,132,147,165],"their":[37],"residuals,":[38],"optical":[39],"flow,":[40],"scene":[41],"change,":[42],"body":[44],"pose.":[45],"These":[46],"will":[49],"be":[50,106],"next":[51],"taken":[52],"into":[53,124],"an":[54,99],"end-to-end":[55],"neural":[56],"network":[57],"as":[58],"inputs.":[59],"Here":[60],"observe":[62],"there":[64],"some":[66],"slight":[67],"misaligning":[68],"between":[69,83],"over":[71],"timeline":[73],"assume":[75],"is":[78],"due":[79],"to":[80,108,135,140],"distinctions":[82],"how":[84],"different":[85],"computed.":[88],"To":[89],"solve":[90],"problem,":[92],"extracted":[94],"aligned":[97,120],"elaborately":[100],"designed":[101],"layer,":[102],"can":[104],"also":[105],"applied":[107],"other":[109],"models":[110],"suffering":[111],"from":[112],"mismatched":[113],"features,":[114],"boost":[116],"performance.":[117],"Then":[118],"these":[119],"fed":[123],"sequence":[125],"labeling":[126],"layers":[127],"implemented":[128],"with":[129],"BiLSTM":[130],"[9]":[131],"CRF":[133],"[10]":[134],"predict":[136],"onsets.":[138],"Due":[139],"lack":[142],"of":[143,169],"existing":[144],"public":[145],"training":[146],"evaluation":[148],"set,":[149],"experiment":[151],"on":[152,159],"dataset":[154],"constructed":[155],"ourselves":[157],"based":[158],"professionally":[160],"edited":[161],"Music":[162],"Videos":[163],"(MVs),":[164],"F1":[167],"score":[168],"approach":[171],"reaches":[172],"79.6.":[173]},"counts_by_year":[{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
