{"id":"https://openalex.org/W2993489713","doi":"https://doi.org/10.1109/mlsp.2019.8918813","title":"Multi-Step Chord Sequence Prediction Based On Aggregated Multi-Scale Encoder-Decoder Networks","display_name":"Multi-Step Chord Sequence Prediction Based On Aggregated Multi-Scale Encoder-Decoder Networks","publication_year":2019,"publication_date":"2019-10-01","ids":{"openalex":"https://openalex.org/W2993489713","doi":"https://doi.org/10.1109/mlsp.2019.8918813","mag":"2993489713"},"language":"en","primary_location":{"id":"doi:10.1109/mlsp.2019.8918813","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mlsp.2019.8918813","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE 29th International Workshop on Machine Learning for Signal Processing (MLSP)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hal.science/hal-02364054","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5026032571","display_name":"Tristan Carsault","orcid":null},"institutions":[{"id":"https://openalex.org/I39804081","display_name":"Sorbonne Universit\u00e9","ror":"https://ror.org/02en5vm52","country_code":"FR","type":"education","lineage":["https://openalex.org/I39804081"]},{"id":"https://openalex.org/I4389425508","display_name":"Sciences et Technologies de la Musique et du Son","ror":"https://ror.org/025xvn046","country_code":null,"type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I2802818602","https://openalex.org/I35345632","https://openalex.org/I39804081","https://openalex.org/I4210102700","https://openalex.org/I4389425508"]},{"id":"https://openalex.org/I35345632","display_name":"Institut de Recherche et Coordination Acoustique Musique","ror":"https://ror.org/0121jnt59","country_code":"FR","type":"education","lineage":["https://openalex.org/I35345632"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1294671590"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Tristan Carsault","raw_affiliation_strings":["IRCAM, CNRS, Sorbonne Universit\u00e9, UMR 9912 STMS, Paris, France"],"affiliations":[{"raw_affiliation_string":"IRCAM, CNRS, Sorbonne Universit\u00e9, UMR 9912 STMS, Paris, France","institution_ids":["https://openalex.org/I35345632","https://openalex.org/I39804081","https://openalex.org/I4389425508","https://openalex.org/I1294671590"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002469859","display_name":"Andrew McLeod","orcid":"https://orcid.org/0000-0003-2700-2076"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Andrew McLeod","raw_affiliation_strings":["Graduate School of Informatics, Kyoto University, Sakyo-ku, Kyoto, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Kyoto University, Sakyo-ku, Kyoto, Japan","institution_ids":["https://openalex.org/I22299242"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085170922","display_name":"Philippe Esling","orcid":"https://orcid.org/0000-0002-1655-7909"},"institutions":[{"id":"https://openalex.org/I4389425508","display_name":"Sciences et Technologies de la Musique et du Son","ror":"https://ror.org/025xvn046","country_code":null,"type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I2802818602","https://openalex.org/I35345632","https://openalex.org/I39804081","https://openalex.org/I4210102700","https://openalex.org/I4389425508"]},{"id":"https://openalex.org/I35345632","display_name":"Institut de Recherche et Coordination Acoustique Musique","ror":"https://ror.org/0121jnt59","country_code":"FR","type":"education","lineage":["https://openalex.org/I35345632"]},{"id":"https://openalex.org/I39804081","display_name":"Sorbonne Universit\u00e9","ror":"https://ror.org/02en5vm52","country_code":"FR","type":"education","lineage":["https://openalex.org/I39804081"]},{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1294671590"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Philippe Esling","raw_affiliation_strings":["IRCAM, CNRS, Sorbonne Universit\u00e9, UMR 9912 STMS, Paris, France"],"affiliations":[{"raw_affiliation_string":"IRCAM, CNRS, Sorbonne Universit\u00e9, UMR 9912 STMS, Paris, France","institution_ids":["https://openalex.org/I35345632","https://openalex.org/I39804081","https://openalex.org/I4389425508","https://openalex.org/I1294671590"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036166568","display_name":"J\u00e9r\u00f4me Nika","orcid":"https://orcid.org/0000-0002-7946-1648"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"funder","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I35345632","display_name":"Institut de Recherche et Coordination Acoustique Musique","ror":"https://ror.org/0121jnt59","country_code":"FR","type":"education","lineage":["https://openalex.org/I35345632"]},{"id":"https://openalex.org/I39804081","display_name":"Sorbonne Universit\u00e9","ror":"https://ror.org/02en5vm52","country_code":"FR","type":"education","lineage":["https://openalex.org/I39804081"]},{"id":"https://openalex.org/I4389425508","display_name":"Sciences et Technologies de la Musique et du Son","ror":"https://ror.org/025xvn046","country_code":null,"type":"facility","lineage":["https://openalex.org/I1294671590","https://openalex.org/I2802818602","https://openalex.org/I35345632","https://openalex.org/I39804081","https://openalex.org/I4210102700","https://openalex.org/I4389425508"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Jerome Nika","raw_affiliation_strings":["IRCAM, CNRS, Sorbonne Universit\u00e9, UMR 9912 STMS, Paris, France"],"affiliations":[{"raw_affiliation_string":"IRCAM, CNRS, Sorbonne Universit\u00e9, UMR 9912 STMS, Paris, France","institution_ids":["https://openalex.org/I35345632","https://openalex.org/I39804081","https://openalex.org/I4389425508","https://openalex.org/I1294671590"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043140898","display_name":"Eita Nakamura","orcid":"https://orcid.org/0000-0003-4097-6027"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Eita Nakamura","raw_affiliation_strings":["Graduate School of Informatics, Kyoto University, Sakyo-ku, Kyoto, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Kyoto University, Sakyo-ku, Kyoto, Japan","institution_ids":["https://openalex.org/I22299242"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5067956319","display_name":"Kazuyoshi Yoshii","orcid":"https://orcid.org/0000-0001-8387-8609"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Kazuyoshi Yoshii","raw_affiliation_strings":["Graduate School of Informatics, Kyoto University, Sakyo-ku, Kyoto, Japan"],"affiliations":[{"raw_affiliation_string":"Graduate School of Informatics, Kyoto University, Sakyo-ku, Kyoto, Japan","institution_ids":["https://openalex.org/I22299242"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5026032571"],"corresponding_institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I35345632","https://openalex.org/I39804081","https://openalex.org/I4389425508"],"apc_list":null,"apc_paid":null,"fwci":0.167,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.47586585,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"2","issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.9937999844551086,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8145153522491455},{"id":"https://openalex.org/keywords/chord","display_name":"Chord (peer-to-peer)","score":0.7363374829292297},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.682545006275177},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.49635177850723267},{"id":"https://openalex.org/keywords/ground-truth","display_name":"Ground truth","score":0.48146072030067444},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.47554799914360046},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.43491053581237793},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.42045876383781433},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.35723593831062317}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8145153522491455},{"id":"https://openalex.org/C194147245","wikidata":"https://www.wikidata.org/wiki/Q1076368","display_name":"Chord (peer-to-peer)","level":2,"score":0.7363374829292297},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.682545006275177},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49635177850723267},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.48146072030067444},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.47554799914360046},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.43491053581237793},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.42045876383781433},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.35723593831062317},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/mlsp.2019.8918813","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mlsp.2019.8918813","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE 29th International Workshop on Machine Learning for Signal Processing (MLSP)","raw_type":"proceedings-article"},{"id":"pmh:oai:HAL:hal-02364054v1","is_oa":true,"landing_page_url":"https://hal.science/hal-02364054","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"MLSP 2019, Oct 2019, Pittsburgh, United States","raw_type":"Conference papers"}],"best_oa_location":{"id":"pmh:oai:HAL:hal-02364054v1","is_oa":true,"landing_page_url":"https://hal.science/hal-02364054","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"MLSP 2019, Oct 2019, Pittsburgh, United States","raw_type":"Conference papers"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7699999809265137}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W1599300385","https://openalex.org/W1989916294","https://openalex.org/W2016589492","https://openalex.org/W2130942839","https://openalex.org/W2137414850","https://openalex.org/W2137619888","https://openalex.org/W2141440284","https://openalex.org/W2152756914","https://openalex.org/W2172140247","https://openalex.org/W2183774388","https://openalex.org/W2338312508","https://openalex.org/W2395935897","https://openalex.org/W2513234653","https://openalex.org/W2552400013","https://openalex.org/W2556490290","https://openalex.org/W2575129390","https://openalex.org/W2745229848","https://openalex.org/W2771265026","https://openalex.org/W2781042349","https://openalex.org/W2886597424","https://openalex.org/W2902983770","https://openalex.org/W2949408457","https://openalex.org/W2964199361","https://openalex.org/W3099271704","https://openalex.org/W3159324329","https://openalex.org/W4285719527","https://openalex.org/W4294568831","https://openalex.org/W6679436768","https://openalex.org/W6680768788","https://openalex.org/W6682743674","https://openalex.org/W6686295308","https://openalex.org/W6703879901","https://openalex.org/W6726267598","https://openalex.org/W6746411809","https://openalex.org/W6753775506","https://openalex.org/W6756673966"],"related_works":["https://openalex.org/W1657880117","https://openalex.org/W2595172197","https://openalex.org/W2127970246","https://openalex.org/W2084856301","https://openalex.org/W1001352512","https://openalex.org/W4382618745","https://openalex.org/W2885125400","https://openalex.org/W1989889224","https://openalex.org/W2748922771","https://openalex.org/W1987128138"],"abstract_inverted_index":{"This":[0],"paper":[1],"studies":[2],"the":[3,24,62,82,137,178,181,187],"prediction":[4,42],"of":[5,19,27,65,78,101,136,164,177,183],"chord":[6,51,139,144],"progressions":[7],"for":[8,30,104],"jazz":[9],"music":[10,33],"by":[11],"relying":[12],"on":[13,73,95,133,190],"machine":[14],"learning":[15],"models.":[16],"The":[17],"motivation":[18],"our":[20,156],"study":[21],"comes":[22,60],"from":[23,61],"recent":[25],"success":[26],"neural":[28],"networks":[29,103],"performing":[31],"automatic":[32],"composition.":[34],"Although":[35],"high":[36],"accuracies":[37],"are":[38,88],"obtained":[39],"in":[40,122,162],"single-step":[41],"scenarios,":[43],"most":[44],"models":[45,152],"fail":[46],"to":[47,124],"generate":[48],"accurate":[49],"multistep":[50],"predictions.":[52],"In":[53,108],"this":[54,59],"paper,":[55],"we":[56,97,112,131],"postulate":[57],"that":[58,155],"multi-scale":[63,157],"structure":[64],"musical":[66,175],"information":[67],"and":[68,84,153,166,192],"propose":[69],"new":[70],"architectures":[71],"based":[72],"an":[74],"iterative":[75],"temporal":[76,93,106],"aggregation":[77],"input":[79,83],"labels.":[80],"Specifically,":[81],"ground":[85],"truth":[86],"labels":[87],"merged":[89],"into":[90,141],"increasingly":[91],"large":[92],"bags,":[94],"which":[96],"train":[98,125],"a":[99,109,126,196],"family":[100],"encoder-decoder":[102,128],"each":[105,120],"scale.":[107],"second":[110],"step,":[111],"use":[113],"these":[114],"pretrained":[115],"encoder":[116],"bottleneck":[117],"features":[118],"at":[119],"scale":[121],"order":[123],"final":[127],"network.":[129],"Furthermore,":[130],"rely":[132],"different":[134],"reductions":[135],"initial":[138],"alphabet":[140],"three":[142],"adapted":[143],"alphabets.":[145],"We":[146,173],"perform":[147],"evaluations":[148],"against":[149],"several":[150],"state-of-the-art":[151],"show":[154],"architecture":[158],"outperforms":[159],"existing":[160],"methods":[161],"terms":[163],"accuracy":[165],"perplexity,":[167],"while":[168],"requiring":[169],"relatively":[170],"few":[171],"parameters.":[172],"analyze":[174],"properties":[176],"results,":[179],"showing":[180],"influence":[182],"downbeat":[184],"position":[185],"within":[186],"analysis":[188],"window":[189],"accuracy,":[191],"evaluate":[193],"errors":[194],"using":[195],"musically-informed":[197],"distance":[198],"metric.":[199]},"counts_by_year":[{"year":2021,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
