{"id":"https://openalex.org/W7131388063","doi":"https://doi.org/10.1109/access.2026.3667939","title":"Mu-Mixer: A Hierarchical MLP-Based Framework for Cover Song Identification","display_name":"Mu-Mixer: A Hierarchical MLP-Based Framework for Cover Song Identification","publication_year":2026,"publication_date":"2026-01-01","ids":{"openalex":"https://openalex.org/W7131388063","doi":"https://doi.org/10.1109/access.2026.3667939"},"language":"en","primary_location":{"id":"doi:10.1109/access.2026.3667939","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3667939","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1109/access.2026.3667939","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5046942516","display_name":"Jungwoo Heo","orcid":"https://orcid.org/0009-0008-7977-2789"},"institutions":[{"id":"https://openalex.org/I124633538","display_name":"University of Seoul","ror":"https://ror.org/05en5nh73","country_code":"KR","type":"education","lineage":["https://openalex.org/I124633538"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jungwoo Heo","raw_affiliation_strings":["University of Seoul, Seoul, Republic of Korea"],"raw_orcid":"https://orcid.org/0009-0008-7977-2789","affiliations":[{"raw_affiliation_string":"University of Seoul, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I124633538"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006973604","display_name":"Hyun-seo Shin","orcid":"https://orcid.org/0009-0005-6022-7674"},"institutions":[{"id":"https://openalex.org/I124633538","display_name":"University of Seoul","ror":"https://ror.org/05en5nh73","country_code":"KR","type":"education","lineage":["https://openalex.org/I124633538"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hyun-Seo Shin","raw_affiliation_strings":["University of Seoul, Seoul, Republic of Korea"],"raw_orcid":"https://orcid.org/0009-0005-6022-7674","affiliations":[{"raw_affiliation_string":"University of Seoul, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I124633538"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036516187","display_name":"Chan-yeong Lim","orcid":"https://orcid.org/0009-0001-6671-5004"},"institutions":[{"id":"https://openalex.org/I124633538","display_name":"University of Seoul","ror":"https://ror.org/05en5nh73","country_code":"KR","type":"education","lineage":["https://openalex.org/I124633538"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Chan-Yeong Lim","raw_affiliation_strings":["University of Seoul, Seoul, Republic of Korea"],"raw_orcid":"https://orcid.org/0009-0001-6671-5004","affiliations":[{"raw_affiliation_string":"University of Seoul, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I124633538"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113361555","display_name":"Kyo-Won Koo","orcid":null},"institutions":[{"id":"https://openalex.org/I124633538","display_name":"University of Seoul","ror":"https://ror.org/05en5nh73","country_code":"KR","type":"education","lineage":["https://openalex.org/I124633538"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Kyo-Won Koo","raw_affiliation_strings":["University of Seoul, Seoul, Republic of Korea"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Seoul, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I124633538"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028147662","display_name":"Seung-bin Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I124633538","display_name":"University of Seoul","ror":"https://ror.org/05en5nh73","country_code":"KR","type":"education","lineage":["https://openalex.org/I124633538"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seung-Bin Kim","raw_affiliation_strings":["University of Seoul, Seoul, Republic of Korea"],"raw_orcid":"https://orcid.org/0009-0004-7036-072X","affiliations":[{"raw_affiliation_string":"University of Seoul, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I124633538"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042447743","display_name":"Jisoo Son","orcid":null},"institutions":[{"id":"https://openalex.org/I124633538","display_name":"University of Seoul","ror":"https://ror.org/05en5nh73","country_code":"KR","type":"education","lineage":["https://openalex.org/I124633538"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jisoo Son","raw_affiliation_strings":["University of Seoul, Seoul, Republic of Korea"],"raw_orcid":"https://orcid.org/0009-0007-2245-5945","affiliations":[{"raw_affiliation_string":"University of Seoul, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I124633538"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030475312","display_name":"Ha-Jin Yu","orcid":"https://orcid.org/0000-0003-3657-0665"},"institutions":[{"id":"https://openalex.org/I124633538","display_name":"University of Seoul","ror":"https://ror.org/05en5nh73","country_code":"KR","type":"education","lineage":["https://openalex.org/I124633538"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Ha-Jin Yu","raw_affiliation_strings":["University of Seoul, Seoul, Republic of Korea"],"raw_orcid":"https://orcid.org/0000-0003-3657-0665","affiliations":[{"raw_affiliation_string":"University of Seoul, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I124633538"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I124633538"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21768787,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"14","issue":null,"first_page":"35485","last_page":"35494"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.8098000288009644,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.8098000288009644,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.07370000332593918,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.014299999922513962,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4957999885082245},{"id":"https://openalex.org/keywords/block","display_name":"Block (permutation group theory)","score":0.4893999993801117},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.4796999990940094},{"id":"https://openalex.org/keywords/receptive-field","display_name":"Receptive field","score":0.45840001106262207},{"id":"https://openalex.org/keywords/music-information-retrieval","display_name":"Music information retrieval","score":0.4458000063896179},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41510000824928284},{"id":"https://openalex.org/keywords/cover","display_name":"Cover (algebra)","score":0.4047999978065491},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.38499999046325684},{"id":"https://openalex.org/keywords/contrast","display_name":"Contrast (vision)","score":0.3700999915599823}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7734000086784363},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4957999885082245},{"id":"https://openalex.org/C2777210771","wikidata":"https://www.wikidata.org/wiki/Q4927124","display_name":"Block (permutation group theory)","level":2,"score":0.4893999993801117},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4796999990940094},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46959999203681946},{"id":"https://openalex.org/C19071747","wikidata":"https://www.wikidata.org/wiki/Q1755207","display_name":"Receptive field","level":2,"score":0.45840001106262207},{"id":"https://openalex.org/C2777946086","wikidata":"https://www.wikidata.org/wiki/Q1163335","display_name":"Music information retrieval","level":3,"score":0.4458000063896179},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41510000824928284},{"id":"https://openalex.org/C2780428219","wikidata":"https://www.wikidata.org/wiki/Q16952335","display_name":"Cover (algebra)","level":2,"score":0.4047999978065491},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.38499999046325684},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.3700999915599823},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.365200012922287},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.362199991941452},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3614000082015991},{"id":"https://openalex.org/C135343436","wikidata":"https://www.wikidata.org/wiki/Q170406","display_name":"Rhythm","level":2,"score":0.35830000042915344},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.3564999997615814},{"id":"https://openalex.org/C144745244","wikidata":"https://www.wikidata.org/wiki/Q4927286","display_name":"Blocking (statistics)","level":2,"score":0.3434000015258789},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.32190001010894775},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.301800012588501},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.2964000105857849},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.26460000872612},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.263700008392334},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.26030001044273376},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.25459998846054077},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.2533000111579895}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2026.3667939","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3667939","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:c1edb4809fd3499983a55505865429e4","is_oa":true,"landing_page_url":"https://doaj.org/article/c1edb4809fd3499983a55505865429e4","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 14, Pp 35485-35494 (2026)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2026.3667939","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2026.3667939","pdf_url":null,"source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3268536186","display_name":null,"funder_award_id":"2023R1A2C1005744","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Cover":[0],"Song":[1],"Identification":[2],"(CSI)":[3],"is":[4,138],"a":[5,47,77,126,140],"fundamental":[6],"task":[7],"in":[8,147],"music":[9],"information":[10,70],"retrieval,":[11],"essential":[12],"for":[13,52,142],"copyright":[14],"protection":[15],"and":[16,24,36,132],"content":[17],"organization.":[18],"While":[19],"Convolutional":[20],"Neural":[21],"Networks":[22],"(CNNs)":[23],"Transformers":[25],"have":[26],"significantly":[27],"advanced":[28],"CSI,":[29],"they":[30],"suffer":[31],"from":[32],"limited":[33],"receptive":[34,57],"fields":[35,58],"quadratic":[37],"computational":[38,133],"complexity,":[39],"respectively.":[40],"In":[41,62],"this":[42],"paper,":[43],"we":[44],"propose":[45],"Mu-Mixer,":[46],"novel":[48],"all-MLP":[49],"architecture":[50],"tailored":[51],"CSI":[53],"that":[54,123,136],"achieves":[55,117],"global":[56],"with":[59],"linear":[60],"complexity.":[61],"contrast":[63],"to":[64,96],"image-based":[65],"MLP-Mixers,":[66],"which":[67],"indiscriminately":[68],"mix":[69],"across":[71],"the":[72,87,110],"temporal":[73],"axis,":[74],"Mu-Mixer":[75,108,124],"incorporates":[76],"Multi-scale":[78],"Temporal":[79],"Mixing":[80],"Block":[81],"(MTMB).":[82],"This":[83],"strategy":[84],"hierarchically":[85],"segments":[86],"time":[88],"dimension":[89],"<italic":[90],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[91],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">T</i>":[92],"into":[93],"multiple":[94],"scales":[95],"preserve":[97],"local":[98],"rhythmic":[99],"motifs":[100],"while":[101],"capturing":[102],"long-range":[103,144],"structural":[104],"dependencies.":[105],"We":[106],"evaluate":[107],"on":[109],"AI-Hub":[111],"Music":[112],"Similarity":[113],"dataset,":[114],"where":[115],"it":[116],"state-of-the-art":[118],"performance.":[119],"Our":[120],"results":[121],"demonstrate":[122],"provides":[125],"superior":[127],"balance":[128],"between":[129],"identification":[130],"accuracy":[131],"efficiency,":[134],"proving":[135],"self-attention":[137],"not":[139],"prerequisite":[141],"modeling":[143],"acoustic":[145],"dependencies":[146],"musical":[148],"signals.":[149]},"counts_by_year":[],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2026-02-26T00:00:00"}
