{"id":"https://openalex.org/W7108754076","doi":"https://doi.org/10.5281/zenodo.17811370","title":"Universal Music Representations? Evaluating Foundation Models on World Music Corpora","display_name":"Universal Music Representations? Evaluating Foundation Models on World Music Corpora","publication_year":2025,"publication_date":"2025-09-21","ids":{"openalex":"https://openalex.org/W7108754076","doi":"https://doi.org/10.5281/zenodo.17811370"},"language":null,"primary_location":{"id":"doi:10.5281/zenodo.17811370","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.17811370","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":""},"type":"article","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.5281/zenodo.17811370","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Charilaos Papaioannou","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Charilaos Papaioannou","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Emmanouil Benetos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Emmanouil Benetos","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Alexandros Potamianos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alexandros Potamianos","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.62884132,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9909999966621399,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.0006000000284984708,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10788","display_name":"Neuroscience and Music Perception","score":0.0005000000237487257,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.8158000111579895},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.6728000044822693},{"id":"https://openalex.org/keywords/music-information-retrieval","display_name":"Music information retrieval","score":0.5788999795913696},{"id":"https://openalex.org/keywords/musical","display_name":"Musical","score":0.5573999881744385},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.44519999623298645}],"concepts":[{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.8158000111579895},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.6728000044822693},{"id":"https://openalex.org/C2777946086","wikidata":"https://www.wikidata.org/wiki/Q1163335","display_name":"Music information retrieval","level":3,"score":0.5788999795913696},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5709999799728394},{"id":"https://openalex.org/C558565934","wikidata":"https://www.wikidata.org/wiki/Q2743","display_name":"Musical","level":2,"score":0.5573999881744385},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4472000002861023},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.44519999623298645},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.382099986076355},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.29019999504089355},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.28060001134872437},{"id":"https://openalex.org/C542929976","wikidata":"https://www.wikidata.org/wiki/Q9730","display_name":"Classical music","level":3,"score":0.2768000066280365},{"id":"https://openalex.org/C163175372","wikidata":"https://www.wikidata.org/wiki/Q3339222","display_name":"Linear model","level":2,"score":0.2599000036716461}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.5281/zenodo.17811370","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.17811370","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":""}],"best_oa_location":{"id":"doi:10.5281/zenodo.17811370","is_oa":true,"landing_page_url":"https://doi.org/10.5281/zenodo.17811370","pdf_url":null,"source":{"id":"https://openalex.org/S4306400562","display_name":"Zenodo (CERN European Organization for Nuclear Research)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I67311998","host_organization_name":"European Organization for Nuclear Research","host_organization_lineage":["https://openalex.org/I67311998"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":""},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Foundation":[0],"models":[1,30,82,113,137,155],"have":[2],"revolutionized":[3],"music":[4,116,160],"information":[5],"retrieval,":[6],"but":[7],"questions":[8],"remain":[9],"about":[10],"their":[11],"ability":[12],"to":[13,49,57,150],"generalize":[14],"across":[15,31,132],"diverse":[16],"musical":[17,33,141],"traditions.":[18,43,94],"This":[19],"paper":[20],"presents":[21],"a":[22],"comprehensive":[23],"evaluation":[24,144],"of":[25,64,104,111],"five":[26,102],"state-of-the-art":[27,99],"audio":[28],"foundation":[29,112,136],"six":[32,105],"corpora":[34],"spanning":[35],"Western":[36],"popular,":[37],"Greek,":[38],"Turkish,":[39],"and":[40,67,146],"Indian":[41],"classical":[42],"We":[44,118],"employ":[45],"three":[46],"complementary":[47],"methodologies":[48],"investigate":[50],"these":[51],"models'":[52],"cross-cultural":[53,78],"capabilities:":[54],"linear":[55,130],"probing":[56,131],"assess":[58],"inherent":[59],"representations,":[60],"targeted":[61,123],"supervised":[62],"fine-tuning":[63,124],"1-2":[65],"layers,":[66],"multi-label":[68],"few-shot":[69],"learning":[70],"for":[71,91,114,165],"low-resource":[72],"scenarios.":[73],"Our":[74,143],"analysis":[75],"shows":[76],"varying":[77],"generalization,":[79],"with":[80],"larger":[81],"typically":[83],"outperforming":[84],"on":[85,101],"non-Western":[86],"music,":[87],"though":[88],"results":[89,148],"decline":[90],"culturally":[92],"distant":[93],"Notably,":[95],"our":[96,122],"approaches":[97],"achieve":[98],"performance":[100],"out":[103],"evaluated":[106],"datasets,":[107],"demonstrating":[108],"the":[109],"effectiveness":[110],"world":[115],"understanding.":[117],"also":[119],"find":[120],"that":[121],"approach":[125],"does":[126],"not":[127],"consistently":[128],"outperform":[129],"all":[133],"settings,":[134],"suggesting":[135],"already":[138],"encode":[139],"substantial":[140],"knowledge.":[142],"framework":[145],"benchmarking":[147],"contribute":[149],"understanding":[151],"how":[152],"far":[153],"current":[154],"are":[156],"from":[157],"achieving":[158],"universal":[159],"representations":[161],"while":[162],"establishing":[163],"metrics":[164],"future":[166],"progress.":[167]},"counts_by_year":[],"updated_date":"2025-12-05T23:25:22.460635","created_date":"2025-12-05T00:00:00"}
