{"id":"https://openalex.org/W3015847222","doi":"https://doi.org/10.1109/icassp40776.2020.9053257","title":"Similarity Learning For Cover Song Identification Using Cross-Similarity Matrices of Multi-Level Deep Sequences","display_name":"Similarity Learning For Cover Song Identification Using Cross-Similarity Matrices of Multi-Level Deep Sequences","publication_year":2020,"publication_date":"2020-04-09","ids":{"openalex":"https://openalex.org/W3015847222","doi":"https://doi.org/10.1109/icassp40776.2020.9053257","mag":"3015847222"},"language":"en","primary_location":{"id":"doi:10.1109/icassp40776.2020.9053257","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9053257","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5062777592","display_name":"Chaoya Jiang","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chaoya Jiang","raw_affiliation_strings":["Wangxuan Institute of Computer Technology, Peking University"],"affiliations":[{"raw_affiliation_string":"Wangxuan Institute of Computer Technology, Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100885747","display_name":"Deshun Yang","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Deshun Yang","raw_affiliation_strings":["Wangxuan Institute of Computer Technology, Peking University"],"affiliations":[{"raw_affiliation_string":"Wangxuan Institute of Computer Technology, Peking University","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017207620","display_name":"Xiaoou Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoou Chen","raw_affiliation_strings":["Wangxuan Institute of Computer Technology, Peking University"],"affiliations":[{"raw_affiliation_string":"Wangxuan Institute of Computer Technology, Peking University","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5062777592"],"corresponding_institution_ids":["https://openalex.org/I20231570"],"apc_list":null,"apc_paid":null,"fwci":1.8184,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.85437788,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"26","last_page":"30"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9857000112533569,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.8720594048500061},{"id":"https://openalex.org/keywords/similarity-learning","display_name":"Similarity learning","score":0.6850852966308594},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6809053421020508},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6534163355827332},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.6050130128860474},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.5870639085769653},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.573599100112915},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5564278364181519},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5316710472106934},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5161626935005188},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5155184268951416},{"id":"https://openalex.org/keywords/similitude","display_name":"Similitude","score":0.4535546898841858},{"id":"https://openalex.org/keywords/cover","display_name":"Cover (algebra)","score":0.4518454074859619},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.443400114774704},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.4116997718811035},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07158148288726807},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.07051011919975281}],"concepts":[{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.8720594048500061},{"id":"https://openalex.org/C2779597229","wikidata":"https://www.wikidata.org/wiki/Q17146505","display_name":"Similarity learning","level":3,"score":0.6850852966308594},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6809053421020508},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6534163355827332},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.6050130128860474},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.5870639085769653},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.573599100112915},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5564278364181519},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5316710472106934},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5161626935005188},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5155184268951416},{"id":"https://openalex.org/C143271835","wikidata":"https://www.wikidata.org/wiki/Q254515","display_name":"Similitude","level":2,"score":0.4535546898841858},{"id":"https://openalex.org/C2780428219","wikidata":"https://www.wikidata.org/wiki/Q16952335","display_name":"Cover (algebra)","level":2,"score":0.4518454074859619},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.443400114774704},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.4116997718811035},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07158148288726807},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.07051011919975281},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp40776.2020.9053257","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp40776.2020.9053257","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2020 - 2020 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W166844666","https://openalex.org/W216397362","https://openalex.org/W1486009449","https://openalex.org/W1493535305","https://openalex.org/W1505667669","https://openalex.org/W2076608692","https://openalex.org/W2101642281","https://openalex.org/W2111007352","https://openalex.org/W2112796928","https://openalex.org/W2131739315","https://openalex.org/W2137319814","https://openalex.org/W2191779130","https://openalex.org/W2295756080","https://openalex.org/W2408482937","https://openalex.org/W2538860156","https://openalex.org/W2587288237","https://openalex.org/W2611198916","https://openalex.org/W2727839354","https://openalex.org/W2740932163","https://openalex.org/W2772072643","https://openalex.org/W2896276533","https://openalex.org/W2903337088","https://openalex.org/W2963840672","https://openalex.org/W2965178495","https://openalex.org/W4206856897","https://openalex.org/W6608682707","https://openalex.org/W6628883615","https://openalex.org/W6630030631","https://openalex.org/W6676368125","https://openalex.org/W6696085341","https://openalex.org/W6714078465","https://openalex.org/W6729231832","https://openalex.org/W6746244618","https://openalex.org/W6756466442","https://openalex.org/W6807223892"],"related_works":["https://openalex.org/W2372745973","https://openalex.org/W2366015234","https://openalex.org/W1845928302","https://openalex.org/W3015847222","https://openalex.org/W4205694692","https://openalex.org/W3208753052","https://openalex.org/W2945501053","https://openalex.org/W2890533838","https://openalex.org/W4286892842","https://openalex.org/W4226448809"],"abstract_inverted_index":{"In":[0,53],"recent":[1],"years,":[2],"several":[3,132],"deep":[4,83,107],"learning":[5,81],"models":[6],"have":[7,16],"been":[8,17],"proposed":[9,140],"for":[10,24,38,63,80],"cover":[11],"song":[12],"identification":[13],"and":[14,89,120],"they":[15],"designed":[18],"to":[19,122],"learn":[20],"fixed-length":[21,51],"feature":[22],"vectors":[23],"music":[25,64,87],"tracks.":[26,113],"However,":[27],"the":[28,40,82,90,101,106,136,139],"aspect":[29],"of":[30,33,72,86,109,112,138],"temporal":[31],"progression":[32],"music,":[34],"which":[35,97],"is":[36,46,77,92],"important":[37],"measuring":[39],"melody":[41,65,125],"similarity":[42,66,94,126],"between":[43],"two":[44,73,115],"tracks,":[45,88],"not":[47],"well":[48],"represented":[49],"by":[50],"vectors.":[52],"this":[54],"paper,":[55],"we":[56],"propose":[57],"a":[58,78,93,110],"new":[59],"Siamese":[60],"network":[61,79,96],"architecture":[62,70],"metric":[67],"learning.":[68],"The":[69,114],"consists":[71],"parts.":[74],"One":[75],"part":[76],"sequence":[84],"representation":[85],"other":[91],"estimation":[95],"takes":[98],"as":[99],"input":[100],"cross-similarity":[102],"matrices":[103],"calculated":[104],"from":[105],"sequences":[108],"pair":[111],"networks":[116],"are":[117],"jointly":[118],"trained":[119],"optimized":[121],"achieve":[123],"high":[124],"prediction":[127],"accuracy.":[128],"Experiments":[129],"conducted":[130],"on":[131],"public":[133],"datasets":[134],"demonstrate":[135],"superiority":[137],"architecture.":[141]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":2}],"updated_date":"2026-01-13T01:12:25.745995","created_date":"2025-10-10T00:00:00"}
