{"id":"https://openalex.org/W4390463217","doi":"https://doi.org/10.1587/transinf.2023mul0003","title":"CQTXNet: A Modified Xception Network with Attention Modules for Cover Song Identification","display_name":"CQTXNet: A Modified Xception Network with Attention Modules for Cover Song Identification","publication_year":2023,"publication_date":"2023-12-31","ids":{"openalex":"https://openalex.org/W4390463217","doi":"https://doi.org/10.1587/transinf.2023mul0003"},"language":"en","primary_location":{"id":"doi:10.1587/transinf.2023mul0003","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2023mul0003","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E107.D/1/E107.D_2023MUL0003/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://www.jstage.jst.go.jp/article/transinf/E107.D/1/E107.D_2023MUL0003/_pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113085531","display_name":"Jinsoo SEO","orcid":null},"institutions":[{"id":"https://openalex.org/I133533813","display_name":"Gangneung\u2013Wonju National University","ror":"https://ror.org/0461cvh40","country_code":"KR","type":"education","lineage":["https://openalex.org/I133533813"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Jinsoo SEO","raw_affiliation_strings":["Department of Electrical Engineering, Gangneung-Wonju National University"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Gangneung-Wonju National University","institution_ids":["https://openalex.org/I133533813"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100349772","display_name":"Jung-Hyun Kim","orcid":"https://orcid.org/0000-0002-9500-1537"},"institutions":[{"id":"https://openalex.org/I142401562","display_name":"Electronics and Telecommunications Research Institute","ror":"https://ror.org/03ysstz10","country_code":"KR","type":"facility","lineage":["https://openalex.org/I142401562","https://openalex.org/I2801339556","https://openalex.org/I4210144908","https://openalex.org/I4387152098"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Junghyun KIM","raw_affiliation_strings":["Content Research Division, Electronics and Telecommunications Research Institute"],"affiliations":[{"raw_affiliation_string":"Content Research Division, Electronics and Telecommunications Research Institute","institution_ids":["https://openalex.org/I142401562"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076443181","display_name":"Hyemi Kim","orcid":"https://orcid.org/0000-0003-4713-4658"},"institutions":[{"id":"https://openalex.org/I142401562","display_name":"Electronics and Telecommunications Research Institute","ror":"https://ror.org/03ysstz10","country_code":"KR","type":"facility","lineage":["https://openalex.org/I142401562","https://openalex.org/I2801339556","https://openalex.org/I4210144908","https://openalex.org/I4387152098"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Hyemi KIM","raw_affiliation_strings":["Content Research Division, Electronics and Telecommunications Research Institute"],"affiliations":[{"raw_affiliation_string":"Content Research Division, Electronics and Telecommunications Research Institute","institution_ids":["https://openalex.org/I142401562"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5113085531"],"corresponding_institution_ids":["https://openalex.org/I133533813"],"apc_list":null,"apc_paid":null,"fwci":0.6022,"has_fulltext":true,"cited_by_count":3,"citation_normalized_percentile":{"value":0.67930137,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":99},"biblio":{"volume":"E107.D","issue":"1","first_page":"49","last_page":"52"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13996","display_name":"Diverse Musicological Studies","score":0.9843999743461609,"subfield":{"id":"https://openalex.org/subfields/1210","display_name":"Music"},"field":{"id":"https://openalex.org/fields/12","display_name":"Arts and Humanities"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9771000146865845,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8567146062850952},{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.8449261784553528},{"id":"https://openalex.org/keywords/cover","display_name":"Cover (algebra)","score":0.6884915232658386},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.6164824962615967},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5762052536010742},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.4898187816143036},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.48345741629600525},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4678502678871155},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4213590621948242},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.4123508334159851},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.37320277094841003},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3635615110397339}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8567146062850952},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.8449261784553528},{"id":"https://openalex.org/C2780428219","wikidata":"https://www.wikidata.org/wiki/Q16952335","display_name":"Cover (algebra)","level":2,"score":0.6884915232658386},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.6164824962615967},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5762052536010742},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.4898187816143036},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.48345741629600525},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4678502678871155},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4213590621948242},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.4123508334159851},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37320277094841003},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3635615110397339},{"id":"https://openalex.org/C59822182","wikidata":"https://www.wikidata.org/wiki/Q441","display_name":"Botany","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1587/transinf.2023mul0003","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2023mul0003","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E107.D/1/E107.D_2023MUL0003/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1587/transinf.2023mul0003","is_oa":true,"landing_page_url":"https://doi.org/10.1587/transinf.2023mul0003","pdf_url":"https://www.jstage.jst.go.jp/article/transinf/E107.D/1/E107.D_2023MUL0003/_pdf","source":{"id":"https://openalex.org/S2486202937","display_name":"IEICE Transactions on Information and Systems","issn_l":"0916-8532","issn":["0916-8532","1745-1361"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4320800604","host_organization_name":"Institute of Electronics, Information and Communication Engineers","host_organization_lineage":["https://openalex.org/P4320800604"],"host_organization_lineage_names":["Institute of Electronics, Information and Communication Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEICE Transactions on Information and Systems","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4489101550","display_name":null,"funder_award_id":"CR202104004","funder_id":"https://openalex.org/F4320322006","funder_display_name":"Ministry of Culture, Sports and Tourism"},{"id":"https://openalex.org/G6880294078","display_name":null,"funder_award_id":"CR202104004","funder_id":"https://openalex.org/F4320323890","funder_display_name":"Korea Creative Content Agency"}],"funders":[{"id":"https://openalex.org/F4320322006","display_name":"Ministry of Culture, Sports and Tourism","ror":"https://ror.org/02fkk6k65"},{"id":"https://openalex.org/F4320323890","display_name":"Korea Creative Content Agency","ror":"https://ror.org/036vyg793"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4390463217.pdf","grobid_xml":"https://content.openalex.org/works/W4390463217.grobid-xml"},"referenced_works_count":16,"referenced_works":["https://openalex.org/W1486009449","https://openalex.org/W2137319814","https://openalex.org/W2154473523","https://openalex.org/W2191779130","https://openalex.org/W2194775991","https://openalex.org/W2531409750","https://openalex.org/W2884585870","https://openalex.org/W2896276533","https://openalex.org/W2963163009","https://openalex.org/W2963420686","https://openalex.org/W2998127937","https://openalex.org/W3015271757","https://openalex.org/W3015666964","https://openalex.org/W3146366485","https://openalex.org/W3161928252","https://openalex.org/W4307545940"],"related_works":["https://openalex.org/W2366403280","https://openalex.org/W1495108544","https://openalex.org/W3148229873","https://openalex.org/W2150160875","https://openalex.org/W4242223894","https://openalex.org/W2091301346","https://openalex.org/W1517524280","https://openalex.org/W4389760904","https://openalex.org/W2964954556","https://openalex.org/W3019910406"],"abstract_inverted_index":{"Song-level":[0],"feature":[1,27],"summarization":[2],"is":[3],"fundamental":[4],"for":[5,24,29],"the":[6,52,66,72],"browsing,":[7],"retrieval,":[8],"and":[9,41,71],"indexing":[10],"of":[11,51,68,74],"digital":[12],"music":[13],"archives.":[14],"This":[15],"study":[16],"proposes":[17],"a":[18],"deep":[19],"neural":[20],"network":[21,39,69],"model,":[22],"CQTXNet,":[23],"extracting":[25],"song-level":[26],"summary":[28],"cover":[30,61],"song":[31,62],"identification.":[32],"CQTXNet":[33,54],"incorporates":[34],"depth-wise":[35],"separable":[36],"convolution,":[37],"residual":[38],"connections,":[40],"attention":[42,75],"models":[43],"to":[44],"extend":[45],"previous":[46],"approaches.":[47],"An":[48],"experimental":[49],"evaluation":[50],"proposed":[53],"was":[55],"performed":[56],"on":[57],"two":[58],"publicly":[59],"available":[60],"datasets":[63],"by":[64],"varying":[65],"number":[67],"layers":[70],"type":[73],"modules.":[76]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
