{"id":"https://openalex.org/W2160147944","doi":"https://doi.org/10.1109/icassp.2006.1661199","title":"Enhancing Similarity Matrices for Music Audio Analysis","display_name":"Enhancing Similarity Matrices for Music Audio Analysis","publication_year":2006,"publication_date":"2006-08-02","ids":{"openalex":"https://openalex.org/W2160147944","doi":"https://doi.org/10.1109/icassp.2006.1661199","mag":"2160147944"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2006.1661199","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2006.1661199","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2006 IEEE International Conference on Acoustics Speed and Signal Processing Proceedings","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109881851","display_name":"Meinard M\u00fcller","orcid":null},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"M. Muller","raw_affiliation_strings":["Department of Computer Science III, University of Bonn, Bonn, Germany"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science III, University of Bonn, Bonn, Germany","institution_ids":["https://openalex.org/I135140700"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009152780","display_name":"Frank Kurth","orcid":"https://orcid.org/0000-0002-9992-083X"},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"F. Kurth","raw_affiliation_strings":["Department of Computer Science III, University of Bonn, Bonn, Germany"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science III, University of Bonn, Bonn, Germany","institution_ids":["https://openalex.org/I135140700"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5109881851"],"corresponding_institution_ids":["https://openalex.org/I135140700"],"apc_list":null,"apc_paid":null,"fwci":3.5465,"has_fulltext":false,"cited_by_count":38,"citation_normalized_percentile":{"value":0.9319406,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"5","issue":null,"first_page":"V","last_page":"9"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9945999979972839,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7712913155555725},{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.7682434916496277},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5838831067085266},{"id":"https://openalex.org/keywords/sketch","display_name":"Sketch","score":0.5724676847457886},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5036508440971375},{"id":"https://openalex.org/keywords/audio-analyzer","display_name":"Audio analyzer","score":0.4592890441417694},{"id":"https://openalex.org/keywords/audio-signal-processing","display_name":"Audio signal processing","score":0.44257014989852905},{"id":"https://openalex.org/keywords/synchronization","display_name":"Synchronization (alternating current)","score":0.4385102093219757},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.4262388050556183},{"id":"https://openalex.org/keywords/matrix-decomposition","display_name":"Matrix decomposition","score":0.4216213524341583},{"id":"https://openalex.org/keywords/audio-signal","display_name":"Audio signal","score":0.37520334124565125},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.37269920110702515},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35531994700431824},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3405376672744751},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2870211601257324},{"id":"https://openalex.org/keywords/speech-coding","display_name":"Speech coding","score":0.20762845873832703},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.11184141039848328}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7712913155555725},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.7682434916496277},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5838831067085266},{"id":"https://openalex.org/C2779231336","wikidata":"https://www.wikidata.org/wiki/Q7534724","display_name":"Sketch","level":2,"score":0.5724676847457886},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5036508440971375},{"id":"https://openalex.org/C160372630","wikidata":"https://www.wikidata.org/wiki/Q4819855","display_name":"Audio analyzer","level":5,"score":0.4592890441417694},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.44257014989852905},{"id":"https://openalex.org/C2778562939","wikidata":"https://www.wikidata.org/wiki/Q1298791","display_name":"Synchronization (alternating current)","level":3,"score":0.4385102093219757},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.4262388050556183},{"id":"https://openalex.org/C42355184","wikidata":"https://www.wikidata.org/wiki/Q1361088","display_name":"Matrix decomposition","level":3,"score":0.4216213524341583},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.37520334124565125},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.37269920110702515},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35531994700431824},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3405376672744751},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2870211601257324},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.20762845873832703},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.11184141039848328},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/icassp.2006.1661199","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2006.1661199","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2006 IEEE International Conference on Acoustics Speed and Signal Processing Proceedings","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.128.1956","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.128.1956","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.uni-bonn.de/~meinard/publications/06_MuKu_ICASSP.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":10,"referenced_works":["https://openalex.org/W9205999","https://openalex.org/W152645600","https://openalex.org/W166844666","https://openalex.org/W2008765103","https://openalex.org/W2106374173","https://openalex.org/W2139107403","https://openalex.org/W2143235280","https://openalex.org/W2153331925","https://openalex.org/W6600360952","https://openalex.org/W6652214876"],"related_works":["https://openalex.org/W2098934641","https://openalex.org/W2494533082","https://openalex.org/W1975359510","https://openalex.org/W4214771044","https://openalex.org/W4387698063","https://openalex.org/W4382560817","https://openalex.org/W1611900921","https://openalex.org/W3110605476","https://openalex.org/W2766269877","https://openalex.org/W2363106653"],"abstract_inverted_index":{"Similarity":[0],"matrices":[1,31,54],"have":[2],"become":[3],"an":[4,45,108],"important":[5],"tool":[6],"in":[7,97],"music":[8],"audio":[9,69,121,124],"analysis.":[10],"However,":[11],"the":[12,21,25,49,86,103,112,118],"quadratic":[13],"time":[14],"and":[15,67,100,123,128],"space":[16],"complexity":[17],"as":[18,20],"well":[19],"intricacy":[22],"of":[23,52,65,114,120],"extracting":[24],"desired":[26],"structural":[27,50],"information":[28,84],"from":[29],"these":[30],"are":[32],"often":[33],"prohibitive":[34],"with":[35],"regard":[36],"to":[37,94,117],"real-world":[38],"applications.":[39],"In":[40],"this":[41],"paper,":[42],"we":[43,60,80,110],"describe":[44],"approach":[46],"for":[47],"enhancing":[48],"properties":[51],"similarity":[53,88],"based":[55],"on":[56],"two":[57],"concepts:":[58],"first,":[59],"introduce":[61],"a":[62,77],"new":[63],"class":[64],"robust":[66],"scalable":[68],"features":[70],"which":[71],"absorb":[72],"local":[73,87],"temporal":[74],"variations.":[75],"As":[76,107],"second":[78],"contribution,":[79],"then":[81],"incorporate":[82],"contextual":[83],"into":[85],"measure.":[89],"The":[90],"resulting":[91],"enhancement":[92],"leads":[93],"significant":[95],"reduction":[96],"matrix":[98],"size":[99],"also":[101],"eases":[102],"structure":[104],"extraction":[105],"step.":[106],"example,":[109],"sketch":[111],"application":[113],"our":[115],"techniques":[116],"problems":[119],"summarization":[122],"synchronization,":[125],"obtaining":[126],"effective":[127],"computationally":[129],"feasible":[130],"algorithms":[131]},"counts_by_year":[{"year":2023,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":1},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":4},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":4}],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-10T00:00:00"}
