{"id":"https://openalex.org/W2906214917","doi":"https://doi.org/10.1109/msp.2018.2869928","title":"Automatic Music Transcription: An Overview","display_name":"Automatic Music Transcription: An Overview","publication_year":2018,"publication_date":"2018-12-25","ids":{"openalex":"https://openalex.org/W2906214917","doi":"https://doi.org/10.1109/msp.2018.2869928","mag":"2906214917"},"language":"en","primary_location":{"id":"doi:10.1109/msp.2018.2869928","is_oa":false,"landing_page_url":"https://doi.org/10.1109/msp.2018.2869928","pdf_url":null,"source":{"id":"https://openalex.org/S120977877","display_name":"IEEE Signal Processing Magazine","issn_l":"1053-5888","issn":["1053-5888","1558-0792"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Magazine","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://qmro.qmul.ac.uk/xmlui/bitstream/123456789/54987/1/Benetos%20Automatic%20Music%20Transcription%202019%20Accepted.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084672392","display_name":"Emmanouil Benetos","orcid":null},"institutions":[{"id":"https://openalex.org/I166337079","display_name":"Queen Mary University of London","ror":"https://ror.org/026zzn846","country_code":"GB","type":"education","lineage":["https://openalex.org/I124357947","https://openalex.org/I166337079"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Emmanouil Benetos","raw_affiliation_strings":["Electronic engineering, Queen Mary University of London"],"affiliations":[{"raw_affiliation_string":"Electronic engineering, Queen Mary University of London","institution_ids":["https://openalex.org/I166337079"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5077484271","display_name":"Simon Dixon","orcid":"https://orcid.org/0000-0002-6098-481X"},"institutions":[{"id":"https://openalex.org/I129604602","display_name":"The University of Sydney","ror":"https://ror.org/0384j8v12","country_code":"AU","type":"education","lineage":["https://openalex.org/I129604602"]}],"countries":["AU"],"is_corresponding":false,"raw_author_name":"Simon Dixon","raw_affiliation_strings":["Computer science, University of Sydney, Australia"],"affiliations":[{"raw_affiliation_string":"Computer science, University of Sydney, Australia","institution_ids":["https://openalex.org/I129604602"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102749436","display_name":"Zhiyao Duan","orcid":"https://orcid.org/0000-0002-8334-9974"},"institutions":[{"id":"https://openalex.org/I5388228","display_name":"University of Rochester","ror":"https://ror.org/022kthw22","country_code":"US","type":"education","lineage":["https://openalex.org/I5388228"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhiyao Duan","raw_affiliation_strings":["Electrical and Computer Engineering Department, University of Rochester, New York"],"affiliations":[{"raw_affiliation_string":"Electrical and Computer Engineering Department, University of Rochester, New York","institution_ids":["https://openalex.org/I5388228"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001413512","display_name":"Sebastian Ewert","orcid":"https://orcid.org/0000-0002-0718-0476"},"institutions":[{"id":"https://openalex.org/I135140700","display_name":"University of Bonn","ror":"https://ror.org/041nas322","country_code":"DE","type":"education","lineage":["https://openalex.org/I135140700"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Sebastian Ewert","raw_affiliation_strings":["Computer science, University of Bonn, Germany"],"affiliations":[{"raw_affiliation_string":"Computer science, University of Bonn, Germany","institution_ids":["https://openalex.org/I135140700"]}]}],"institutions":[],"countries_distinct_count":4,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5084672392"],"corresponding_institution_ids":["https://openalex.org/I166337079"],"apc_list":null,"apc_paid":null,"fwci":12.9468,"has_fulltext":true,"cited_by_count":272,"citation_normalized_percentile":{"value":0.99184552,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"36","issue":"1","first_page":"20","last_page":"30"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7359145283699036},{"id":"https://openalex.org/keywords/musical-notation","display_name":"Musical notation","score":0.7335213422775269},{"id":"https://openalex.org/keywords/notation","display_name":"Notation","score":0.6238664388656616},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.598797082901001},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5808910131454468},{"id":"https://openalex.org/keywords/transcription","display_name":"Transcription (linguistics)","score":0.5406519770622253},{"id":"https://openalex.org/keywords/music-perception","display_name":"Music perception","score":0.523106575012207},{"id":"https://openalex.org/keywords/audio-signal-processing","display_name":"Audio signal processing","score":0.5201557278633118},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.4962771534919739},{"id":"https://openalex.org/keywords/music-psychology","display_name":"Music psychology","score":0.4417489767074585},{"id":"https://openalex.org/keywords/audio-signal","display_name":"Audio signal","score":0.42598670721054077},{"id":"https://openalex.org/keywords/music-theory","display_name":"Music theory","score":0.418832004070282},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3879253566265106},{"id":"https://openalex.org/keywords/musical","display_name":"Musical","score":0.3651743233203888},{"id":"https://openalex.org/keywords/speech-coding","display_name":"Speech coding","score":0.08471560478210449}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7359145283699036},{"id":"https://openalex.org/C88639978","wikidata":"https://www.wikidata.org/wiki/Q233861","display_name":"Musical notation","level":3,"score":0.7335213422775269},{"id":"https://openalex.org/C45357846","wikidata":"https://www.wikidata.org/wiki/Q2001982","display_name":"Notation","level":2,"score":0.6238664388656616},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.598797082901001},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5808910131454468},{"id":"https://openalex.org/C179926584","wikidata":"https://www.wikidata.org/wiki/Q207714","display_name":"Transcription (linguistics)","level":2,"score":0.5406519770622253},{"id":"https://openalex.org/C2987788386","wikidata":"https://www.wikidata.org/wiki/Q476590","display_name":"Music perception","level":3,"score":0.523106575012207},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.5201557278633118},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.4962771534919739},{"id":"https://openalex.org/C146902061","wikidata":"https://www.wikidata.org/wiki/Q476590","display_name":"Music psychology","level":3,"score":0.4417489767074585},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.42598670721054077},{"id":"https://openalex.org/C143857728","wikidata":"https://www.wikidata.org/wiki/Q193544","display_name":"Music theory","level":3,"score":0.418832004070282},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3879253566265106},{"id":"https://openalex.org/C558565934","wikidata":"https://www.wikidata.org/wiki/Q2743","display_name":"Musical","level":2,"score":0.3651743233203888},{"id":"https://openalex.org/C13895895","wikidata":"https://www.wikidata.org/wiki/Q3270773","display_name":"Speech coding","level":2,"score":0.08471560478210449},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0},{"id":"https://openalex.org/C94375191","wikidata":"https://www.wikidata.org/wiki/Q11205","display_name":"Arithmetic","level":1,"score":0.0},{"id":"https://openalex.org/C153349607","wikidata":"https://www.wikidata.org/wiki/Q36649","display_name":"Visual arts","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/msp.2018.2869928","is_oa":false,"landing_page_url":"https://doi.org/10.1109/msp.2018.2869928","pdf_url":null,"source":{"id":"https://openalex.org/S120977877","display_name":"IEEE Signal Processing Magazine","issn_l":"1053-5888","issn":["1053-5888","1558-0792"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Signal Processing Magazine","raw_type":"journal-article"},{"id":"pmh:oai:qmro.qmul.ac.uk:123456789/54987","is_oa":true,"landing_page_url":"https://qmro.qmul.ac.uk/xmlui/handle/123456789/54987","pdf_url":"https://qmro.qmul.ac.uk/xmlui/bitstream/123456789/54987/1/Benetos%20Automatic%20Music%20Transcription%202019%20Accepted.pdf","source":{"id":"https://openalex.org/S4306400530","display_name":"Queen Mary Research Online (Queen Mary University of London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I166337079","host_organization_name":"Queen Mary University of London","host_organization_lineage":["https://openalex.org/I166337079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"}],"best_oa_location":{"id":"pmh:oai:qmro.qmul.ac.uk:123456789/54987","is_oa":true,"landing_page_url":"https://qmro.qmul.ac.uk/xmlui/handle/123456789/54987","pdf_url":"https://qmro.qmul.ac.uk/xmlui/bitstream/123456789/54987/1/Benetos%20Automatic%20Music%20Transcription%202019%20Accepted.pdf","source":{"id":"https://openalex.org/S4306400530","display_name":"Queen Mary Research Online (Queen Mary University of London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I166337079","host_organization_name":"Queen Mary University of London","host_organization_lineage":["https://openalex.org/I166337079"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"},"sustainable_development_goals":[{"score":0.7799999713897705,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G3667855123","display_name":null,"funder_award_id":"AH/L01016X/1","funder_id":"https://openalex.org/F4320334609","funder_display_name":"Arts and Humanities Research Council"},{"id":"https://openalex.org/G4327335547","display_name":null,"funder_award_id":"RF/128","funder_id":"https://openalex.org/F4320320005","funder_display_name":"Royal Academy of Engineering"},{"id":"https://openalex.org/G6872237731","display_name":null,"funder_award_id":"ES/R004005/1","funder_id":"https://openalex.org/F4320334630","funder_display_name":"Economic and Social Research Council"}],"funders":[{"id":"https://openalex.org/F4320320005","display_name":"Royal Academy of Engineering","ror":"https://ror.org/0526snb40"},{"id":"https://openalex.org/F4320334609","display_name":"Arts and Humanities Research Council","ror":"https://ror.org/0505m1554"},{"id":"https://openalex.org/F4320334630","display_name":"Economic and Social Research Council","ror":"https://ror.org/03n0ht308"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2906214917.pdf","grobid_xml":"https://content.openalex.org/works/W2906214917.grobid-xml"},"referenced_works_count":50,"referenced_works":["https://openalex.org/W56135412","https://openalex.org/W129413713","https://openalex.org/W1492730469","https://openalex.org/W1819710477","https://openalex.org/W2001426554","https://openalex.org/W2017416504","https://openalex.org/W2017578549","https://openalex.org/W2031767620","https://openalex.org/W2065495703","https://openalex.org/W2095401277","https://openalex.org/W2096482524","https://openalex.org/W2101212989","https://openalex.org/W2104298926","https://openalex.org/W2105143211","https://openalex.org/W2107328928","https://openalex.org/W2110007838","https://openalex.org/W2125969424","https://openalex.org/W2127566601","https://openalex.org/W2129150855","https://openalex.org/W2135029798","https://openalex.org/W2152937398","https://openalex.org/W2158983491","https://openalex.org/W2198584637","https://openalex.org/W2294414398","https://openalex.org/W2295460171","https://openalex.org/W2396710372","https://openalex.org/W2416173453","https://openalex.org/W2494437503","https://openalex.org/W2523056285","https://openalex.org/W2577545569","https://openalex.org/W2593836007","https://openalex.org/W2728379535","https://openalex.org/W2759976799","https://openalex.org/W2771644120","https://openalex.org/W2950335938","https://openalex.org/W2962968839","https://openalex.org/W2963551352","https://openalex.org/W3100135054","https://openalex.org/W3143596294","https://openalex.org/W4293775315","https://openalex.org/W6602266860","https://openalex.org/W6629679824","https://openalex.org/W6680012447","https://openalex.org/W6697000175","https://openalex.org/W6697419627","https://openalex.org/W6712289847","https://openalex.org/W6727368055","https://openalex.org/W6732146819","https://openalex.org/W6733936739","https://openalex.org/W6745851314"],"related_works":["https://openalex.org/W4319230458","https://openalex.org/W3010806639","https://openalex.org/W4283766067","https://openalex.org/W2155953287","https://openalex.org/W2046791347","https://openalex.org/W2115723883","https://openalex.org/W3213696209","https://openalex.org/W4214514892","https://openalex.org/W1921028264","https://openalex.org/W2040640823"],"abstract_inverted_index":{"The":[0],"capability":[1],"of":[2,13,44,55,87],"transcribing":[3],"music":[4,7,38,50,56],"audio":[5],"into":[6,52],"notation":[8],"is":[9,58],"a":[10,59],"fascinating":[11],"example":[12],"human":[14],"intelligence.":[15,67],"It":[16,68],"involves":[17],"perception":[18],"(analyzing":[19],"complex":[20],"auditory":[21],"scenes),":[22],"cognition":[23],"(recognizing":[24],"musical":[25,30],"objects),":[26],"knowledge":[27],"representation":[28],"(forming":[29],"structures),":[31],"and":[32,65,77,83,90,92],"inference":[33],"(testing":[34],"alternative":[35],"hypotheses).":[36],"Automatic":[37],"transcription":[39],"(AMT),":[40],"i.e.,":[41],"the":[42],"design":[43],"computational":[45],"algorithms":[46],"to":[47],"convert":[48],"acoustic":[49],"signals":[51],"some":[53],"form":[54],"notation,":[57],"challenging":[60],"task":[61],"in":[62],"signal":[63],"processing":[64],"artificial":[66],"comprises":[69],"several":[70],"subtasks,":[71],"including":[72],"multipitch":[73],"estimation":[74],"(MPE),":[75],"onset":[76],"offset":[78],"detection,":[79],"instrument":[80],"recognition,":[81],"beat":[82],"rhythm":[84],"tracking,":[85],"interpretation":[86],"expressive":[88],"timing":[89],"dynamics,":[91],"score":[93],"typesetting.":[94]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":37},{"year":2024,"cited_by_count":70},{"year":2023,"cited_by_count":37},{"year":2022,"cited_by_count":44},{"year":2021,"cited_by_count":40},{"year":2020,"cited_by_count":26},{"year":2019,"cited_by_count":11},{"year":2018,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
