{"id":"https://openalex.org/W4224941193","doi":"https://doi.org/10.1109/icassp43922.2022.9747629","title":"Hierarchical Graph-Based Neural Network for Singing Melody Extraction","display_name":"Hierarchical Graph-Based Neural Network for Singing Melody Extraction","publication_year":2022,"publication_date":"2022-04-27","ids":{"openalex":"https://openalex.org/W4224941193","doi":"https://doi.org/10.1109/icassp43922.2022.9747629"},"language":"en","primary_location":{"id":"doi:10.1109/icassp43922.2022.9747629","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp43922.2022.9747629","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011482849","display_name":"Shuai Yu","orcid":"https://orcid.org/0000-0003-1847-563X"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shuai Yu","raw_affiliation_strings":["Fudan University,School of Computer Science and Technology,Shanghai,China","School of Computer Science and Technology, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University,School of Computer Science and Technology,Shanghai,China","institution_ids":["https://openalex.org/I24943067"]},{"raw_affiliation_string":"School of Computer Science and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100330011","display_name":"Xi Chen","orcid":"https://orcid.org/0000-0003-0248-8161"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xi Chen","raw_affiliation_strings":["Fudan University,School of Computer Science and Technology,Shanghai,China","School of Computer Science and Technology, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University,School of Computer Science and Technology,Shanghai,China","institution_ids":["https://openalex.org/I24943067"]},{"raw_affiliation_string":"School of Computer Science and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100318193","display_name":"Wei Li","orcid":"https://orcid.org/0000-0002-4486-8341"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Li","raw_affiliation_strings":["Fudan University,School of Computer Science and Technology,Shanghai,China","Shanghai Key Laboratory of Intelligent Information Processing, Fudan University, Shanghai, China","School of Computer Science and Technology, Fudan University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Fudan University,School of Computer Science and Technology,Shanghai,China","institution_ids":["https://openalex.org/I24943067"]},{"raw_affiliation_string":"Shanghai Key Laboratory of Intelligent Information Processing, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]},{"raw_affiliation_string":"School of Computer Science and Technology, Fudan University, Shanghai, China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5011482849"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":1.841,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.87835703,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"626","last_page":"630"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9879000186920166,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7826793193817139},{"id":"https://openalex.org/keywords/singing","display_name":"Singing","score":0.7072400450706482},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.6343851685523987},{"id":"https://openalex.org/keywords/polyphony","display_name":"Polyphony","score":0.593584418296814},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4984593391418457},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4692133963108063},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.4660400450229645},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.4524553716182709},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.41340962052345276},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.3534508943557739},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3339928686618805},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3046805262565613}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7826793193817139},{"id":"https://openalex.org/C44819458","wikidata":"https://www.wikidata.org/wiki/Q27939","display_name":"Singing","level":2,"score":0.7072400450706482},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.6343851685523987},{"id":"https://openalex.org/C128979739","wikidata":"https://www.wikidata.org/wiki/Q179465","display_name":"Polyphony","level":2,"score":0.593584418296814},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4984593391418457},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4692133963108063},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.4660400450229645},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4524553716182709},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.41340962052345276},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.3534508943557739},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3339928686618805},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3046805262565613},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp43922.2022.9747629","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp43922.2022.9747629","pdf_url":null,"source":{"id":"https://openalex.org/S4363607702","display_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2022 - 2022 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.7099999785423279}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W1493535305","https://openalex.org/W1973397896","https://openalex.org/W2001426554","https://openalex.org/W2134025364","https://openalex.org/W2161632835","https://openalex.org/W2550553598","https://openalex.org/W2747756448","https://openalex.org/W2752782242","https://openalex.org/W2884585870","https://openalex.org/W2963158112","https://openalex.org/W2963495494","https://openalex.org/W2963535133","https://openalex.org/W2964015378","https://openalex.org/W2964177567","https://openalex.org/W3015608758","https://openalex.org/W3131937837","https://openalex.org/W3191088441","https://openalex.org/W4221165769","https://openalex.org/W6726873649","https://openalex.org/W6753412334"],"related_works":["https://openalex.org/W2122830402","https://openalex.org/W3107474891","https://openalex.org/W2676493621","https://openalex.org/W178932670","https://openalex.org/W2935701729","https://openalex.org/W2130581557","https://openalex.org/W2811390910","https://openalex.org/W1728708896","https://openalex.org/W4293731510","https://openalex.org/W2143835785"],"abstract_inverted_index":{"Singing":[0],"melody":[1,44,86],"extraction":[2],"from":[3],"polyphonic":[4],"music":[5,13],"is":[6,30,110,132],"a":[7,36,79,105],"critical":[8],"and":[9,25,32,69,136],"challenging":[10,33],"task":[11],"in":[12,66,118],"information":[14],"retrieval":[15],"(MIR).":[16],"However,":[17],"due":[18],"to":[19,34,57,91,112,122,134],"the":[20,23,26,42,52,59,63,67,70,95,100,114,119,124,138,146,149],"interfere":[21],"of":[22,94,148],"accompaniment":[24],"background":[27],"noise,":[28],"it":[29],"key":[31],"obtain":[35,113],"global":[37,60,64,115],"semantic":[38,61,116],"representation":[39,117],"that":[40,55],"discriminates":[41],"singing":[43,85],"line.":[45],"To":[46],"address":[47],"this":[48,75],"issue,":[49],"we":[50,77,97],"consider":[51],"two":[53],"aspects":[54],"regards":[56],"obtaining":[58],"representation:":[62],"relationships":[65,71,125],"spectrum":[68,101],"between":[72,126,140],"channels.":[73,141],"In":[74,88],"paper,":[76],"propose":[78],"novel":[80],"hierarchical":[81],"graph-based":[82],"network":[83,109],"for":[84],"extraction.":[87],"particular,":[89],"according":[90],"its":[92],"characteristics":[93],"spectrum,":[96],"first":[98],"model":[99],"into":[102],"graph":[103,107,129],"structure,":[104],"two-layer":[106],"convolution":[108,130],"used":[111],"spectrum.":[120],"Then":[121],"capture":[123,135],"channels,":[127],"channel-wise":[128],"module":[131],"devised":[133],"reasoning":[137],"relationship":[139],"The":[142],"conducted":[143],"experiments":[144],"demonstrate":[145],"effectiveness":[147],"proposed":[150],"network.":[151]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
