{"id":"https://openalex.org/W4415707758","doi":"https://doi.org/10.1109/icme59968.2025.11210138","title":"HingeNet: A Harmonic-Aware Fine-Tuning Approach for Beat Tracking","display_name":"HingeNet: A Harmonic-Aware Fine-Tuning Approach for Beat Tracking","publication_year":2025,"publication_date":"2025-06-30","ids":{"openalex":"https://openalex.org/W4415707758","doi":"https://doi.org/10.1109/icme59968.2025.11210138"},"language":null,"primary_location":{"id":"doi:10.1109/icme59968.2025.11210138","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11210138","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5060139314","display_name":"Ganghui Ru","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ganghui Ru","raw_affiliation_strings":["Fudan University,School of Computer Science,Shanghai,China"],"affiliations":[{"raw_affiliation_string":"Fudan University,School of Computer Science,Shanghai,China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100731347","display_name":"Jieying Wang","orcid":"https://orcid.org/0000-0002-0085-3551"},"institutions":[{"id":"https://openalex.org/I1312537475","display_name":"Naval Medical Research Command","ror":"https://ror.org/05f421b09","country_code":"US","type":"facility","lineage":["https://openalex.org/I1312537475","https://openalex.org/I1330347796","https://openalex.org/I3130687028","https://openalex.org/I4391768141"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jieying Wang","raw_affiliation_strings":["Naval Medical Center, PLA,China"],"affiliations":[{"raw_affiliation_string":"Naval Medical Center, PLA,China","institution_ids":["https://openalex.org/I1312537475"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5088562282","display_name":"Jiahao Zhao","orcid":"https://orcid.org/0000-0002-8312-7300"},"institutions":[{"id":"https://openalex.org/I22299242","display_name":"Kyoto University","ror":"https://ror.org/02kpeqv85","country_code":"JP","type":"education","lineage":["https://openalex.org/I22299242"]},{"id":"https://openalex.org/I39012071","display_name":"Kyoto College of Graduate Studies for Informatics","ror":"https://ror.org/05mzj8a56","country_code":"JP","type":"education","lineage":["https://openalex.org/I39012071"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Jiahao Zhao","raw_affiliation_strings":["Kyoto University,Graduate School of Informatics,Kyoto,Japan"],"affiliations":[{"raw_affiliation_string":"Kyoto University,Graduate School of Informatics,Kyoto,Japan","institution_ids":["https://openalex.org/I39012071","https://openalex.org/I22299242"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043561002","display_name":"Yulun Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yulun Wu","raw_affiliation_strings":["Fudan University,School of Computer Science,Shanghai,China"],"affiliations":[{"raw_affiliation_string":"Fudan University,School of Computer Science,Shanghai,China","institution_ids":["https://openalex.org/I24943067"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100745222","display_name":"Yi Yu","orcid":"https://orcid.org/0000-0002-0294-6620"},"institutions":[{"id":"https://openalex.org/I113306721","display_name":"Hiroshima University","ror":"https://ror.org/03t78wx29","country_code":"JP","type":"education","lineage":["https://openalex.org/I113306721"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Yi Yu","raw_affiliation_strings":["Hiroshima University,Graduate School of Advanced Science and Engineering,Hiroshima,Japan"],"affiliations":[{"raw_affiliation_string":"Hiroshima University,Graduate School of Advanced Science and Engineering,Hiroshima,Japan","institution_ids":["https://openalex.org/I113306721"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060028296","display_name":"Nannan Jiang","orcid":"https://orcid.org/0000-0003-3375-4805"},"institutions":[{"id":"https://openalex.org/I1312537475","display_name":"Naval Medical Research Command","ror":"https://ror.org/05f421b09","country_code":"US","type":"facility","lineage":["https://openalex.org/I1312537475","https://openalex.org/I1330347796","https://openalex.org/I3130687028","https://openalex.org/I4391768141"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nannan Jiang","raw_affiliation_strings":["Naval Medical Center, PLA,China"],"affiliations":[{"raw_affiliation_string":"Naval Medical Center, PLA,China","institution_ids":["https://openalex.org/I1312537475"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059229969","display_name":"Wei Wang","orcid":"https://orcid.org/0000-0001-9596-2752"},"institutions":[{"id":"https://openalex.org/I1312537475","display_name":"Naval Medical Research Command","ror":"https://ror.org/05f421b09","country_code":"US","type":"facility","lineage":["https://openalex.org/I1312537475","https://openalex.org/I1330347796","https://openalex.org/I3130687028","https://openalex.org/I4391768141"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Wei Wang","raw_affiliation_strings":["Naval Medical Center, PLA,China"],"affiliations":[{"raw_affiliation_string":"Naval Medical Center, PLA,China","institution_ids":["https://openalex.org/I1312537475"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100739392","display_name":"Wei Li","orcid":"https://orcid.org/0000-0002-4308-4385"},"institutions":[{"id":"https://openalex.org/I24943067","display_name":"Fudan University","ror":"https://ror.org/013q1eq08","country_code":"CN","type":"education","lineage":["https://openalex.org/I24943067"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Li","raw_affiliation_strings":["Fudan University,School of Computer Science,Shanghai,China"],"affiliations":[{"raw_affiliation_string":"Fudan University,School of Computer Science,Shanghai,China","institution_ids":["https://openalex.org/I24943067"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5060139314"],"corresponding_institution_ids":["https://openalex.org/I24943067"],"apc_list":null,"apc_paid":null,"fwci":2.5565,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.91006347,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9955000281333923,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11349","display_name":"Music Technology and Sound Studies","score":0.00139999995008111,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.0006000000284984708,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/beat","display_name":"Beat (acoustics)","score":0.621399998664856},{"id":"https://openalex.org/keywords/harmonics","display_name":"Harmonics","score":0.4489000141620636},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.32739999890327454},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.3073999881744385},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.2903999984264374},{"id":"https://openalex.org/keywords/tracking-system","display_name":"Tracking system","score":0.2587999999523163}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6868000030517578},{"id":"https://openalex.org/C189809214","wikidata":"https://www.wikidata.org/wiki/Q829522","display_name":"Beat (acoustics)","level":2,"score":0.621399998664856},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5196999907493591},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5016000270843506},{"id":"https://openalex.org/C188414643","wikidata":"https://www.wikidata.org/wiki/Q3001183","display_name":"Harmonics","level":3,"score":0.4489000141620636},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3384999930858612},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.32739999890327454},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3073999881744385},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.2903999984264374},{"id":"https://openalex.org/C154586513","wikidata":"https://www.wikidata.org/wiki/Q4420972","display_name":"Tracking system","level":3,"score":0.2587999999523163},{"id":"https://openalex.org/C131770355","wikidata":"https://www.wikidata.org/wiki/Q876215","display_name":"Harmonic analysis","level":2,"score":0.25760000944137573},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.25380000472068787},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.25270000100135803},{"id":"https://openalex.org/C2777946086","wikidata":"https://www.wikidata.org/wiki/Q1163335","display_name":"Music information retrieval","level":3,"score":0.25189998745918274},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.251800000667572},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.2502000033855438}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icme59968.2025.11210138","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icme59968.2025.11210138","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Conference on Multimedia and Expo (ICME)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2016885049","https://openalex.org/W2156063659","https://openalex.org/W2172212034","https://openalex.org/W2404176928","https://openalex.org/W3027082420","https://openalex.org/W3098447809","https://openalex.org/W3115894062","https://openalex.org/W4224918587","https://openalex.org/W4280498166","https://openalex.org/W4310987263","https://openalex.org/W4372259908","https://openalex.org/W4372347373","https://openalex.org/W4385152046","https://openalex.org/W4392904213","https://openalex.org/W4413237296"],"related_works":[],"abstract_inverted_index":{"Fine-tuning":[0],"pre-trained":[1,68,91],"foundation":[2,69,92],"models":[3,15,70],"has":[4],"made":[5],"significant":[6],"progress":[7],"in":[8,100,119,132],"music":[9],"information":[10],"retrieval.":[11],"However,":[12],"applying":[13],"these":[14],"to":[16,64,111],"beat":[17,49,101,133],"tracking":[18,50],"tasks":[19],"remains":[20],"unexplored":[21],"as":[22,77],"the":[23,96,108,116],"limited":[24],"annotated":[25],"data":[26],"renders":[27],"conventional":[28],"fine-tuning":[29,44,109],"methods":[30],"ineffective.":[31],"To":[32],"address":[33],"this":[34],"challenge,":[35],"we":[36,103],"propose":[37],"HingeNet,":[38],"a":[39,54,61],"novel":[40],"and":[41,56,114,134],"general":[42],"parameter-efficient":[43],"method":[45],"specifically":[46],"designed":[47,63],"for":[48],"tasks.":[51],"HingeNet":[52,83,128],"is":[53],"lightweight":[55],"separable":[57],"network,":[58],"visually":[59],"resembling":[60],"hinge,":[62],"tightly":[65],"interface":[66],"with":[67,89],"by":[71],"using":[72],"their":[73],"intermediate":[74],"feature":[75],"representations":[76],"input.":[78],"This":[79],"unique":[80],"architecture":[81],"grants":[82],"broad":[84],"generalizability,":[85],"enabling":[86],"effective":[87],"integration":[88],"various":[90],"models.":[93],"Furthermore,":[94],"considering":[95],"significance":[97],"of":[98],"harmonics":[99],"tracking,":[102],"introduce":[104],"harmonic-aware":[105],"mechanism":[106],"during":[107],"process":[110],"better":[112],"capture":[113],"emphasize":[115],"harmonic":[117],"structures":[118],"musical":[120],"signals.":[121],"Experiments":[122],"on":[123],"benchmark":[124],"datasets":[125],"demonstrate":[126],"that":[127],"achieves":[129],"state-of-the-art":[130],"performance":[131],"downbeat":[135],"tracking.":[136]},"counts_by_year":[{"year":2026,"cited_by_count":2}],"updated_date":"2026-04-23T09:07:50.710637","created_date":"2025-10-30T00:00:00"}
