{"id":"https://openalex.org/W4392904623","doi":"https://doi.org/10.1109/icassp48485.2024.10445889","title":"SSL-Net: A Synergistic Spectral and Learning-Based Network for Efficient Bird Sound Classification","display_name":"SSL-Net: A Synergistic Spectral and Learning-Based Network for Efficient Bird Sound Classification","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392904623","doi":"https://doi.org/10.1109/icassp48485.2024.10445889"},"language":"en","primary_location":{"id":"doi:10.1109/icassp48485.2024.10445889","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10445889","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101431368","display_name":"Yiyuan Yang","orcid":"https://orcid.org/0009-0002-8533-6074"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Yiyuan Yang","raw_affiliation_strings":["University of Oxford,Department of Computer Science,United Kingdom","Department of Computer Science, University of Oxford, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Oxford,Department of Computer Science,United Kingdom","institution_ids":["https://openalex.org/I40120149"]},{"raw_affiliation_string":"Department of Computer Science, University of Oxford, United Kingdom","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078078782","display_name":"Kaichen Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Kaichen Zhou","raw_affiliation_strings":["University of Oxford,Department of Computer Science,United Kingdom","Department of Computer Science, University of Oxford, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Oxford,Department of Computer Science,United Kingdom","institution_ids":["https://openalex.org/I40120149"]},{"raw_affiliation_string":"Department of Computer Science, University of Oxford, United Kingdom","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010637110","display_name":"Niki Trigoni","orcid":"https://orcid.org/0000-0001-6236-9645"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Niki Trigoni","raw_affiliation_strings":["University of Oxford,Department of Computer Science,United Kingdom","Department of Computer Science, University of Oxford, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Oxford,Department of Computer Science,United Kingdom","institution_ids":["https://openalex.org/I40120149"]},{"raw_affiliation_string":"Department of Computer Science, University of Oxford, United Kingdom","institution_ids":["https://openalex.org/I40120149"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060183988","display_name":"Andrew Markham","orcid":"https://orcid.org/0000-0001-5716-3941"},"institutions":[{"id":"https://openalex.org/I40120149","display_name":"University of Oxford","ror":"https://ror.org/052gg0110","country_code":"GB","type":"education","lineage":["https://openalex.org/I40120149"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Andrew Markham","raw_affiliation_strings":["University of Oxford,Department of Computer Science,United Kingdom","Department of Computer Science, University of Oxford, United Kingdom"],"affiliations":[{"raw_affiliation_string":"University of Oxford,Department of Computer Science,United Kingdom","institution_ids":["https://openalex.org/I40120149"]},{"raw_affiliation_string":"Department of Computer Science, University of Oxford, United Kingdom","institution_ids":["https://openalex.org/I40120149"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101431368"],"corresponding_institution_ids":["https://openalex.org/I40120149"],"apc_list":null,"apc_paid":null,"fwci":2.17,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.8537931,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"926","last_page":"930"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11665","display_name":"Animal Vocal Communication and Behavior","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1309","display_name":"Developmental Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11665","display_name":"Animal Vocal Communication and Behavior","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1309","display_name":"Developmental Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10659","display_name":"Marine animal studies overview","score":0.958899974822998,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7759867906570435},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.5201423764228821},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.5004744529724121},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4700155556201935},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.4577151834964752},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.43069538474082947},{"id":"https://openalex.org/keywords/abundance","display_name":"Abundance (ecology)","score":0.42572927474975586},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.363180935382843},{"id":"https://openalex.org/keywords/ecology","display_name":"Ecology","score":0.23368966579437256}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7759867906570435},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.5201423764228821},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.5004744529724121},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4700155556201935},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.4577151834964752},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.43069538474082947},{"id":"https://openalex.org/C77077793","wikidata":"https://www.wikidata.org/wiki/Q336019","display_name":"Abundance (ecology)","level":2,"score":0.42572927474975586},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.363180935382843},{"id":"https://openalex.org/C18903297","wikidata":"https://www.wikidata.org/wiki/Q7150","display_name":"Ecology","level":1,"score":0.23368966579437256},{"id":"https://openalex.org/C202444582","wikidata":"https://www.wikidata.org/wiki/Q837863","display_name":"Pure mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp48485.2024.10445889","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10445889","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5199999809265137,"id":"https://metadata.un.org/sdg/14","display_name":"Life below water"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W2194775991","https://openalex.org/W2547875792","https://openalex.org/W2581706890","https://openalex.org/W2913454197","https://openalex.org/W2944806726","https://openalex.org/W3094550259","https://openalex.org/W3119043017","https://openalex.org/W3173678936","https://openalex.org/W4205396838","https://openalex.org/W4220973791","https://openalex.org/W4283703475","https://openalex.org/W4283837884","https://openalex.org/W4284899153","https://openalex.org/W4285428678","https://openalex.org/W4296106947","https://openalex.org/W4312048190","https://openalex.org/W4364375273","https://openalex.org/W4379929801","https://openalex.org/W4385245566","https://openalex.org/W6729448088","https://openalex.org/W6758780191","https://openalex.org/W6789403026","https://openalex.org/W6848208918"],"related_works":["https://openalex.org/W2361861616","https://openalex.org/W2263699433","https://openalex.org/W2377979023","https://openalex.org/W2218034408","https://openalex.org/W2392921965","https://openalex.org/W2358755282","https://openalex.org/W2625833328","https://openalex.org/W1533177136","https://openalex.org/W4380994516","https://openalex.org/W2251519152"],"abstract_inverted_index":{"Efficient":[0],"and":[1,13,26,39,47,57,65,94,118],"accurate":[2],"bird":[3,71,81,99],"sound":[4,100],"classification":[5],"is":[6],"of":[7,28,87],"important":[8],"for":[9],"ecology,":[10],"habitat":[11],"protection":[12],"scientific":[14],"research,":[15],"as":[16],"it":[17],"plays":[18],"a":[19,78],"central":[20],"role":[21],"in":[22,90,98,120],"monitoring":[23],"the":[24,85],"distribution":[25],"abundance":[27],"species.":[29],"However,":[30],"prevailing":[31],"methods":[32],"typically":[33],"demand":[34],"extensively":[35],"labeled":[36],"audio":[37,82],"datasets":[38],"have":[40],"highly":[41],"customized":[42],"frameworks,":[43],"imposing":[44],"substantial":[45],"computational":[46],"annotation":[48],"loads.":[49],"In":[50],"this":[51],"study,":[52],"we":[53,110],"present":[54,111],"an":[55],"efficient":[56],"general":[58],"framework":[59],"called":[60],"SSL-Net,":[61],"which":[62],"combines":[63],"spectral":[64],"learned":[66],"features":[67,92],"to":[68],"identify":[69],"different":[70],"sounds.":[72],"Encouraging":[73],"empirical":[74],"results":[75],"gleaned":[76],"from":[77],"standard":[79],"field-collected":[80],"dataset":[83],"validate":[84],"efficacy":[86],"our":[88],"method":[89],"extracting":[91],"efficiently":[93],"achieving":[95],"heightened":[96],"performance":[97],"classification,":[101],"even":[102],"when":[103],"working":[104],"with":[105],"limited":[106],"sample":[107],"sizes.":[108],"Furthermore,":[109],"three":[112],"feature":[113],"fusion":[114],"strategies,":[115],"aiding":[116],"engineers":[117],"researchers":[119],"their":[121],"selection":[122],"through":[123],"quantitative":[124],"analysis.":[125]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
