{"id":"https://openalex.org/W4401607719","doi":"https://doi.org/10.1109/taslp.2024.3444486","title":"BirdVoxDetect: Large-Scale Detection and Classification of Flight Calls for Bird Migration Monitoring","display_name":"BirdVoxDetect: Large-Scale Detection and Classification of Flight Calls for Bird Migration Monitoring","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4401607719","doi":"https://doi.org/10.1109/taslp.2024.3444486"},"language":"en","primary_location":{"id":"doi:10.1109/taslp.2024.3444486","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2024.3444486","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://hal.science/hal-04670882/document","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5027789239","display_name":"Vincent Lostanlen","orcid":"https://orcid.org/0000-0003-0580-1651"},"institutions":[{"id":"https://openalex.org/I1294671590","display_name":"Centre National de la Recherche Scientifique","ror":"https://ror.org/02feahw73","country_code":"FR","type":"government","lineage":["https://openalex.org/I1294671590"]},{"id":"https://openalex.org/I4210117005","display_name":"Laboratoire des Sciences du Num\u00e9rique de Nantes","ror":"https://ror.org/02snf8m58","country_code":"FR","type":"facility","lineage":["https://openalex.org/I100445878","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1294671590","https://openalex.org/I1326498283","https://openalex.org/I205703379","https://openalex.org/I4210117005","https://openalex.org/I4210124215","https://openalex.org/I4210127572","https://openalex.org/I4210139971","https://openalex.org/I97188460","https://openalex.org/I97188460"]},{"id":"https://openalex.org/I97188460","display_name":"Nantes Universit\u00e9","ror":"https://ror.org/03gnr7b55","country_code":"FR","type":"education","lineage":["https://openalex.org/I97188460"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Vincent Lostanlen","raw_affiliation_strings":["Laboratoire des Sciences du Num&#x00E9;rique de Nantes (LS2N), The Centre National de la Recherche Scientifique (CNRS), Nantes, France"],"affiliations":[{"raw_affiliation_string":"Laboratoire des Sciences du Num&#x00E9;rique de Nantes (LS2N), The Centre National de la Recherche Scientifique (CNRS), Nantes, France","institution_ids":["https://openalex.org/I97188460","https://openalex.org/I4210117005","https://openalex.org/I1294671590"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045867725","display_name":"Aurora Cramer","orcid":"https://orcid.org/0000-0001-5288-9399"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aurora Cramer","raw_affiliation_strings":["New York University (NYU), New York, NY, USA"],"affiliations":[{"raw_affiliation_string":"New York University (NYU), New York, NY, USA","institution_ids":["https://openalex.org/I57206974"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037548450","display_name":"Justin Salamon","orcid":"https://orcid.org/0000-0001-6345-4593"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Justin Salamon","raw_affiliation_strings":["Adobe Research, San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Adobe Research, San Francisco, CA, USA","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028426061","display_name":"Andrew Farnsworth","orcid":"https://orcid.org/0000-0002-9854-4449"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andrew Farnsworth","raw_affiliation_strings":["Cornell Lab of Ornithology, Cornell University, Ithaca, NY, USA"],"affiliations":[{"raw_affiliation_string":"Cornell Lab of Ornithology, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015943253","display_name":"Benjamin M. Van Doren","orcid":"https://orcid.org/0000-0002-7355-6005"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Benjamin M. Van Doren","raw_affiliation_strings":["Cornell Lab of Ornithology, Cornell University, Ithaca, NY, USA"],"affiliations":[{"raw_affiliation_string":"Cornell Lab of Ornithology, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090261891","display_name":"Steve Kelling","orcid":null},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Steve Kelling","raw_affiliation_strings":["Cornell Lab of Ornithology, Cornell University, Ithaca, NY, USA"],"affiliations":[{"raw_affiliation_string":"Cornell Lab of Ornithology, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5031398497","display_name":"Juan Pablo Bello","orcid":"https://orcid.org/0000-0001-8561-5204"},"institutions":[{"id":"https://openalex.org/I57206974","display_name":"New York University","ror":"https://ror.org/0190ak572","country_code":"US","type":"education","lineage":["https://openalex.org/I57206974"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Juan Pablo Bello","raw_affiliation_strings":["New York University (NYU), New York, NY, USA"],"affiliations":[{"raw_affiliation_string":"New York University (NYU), New York, NY, USA","institution_ids":["https://openalex.org/I57206974"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5027789239"],"corresponding_institution_ids":["https://openalex.org/I1294671590","https://openalex.org/I4210117005","https://openalex.org/I97188460"],"apc_list":null,"apc_paid":null,"fwci":6.6376,"has_fulltext":true,"cited_by_count":13,"citation_normalized_percentile":{"value":0.96855059,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"32","issue":null,"first_page":"4134","last_page":"4145"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11665","display_name":"Animal Vocal Communication and Behavior","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1309","display_name":"Developmental Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11665","display_name":"Animal Vocal Communication and Behavior","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1309","display_name":"Developmental Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9922000169754028,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10659","display_name":"Marine animal studies overview","score":0.9832000136375427,"subfield":{"id":"https://openalex.org/subfields/2303","display_name":"Ecology"},"field":{"id":"https://openalex.org/fields/23","display_name":"Environmental Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.621578574180603},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.42655742168426514},{"id":"https://openalex.org/keywords/remote-sensing","display_name":"Remote sensing","score":0.34628909826278687},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.3062129020690918},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.24956616759300232}],"concepts":[{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.621578574180603},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.42655742168426514},{"id":"https://openalex.org/C62649853","wikidata":"https://www.wikidata.org/wiki/Q199687","display_name":"Remote sensing","level":1,"score":0.34628909826278687},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.3062129020690918},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.24956616759300232}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/taslp.2024.3444486","is_oa":false,"landing_page_url":"https://doi.org/10.1109/taslp.2024.3444486","pdf_url":null,"source":{"id":"https://openalex.org/S4210169297","display_name":"IEEE/ACM Transactions on Audio Speech and Language Processing","issn_l":"2329-9290","issn":["2329-9290","2329-9304"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},{"id":"pmh:oai:HAL:hal-04670882v2","is_oa":true,"landing_page_url":"https://hal.science/hal-04670882","pdf_url":"https://hal.science/hal-04670882/document","source":{"id":"https://openalex.org/S4406922466","display_name":"SPIRE - Sciences Po Institutional REpository","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech and Language Processing, 2024, &#x27E8;10.1109/TASLP.2024.3444486&#x27E9;","raw_type":"Journal articles"}],"best_oa_location":{"id":"pmh:oai:HAL:hal-04670882v2","is_oa":true,"landing_page_url":"https://hal.science/hal-04670882","pdf_url":"https://hal.science/hal-04670882/document","source":{"id":"https://openalex.org/S4406922466","display_name":"SPIRE - Sciences Po Institutional REpository","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE/ACM Transactions on Audio, Speech and Language Processing, 2024, &#x27E8;10.1109/TASLP.2024.3444486&#x27E9;","raw_type":"Journal articles"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320309445","display_name":"Leon Levy Foundation","ror":"https://ror.org/033hnyq61"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4401607719.pdf"},"referenced_works_count":54,"referenced_works":["https://openalex.org/W95457783","https://openalex.org/W193026404","https://openalex.org/W1987711601","https://openalex.org/W2038484192","https://openalex.org/W2059116937","https://openalex.org/W2060151726","https://openalex.org/W2086384421","https://openalex.org/W2117863804","https://openalex.org/W2124106809","https://openalex.org/W2148260196","https://openalex.org/W2149555119","https://openalex.org/W2178547820","https://openalex.org/W2180351508","https://openalex.org/W2187089797","https://openalex.org/W2327869315","https://openalex.org/W2403438050","https://openalex.org/W2509065397","https://openalex.org/W2527465287","https://openalex.org/W2547699899","https://openalex.org/W2552032035","https://openalex.org/W2680737492","https://openalex.org/W2764236610","https://openalex.org/W2772345051","https://openalex.org/W2796458509","https://openalex.org/W2889004366","https://openalex.org/W2889425561","https://openalex.org/W2890012819","https://openalex.org/W2890211809","https://openalex.org/W2899201823","https://openalex.org/W2927909577","https://openalex.org/W2931863936","https://openalex.org/W2938139608","https://openalex.org/W2944615619","https://openalex.org/W2962894131","https://openalex.org/W2963881567","https://openalex.org/W2974449448","https://openalex.org/W2981733351","https://openalex.org/W3015238983","https://openalex.org/W3098357269","https://openalex.org/W3121931845","https://openalex.org/W3132085514","https://openalex.org/W4226051760","https://openalex.org/W4311391413","https://openalex.org/W4318817234","https://openalex.org/W6603709179","https://openalex.org/W6631190155","https://openalex.org/W6697193729","https://openalex.org/W6760006509","https://openalex.org/W6761155429","https://openalex.org/W6762619520","https://openalex.org/W6839975361","https://openalex.org/W6840583421","https://openalex.org/W6856502591","https://openalex.org/W6993003499"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2139939267","https://openalex.org/W1974511032"],"abstract_inverted_index":{"Sound":[0],"event":[1,115],"classification":[2,34],"has":[3,35],"the":[4,61,133,161,170,219],"potential":[5],"to":[6,65,163,184,195,207,253],"advance":[7],"our":[8,240],"understanding":[9],"of":[10,25,83,96,138,146,173,201,211,235],"bird":[11,66,212,261],"migration.":[12,213],"Although":[13],"it":[14],"is":[15,91,107,125,243],"long":[16],"known":[17],"that":[18,244],"migratory":[19],"species":[20,137],"have":[21],"a":[22,92,108,126,153,177,208],"vocal":[23],"signature":[24],"their":[26],"own,":[27],"previous":[28],"work":[29],"on":[30,152],"automatic":[31],"flight":[32,139],"call":[33],"been":[36],"limited":[37],"in":[38,176,216],"robustness":[39],"and":[40,50,136,168,188,231,247,257,268],"scope:":[41],"e.g.,":[42],"covering":[43],"few":[44],"recording":[45],"sites,":[46],"short":[47],"acquisition":[48],"segments,":[49],"simplified":[51],"biological":[52],"taxonomies.":[53],"In":[54],"this":[55,166,238],"paper,":[56],"we":[57,192],"present":[58],"BirdVoxDetect":[59],"(BVD),":[60],"first":[62,89],"full-fledged":[63],"solution":[64],"migration":[67,262],"monitoring":[68],"from":[69,141,158],"acoustic":[70],"sensor":[71,97,181,249],"network":[72,112,130,229],"data.":[73],"As":[74],"an":[75,80,196],"open-source":[76],"software,":[77],"BVD":[78,151,194,215],"integrates":[79],"original":[81],"pipeline":[82],"three":[84],"machine":[85],"learning":[86,246],"modules.":[87],"The":[88,104,122],"module":[90,106,124],"random":[93],"forest":[94],"classifier":[95],"faults,":[98],"trained":[99],"with":[100,117],"human-in-the-loop":[101],"active":[102],"learning.":[103],"second":[105],"deep":[109,245],"convolutional":[110,128],"neural":[111,129,228],"for":[113,165,260],"sound":[114],"detection":[116],"per-channel":[118],"energy":[119],"normalization":[120],"(PCEN).":[121],"third":[123],"multitask":[127],"which":[131],"predicts":[132],"family,":[134],"genus,":[135],"calls":[140],"passerines":[142],"<italic":[143],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[144],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">(Passeriformes)</i>":[145],"North":[147],"America.":[148],"We":[149],"evaluate":[150],"new":[154],"dataset":[155,221],"(296":[156],"hours":[157,200],"nine":[159],"locations,":[160],"largest":[162],"date":[164],"task)":[167],"discuss":[169],"main":[171,241],"sources":[172],"estimation":[174],"error":[175],"real-world":[178],"deployment:":[179],"mechanical":[180],"failures,":[182],"sensitivity":[183],"background":[185],"noise,":[186],"misdetection,":[187],"taxonomic":[189],"confusion.":[190],"Then,":[191],"deploy":[193],"unprecedented":[197],"scale:":[198],"6672":[199],"audio":[202],"(approximately":[203],"one":[204],"terabyte),":[205],"corresponding":[206],"full":[209],"season":[210],"Running":[214],"parallel":[217],"over":[218,232],"full-season":[220],"yields":[222],"1.6":[223],"billion":[224],"FFT's,":[225],"480":[226],"million":[227],"predictions,":[230],"six":[233],"petabytes":[234],"throughput.":[236],"With":[237],"method,":[239],"finding":[242],"bioacoustic":[248],"networks":[250],"are":[251],"ready":[252],"complement":[254],"radar":[255],"observations":[256],"crowdsourced":[258],"surveys":[259],"monitoring,":[263],"thus":[264],"benefiting":[265],"conservation":[266],"ecology":[267],"land-use":[269],"planning":[270],"at":[271],"large.":[272]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-29T08:15:47.926485","created_date":"2025-10-10T00:00:00"}
