{ "access": { "embargo": { "active": false, "reason": null }, "files": "public", "record": "public", "status": "open" }, "created": "2018-03-26T22:16:59.232004+00:00", "custom_fields": { "meeting:meeting": { "acronym": "ICASSP", "dates": "15-20 April 2018", "place": "Calgary, AB, CA", "session": "Bioacoustics and Medical Acoustics", "session_part": "AASP-P2.3", "title": "IEEE International Conference on Acoustics, Speech, and Signal Processing", "url": "https://wp.nyu.edu/birdvox" } }, "deletion_status": { "is_deleted": false, "status": "P" }, "files": { "count": 1, "enabled": true, "entries": { "BirdVox-DCASE-20k.zip": { "checksum": "md5:3bdde2b472f42ec619d2d665cb40dd2c", "ext": "zip", "id": "aa35451a-a41f-42f9-a0fe-ab4a8fef57b8", "key": "BirdVox-DCASE-20k.zip", "metadata": null, "mimetype": "application/zip", "size": 16517893694 } }, "order": [], "total_bytes": 16517893694 }, "id": "1208080", "is_draft": false, "is_published": true, "links": { "access": "https://zenodo.org/api/records/1208080/access", "access_links": "https://zenodo.org/api/records/1208080/access/links", "access_request": "https://zenodo.org/api/records/1208080/access/request", "access_users": "https://zenodo.org/api/records/1208080/access/users", "archive": "https://zenodo.org/api/records/1208080/files-archive", "archive_media": "https://zenodo.org/api/records/1208080/media-files-archive", "communities": "https://zenodo.org/api/records/1208080/communities", "communities-suggestions": "https://zenodo.org/api/records/1208080/communities-suggestions", "doi": "https://doi.org/10.5281/zenodo.1208080", "draft": "https://zenodo.org/api/records/1208080/draft", "files": "https://zenodo.org/api/records/1208080/files", "latest": "https://zenodo.org/api/records/1208080/versions/latest", "latest_html": "https://zenodo.org/records/1208080/latest", "media_files": "https://zenodo.org/api/records/1208080/media-files", "parent": "https://zenodo.org/api/records/1206960", "parent_doi": 
"https://zenodo.org/doi/10.5281/zenodo.1206960", "parent_html": "https://zenodo.org/records/1206960", "requests": "https://zenodo.org/api/records/1208080/requests", "reserve_doi": "https://zenodo.org/api/records/1208080/draft/pids/doi", "self": "https://zenodo.org/api/records/1208080", "self_doi": "https://zenodo.org/doi/10.5281/zenodo.1208080", "self_html": "https://zenodo.org/records/1208080", "self_iiif_manifest": "https://zenodo.org/api/iiif/record:1208080/manifest", "self_iiif_sequence": "https://zenodo.org/api/iiif/record:1208080/sequence/default", "versions": "https://zenodo.org/api/records/1208080/versions" }, "media_files": { "count": 0, "enabled": false, "entries": {}, "order": [], "total_bytes": 0 }, "metadata": { "creators": [ { "affiliations": [ { "name": "Cornell Lab of Ornithology" } ], "person_or_org": { "family_name": "Lostanlen", "given_name": "Vincent", "identifiers": [ { "identifier": "0000-0003-0580-1651", "scheme": "orcid" } ], "name": "Lostanlen, Vincent", "type": "personal" } }, { "affiliations": [ { "name": "New York University" } ], "person_or_org": { "family_name": "Salamon", "given_name": "Justin", "identifiers": [ { "identifier": "0000-0001-6345-4593", "scheme": "orcid" } ], "name": "Salamon, Justin", "type": "personal" } }, { "affiliations": [ { "name": "Cornell Lab of Ornithology" } ], "person_or_org": { "family_name": "Farnsworth", "given_name": "Andrew", "identifiers": [ { "identifier": "0000-0002-9854-4449", "scheme": "orcid" } ], "name": "Farnsworth, Andrew", "type": "personal" } }, { "affiliations": [ { "name": "Cornell Lab of Ornithology" } ], "person_or_org": { "family_name": "Kelling", "given_name": "Steve", "name": "Kelling, Steve", "type": "personal" } }, { "affiliations": [ { "name": "New York University" } ], "person_or_org": { "family_name": "Bello", "given_name": "Juan Pablo", "name": "Bello, Juan Pablo", "type": "personal" } } ], "description": "
BirdVox-DCASE-20k: a dataset for bird audio detection in 10-second clips
\n=====================================================
\nVersion 2.0, March 2018.
\nCreated By
\n-------------
Vincent Lostanlen (1, 2, 3), Justin Salamon (2, 3), Andrew Farnsworth (1), Steve Kelling (1), and Juan Pablo Bello (2, 3).
\n\n(1): Cornell Lab of Ornithology (CLO)
\n(2): Center for Urban Science and Progress, New York University
\n(3): Music and Audio Research Lab, New York University
https://wp.nyu.edu/birdvox
\n\n\n\n
Description
\n--------------
The BirdVox-DCASE-20k dataset contains 20,000 ten-second audio recordings. These recordings come from ROBIN autonomous recording units, placed near Ithaca, NY, USA during the fall of 2015. They were captured on the night of September 23rd, 2015, by six different sensors, originally numbered 1, 2, 3, 5, 7, and 10.
\n\nOut of these 20,000 recordings, 10,017 (50.09%) contain at least one bird vocalization (either song, call, or chatter).
\n\nThe dataset is a derivative work of the BirdVox-full-night dataset [1], containing almost as much data but formatted into ten-second excerpts rather than ten-hour full night recordings.
\n\nIn addition, the BirdVox-DCASE-20k dataset is provided as a development set in the context of the "Bird Audio Detection" challenge, organized by DCASE (Detection and Classification of Acoustic Scenes and Events) and the IEEE Signal Processing Society.
\n\nThe dataset can be used, among other things, for the development and evaluation of bioacoustic classification models.
\n\n
\nWe refer the reader to [1] for details on the distribution of the data and [2] for details on the hardware of ROBIN recording units.
[1] V. Lostanlen, J. Salamon, A. Farnsworth, S. Kelling, J.P. Bello. "BirdVox-full-night: a dataset and benchmark for avian flight call detection", Proc. IEEE ICASSP, 2018.
\n\n[2] J. Salamon, J. P. Bello, A. Farnsworth, M. Robbins, S. Keen, H. Klinck, and S. Kelling. Towards the Automatic Classification of Avian Flight Calls for Bioacoustic Monitoring. PLoS One, 2016.
\n\n\n\n
Data Files
\n------------
The wav folder contains the recordings as WAV files, sampled at 44.1 kHz, with a single channel (mono). The original sample rate was 24 kHz.
\n\nThe name of each wav file is a random 128-bit UUID (Universally Unique IDentifier) string, which is randomized with respect to the origin of the recording in BirdVox-full-night, both in terms of time (UTC hour at the start of the excerpt) and space (location of the sensor).
\n\nThe origin of each 10-second excerpt is known by the challenge organizers, but not disclosed to the participants.
\n\n\n\n
Metadata Files
\n--------------
A table containing a binary label "hasbird" associated with every recording in BirdVox-DCASE-20k is available on the website of the DCASE "Bird Audio Detection" challenge: http://machine-listening.eecs.qmul.ac.uk/bird-audio-detection-challenge/
\n\nThese labels were automatically derived from the annotations of avian flight call events in the BirdVox-full-night dataset.
\n\nIf your evaluation procedure requires the precise timestamps of each avian flight call (at a fine time scale of 50 ms), and is agnostic to non-flight call avian vocalizations (e.g. geese, crows, owls, etc.), we kindly suggest that you use the BirdVox-full-night dataset rather than BirdVox-DCASE-20k: wp.nyu.edu/birdvox/birdvox-full-night
\n\nOn the other hand, if your evaluation procedure encompasses all avian vocalizations, and is performed at a coarse time scale of 10 seconds, then BirdVox-DCASE-20k is the appropriate dataset.
\n\nThe annotation campaign of avian flight calls in BirdVox-full-night was performed by Andrew Farnsworth and lasted 102 hours.
\n\nThe additional annotation campaign of non-flight call avian vocalizations was performed by Vincent Lostanlen and lasted 10 hours.
\n\nThe accuracy of the labeling is estimated to be somewhere between 99.5% (100 mislabelings) and 99.95% (10 mislabelings).
\n\n
\nPlease Acknowledge BirdVox-DCASE-20k in Academic Research
\n--------------------------------------------------------------------------------
When BirdVox-DCASE-20k is used for academic research, we would highly appreciate it if scientific publications of works partly based on this dataset cite the following publication:
\n\nV. Lostanlen, J. Salamon, A. Farnsworth, S. Kelling, J. Bello. "BirdVox-full-night: a dataset and benchmark for avian flight call detection", Proc. IEEE ICASSP, 2018.
\n\n@inproceedings{lostanlen2018icassp,
\n title = {BirdVox-full-night: a dataset and benchmark for avian flight call detection},
\n author = {Lostanlen, Vincent and Salamon, Justin and Farnsworth, Andrew and Kelling, Steve and Bello, Juan Pablo},
\n booktitle = {Proc. IEEE ICASSP},
\n year = {2018},
\n publisher = {IEEE},
\n venue = {Calgary, Canada},
\n month = {April},
\n}
The creation of this dataset was supported by NSF grants 1125098 (BIRDCAST) and 1633259 (BIRDVOX), a Google Faculty Award, the Leon Levy Foundation, and two anonymous donors.
\n\n\n\n
Conditions of Use
\n---------------------
Dataset created by Vincent Lostanlen, Justin Salamon, Andrew Farnsworth, Steve Kelling, and Juan Pablo Bello.
\n\nThe BirdVox-DCASE-20k dataset is offered free of charge under the terms of the Creative Commons Attribution 4.0 International (CC BY 4.0) license:
\nhttps://creativecommons.org/licenses/by/4.0/
The dataset and its contents are made available on an "as is" basis and without warranties of any kind, including without limitation satisfactory quality and conformity, merchantability, fitness for a particular purpose, accuracy or completeness, or absence of errors. Subject to any liability that may not be excluded or limited by law, Cornell Lab of Ornithology is not liable for, and expressly excludes all liability for, loss or damage however and whenever caused to anyone by any use of the BirdVox-DCASE-20k dataset or any part of it.
\n\n\n\n
Feedback
\n-----------
Please help us improve BirdVox-DCASE-20k by sending your feedback to:
\n* Vincent Lostanlen: vincent.lostanlen@gmail.com for feedback regarding data pre-processing,
\n* Andrew Farnsworth: af27@cornell.edu for feedback regarding data collection and ornithology, or
\n* Dan Stowell: dan.stowell@qmul.ac.uk for feedback regarding the DCASE "Bird Audio Detection" challenge.
In case of a problem, please include as many details as possible.
\n\n\n\n
\nAcknowledgements
\n------------------------
We thank Jessie Barry, Ian Davies, Tom Fredericks, Jeff Gerbracht, Sara Keen, Holger Klinck, Anne Klingensmith, Ray Mack, Peter Marchetto, Ed Moore, Matt Robbins, Ken Rosenberg, and Chris Tessaglia-Hymes for designing autonomous recording units and collecting data.
\nWe acknowledge that the land on which the data was collected is the unceded territory of the Cayuga nation, which is part of the Haudenosaunee (Iroquois) confederacy.
", "publication_date": "2018-03-24", "publisher": "Zenodo", "references": [ { "reference": "V. Lostanlen, J. Salamon, A. Farnsworth, S. Kelling, J. Bello. BirdVox-full-night: a dataset and benchmark for avian flight call detection. Proc. IEEE ICASSP, 2018." } ], "resource_type": { "id": "dataset", "title": { "de": "Datensatz", "en": "Dataset" } }, "rights": [ { "description": { "en": "The Creative Commons Attribution license allows re-distribution and re-use of a licensed work on the condition that the creator is appropriately credited." }, "icon": "cc-by-icon", "id": "cc-by-4.0", "props": { "scheme": "spdx", "url": "https://creativecommons.org/licenses/by/4.0/legalcode" }, "title": { "en": "Creative Commons Attribution 4.0 International" } } ], "subjects": [ { "subject": "acoustic signal detection" }, { "subject": "bioacoustics" }, { "subject": "bird vocalizations" }, { "subject": "conservation science" }, { "subject": "digital signal processing" }, { "subject": "machine learning" }, { "subject": "machine listening" }, { "subject": "ecology" }, { "subject": "ornithology" } ], "title": "BirdVox-DCASE-20k: a dataset for bird audio detection in 10-second clips" }, "parent": { "access": { "owned_by": { "user": 21149 } }, "communities": {}, "id": "1206960", "pids": { "doi": { "client": "datacite", "identifier": "10.5281/zenodo.1206960", "provider": "datacite" } } }, "pids": { "doi": { "client": "datacite", "identifier": "10.5281/zenodo.1208080", "provider": "datacite" }, "oai": { "identifier": "oai:zenodo.org:1208080", "provider": "oai" } }, "revision_id": 6, "stats": { "all_versions": { "data_volume": 208852186569040.0, "downloads": 12644, "unique_downloads": 3289, "unique_views": 2666, "views": 3016 }, "this_version": { "data_volume": 208439300524586.0, "downloads": 12619, "unique_downloads": 3265, "unique_views": 2318, "views": 2621 } }, "status": "published", "updated": "2020-01-24T19:25:37.609011+00:00", "versions": { "index": 2, "is_latest": true } }