% Workshop paper on end-to-end bird sound monitoring; the url field links to the arXiv record.
% Braces in title/booktitle protect the model name and acronyms from style-driven recasing.
% NOTE(review): interhash/intrahash look like BibSonomy export identifiers; kept verbatim, confirm before removing.
@inproceedings{rauch2023active,
  author    = {Rauch, Lukas and Schwinger, Raphael and Wirth, Moritz and Sick, Bernhard and Tomforde, Sven and Scholz, Christoph},
  title     = {Active {Bird2Vec}: Towards End-To-End Bird Sound Monitoring with Transformers},
  booktitle = {Workshop on Artificial Intelligence for Sustainability ({AI4S}), {ECAI}},
  pages     = {1--6},
  year      = {2023},
  url       = {https://arxiv.org/abs/2308.07121},
  abstract  = {We propose a shift towards end-to-end learning in bird sound monitoring by combining self-supervised (SSL) and deep active learning (DAL). Leveraging transformer models, we aim to bypass traditional spectrogram conversions, enabling direct raw audio processing. ACTIVE BIRD2VEC is set to generate high-quality bird sound representations through SSL, potentially accelerating the assessment of environmental changes and decision-making processes for wind farms. Additionally, we seek to utilize the wide variety of bird vocalizations through DAL, reducing the reliance on extensively labeled datasets by human experts. We plan to curate a comprehensive set of tasks through Huggingface Datasets, enhancing future comparability and reproducibility of bioacoustic research. A comparative analysis between various transformer models will be conducted to evaluate their proficiency in bird sound recognition tasks. We aim to accelerate the progression of avian bioacoustic research and contribute to more effective conservation strategies.},
  interhash = {fa669d70ebe82d3d149ddc85adc736a9},
  intrahash = {642c133c4f7cca48aa218da212f69f64},
}