From afb7f9814528c798520458c60a0d48f50f868c9c Mon Sep 17 00:00:00 2001 From: sammlapp Date: Tue, 8 Oct 2024 01:41:47 -0400 Subject: [PATCH] add train birdnet to quickstart --- README.md | 21 ++++++++++++++++++- .../training_birdnet_and_perch.ipynb | 1 - 2 files changed, 20 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index a299274d..2bb7f84d 100644 --- a/README.md +++ b/README.md @@ -9,8 +9,9 @@ OpenSoundscape includes utilities which can be strung together to create data an * load and manipulate audio files * create and manipulate spectrograms -* train convolutional neural networks (CNNs) on spectrograms with PyTorch +* train deep learning models to recognize sounds * run pre-trained CNNs to detect vocalizations +* tune pre-trained CNNs to custom classification tasks * detect periodic vocalizations with RIBBIT * load and manipulate Raven annotations * estimate the location of sound sources from synchronized recordings @@ -148,4 +149,22 @@ model = CNN(architecture='resnet18', sample_duration=2, classes=class_list) # train the model to recognize the classes of interest in audio data model.train(train_df, validation_df, epochs=20, num_workers=8, batch_size=256) +``` + +### Train a custom classifier on BirdNET or Perch embeddings + +```python +from opensoundscape.ml import bioacoustics_model_zoo as bmz + +# load a model from the model zoo +model = bmz.load('BirdNET') #or bmz.load('Perch') + +# define classes for your custom classifier +model.change_classes(train_df.columns) + +# fit the trainable PyTorch classifier on your labels +model.train(train_df,val_df,num_augmentation_variants=4,batch_size=64) + +# run inference using your custom classifier on audio data +model.predict(audio_files) ``` \ No newline at end of file diff --git a/docs/tutorials/training_birdnet_and_perch.ipynb b/docs/tutorials/training_birdnet_and_perch.ipynb index 7964dbe5..a2c77168 100644 --- a/docs/tutorials/training_birdnet_and_perch.ipynb +++ b/docs/tutorials/training_birdnet_and_perch.ipynb @@ -747,7 +747,6 @@ "\n", "```python\n", "from opensoundscape.ml import bioacoustics_model_zoo as bmz\n", - "from opensoundscape.shallow_classifier import fit_classifier_on_embeddings\n", "\n", "# load a model from the model zoo\n", "model = bmz.load('BirdNET')\n",