Merge branch 'main' into segments-collection-mode

max-mauermann · max-mauermann · commit b36e6ede889b · 2025-06-27T15:18:23.000+02:00
diff --git a/birdnet_analyzer/analyze/utils.py b/birdnet_analyzer/analyze/utils.py
@@ -365,8 +365,7 @@ def combine_kaleidoscope_files(saved_results: list[str]):
                         continue
 
                     # skip header and add to file
-                    for line in lines[1:]:
-                        f.write(line)
+                    f.writelines(lines[1:])
 
                 except Exception as ex:
                     print(f"Error: Cannot combine results from {rfile}.\n", flush=True)
@@ -545,13 +544,12 @@ def iterate_audio_chunks(fpath: str, embeddings: bool = False):
             break
 
         for chunk_index, chunk in enumerate(chunks):
+            t_start = start + (chunk_index * (cfg.SIG_LENGTH - cfg.SIG_OVERLAP) * cfg.AUDIO_SPEED)
+            end = min(t_start + cfg.SIG_LENGTH * cfg.AUDIO_SPEED, fileLengthSeconds)
+
             # Add to batch
             samples.append(chunk)
-            timestamps.append([round(start, 1), round(end, 1)])
-
-            # Advance start and end
-            start += (cfg.SIG_LENGTH - cfg.SIG_OVERLAP) * cfg.AUDIO_SPEED
-            end = min(start + cfg.SIG_LENGTH * cfg.AUDIO_SPEED, fileLengthSeconds)
+            timestamps.append([round(t_start, 2), round(end, 2)])
 
             # Check if batch is full or last chunk
             if len(samples) < cfg.BATCH_SIZE and chunk_index < len(chunks) - 1:
@@ -571,6 +569,8 @@ def iterate_audio_chunks(fpath: str, embeddings: bool = False):
             samples = []
             timestamps = []
 
+        start += len(chunks) * (cfg.SIG_LENGTH - cfg.SIG_OVERLAP) * cfg.AUDIO_SPEED
+
 
 def predict(samples):
     """Predicts the classes for the given samples.
diff --git a/birdnet_analyzer/gui/evaluation.py b/birdnet_analyzer/gui/evaluation.py
@@ -379,7 +379,7 @@ def select_directory_on_empty():  # Nishant - Function modified for For Folder s
 
                 if folder:
                     files = get_selection_tables(folder)
-                    files_to_display = files[:100] + [["..."]] if len(files) > 100 else files
+                    files_to_display = [*files[:100], ["..."]] if len(files) > 100 else files
                     return [files, files_to_display, gr.update(visible=True), *on_select(files)]
 
                 return ["", [[loc.localize("eval-tab-no-files-found")]]]
diff --git a/birdnet_analyzer/gui/multi_file.py b/birdnet_analyzer/gui/multi_file.py
@@ -119,7 +119,7 @@ def select_directory_on_empty():  # Nishant - Function modified for For Folder s
                     if folder:
                         files_and_durations = gu.get_audio_files_and_durations(folder)
                         if len(files_and_durations) > 100:
-                            return [folder, files_and_durations[:100] + [["..."]]]  # hopefully fixes issue#272
+                            return [folder, *files_and_durations[:100], ["..."]]  # hopefully fixes issue#272
                         return [folder, files_and_durations]
 
                     return ["", [[loc.localize("multi-tab-samples-dataframe-no-files-found")]]]
diff --git a/birdnet_analyzer/model.py b/birdnet_analyzer/model.py
@@ -872,8 +872,7 @@ def save_linear_classifier(classifier, model_path: str, labels: list[str], mode=
 
     # Save labels
     with open(model_path.replace(".tflite", "_Labels.txt"), "w", encoding="utf-8") as f:
-        for label in labels:
-            f.write(label + "\n")
+        f.writelines(label + "\n" for label in labels)
 
     save_model_params(model_path.replace(".tflite", "_Params.csv"))
 
diff --git a/birdnet_analyzer/species/utils.py b/birdnet_analyzer/species/utils.py
@@ -70,5 +70,4 @@ def run(output_path, lat, lon, week, threshold, sortby):
 
     # Save species list
     with open(cfg.OUTPUT_PATH, "w") as f:
-        for s in species_list:
-            f.write(s + "\n")
+        f.writelines(s + "\n" for s in species_list)
diff --git a/birdnet_analyzer/train/utils.py b/birdnet_analyzer/train/utils.py
@@ -63,6 +63,7 @@ def _load_audio_file(f, label_vector, config):
         # Load audio
         sig, rate = audio.open_audio_file(
             f,
+            sample_rate=cfg.SAMPLE_RATE,
             duration=cfg.SIG_LENGTH if cfg.SAMPLE_CROP_MODE == "first" else None,
             fmin=cfg.BANDPASS_FMIN,
             fmax=cfg.BANDPASS_FMAX,
@@ -136,7 +137,7 @@ def _load_training_data(cache_mode=None, cache_file="", progress_callback=None):
     train_folders = sorted(utils.list_subdirectories(cfg.TRAIN_DATA_PATH))
 
     # Read all individual labels from the folder names
-    labels = []
+    labels: list[str] = []
 
     for folder in train_folders:
         labels_in_folder = folder.split(",")
diff --git a/birdnet_analyzer/translate.py b/birdnet_analyzer/translate.py
@@ -119,8 +119,7 @@ def save_labels_file(labels: list[str], locale: str):
         cfg.TRANSLATED_LABELS_PATH, "{}_{}.txt".format(os.path.basename(cfg.LABELS_FILE).rsplit(".", 1)[0], locale)
     )
     with open(fpath, "w", encoding="utf-8") as f:
-        for label in labels:
-            f.write(label + "\n")
+        f.writelines(label + "\n" for label in labels)
 
 
 if __name__ == "__main__":
diff --git a/docs/best-practices/segment-review.rst b/docs/best-practices/segment-review.rst
@@ -1,7 +1,8 @@
 Segment Review
-=================================
+==============
 
-Get started by listening to this AI-generated summary of segments review:
+This document provides a quick overview of the segment review process in BirdNET-Analyzer, which is essential for validating species detection results.
+You can also listen to an AI-generated summary of this guide in the audio player below.
 
 .. raw:: html
 
@@ -13,64 +14,97 @@ Get started by listening to this AI-generated summary of segments review:
 | 
 | `Source: Google NotebookLM`
 
-1. Prepare Audio and Result Files
----------------------------------
+Prepare Audio and Result Files
+------------------------------
 
-- | **Collect Audio Recordings and Corresponding BirdNET Result Files**: Organize them into separate folders.
-- | **Result File Formats**: BirdNET-Analyzer typically produces result files with extensions ".BirdNET.txt" or ".BirdNET.csv". It can process various result file formats, including "table", "kaleidoscope", "csv", and "audacity".
-- | **Understanding Confidence Values**: Note that BirdNET confidence values are not probabilities and are not directly transferable between different species or recording conditions.
+The BirdNET Analyzer uses the batch analysis result tables, such as the output formats "table", "kaleidoscope" or "csv".
+To obtain batch analysis result tables, run the analysis via the GUI or the :ref:`command line <cli-docs>`, which automatically generates the result files.
 
-2. Using the "Segments" Function in the GUI or Command Line
------------------------------------------------------------
+.. warning::
 
-- | **Segments Function**: BirdNET provides the "segments" function to create a collection of species-specific predictions that exceed a user-defined confidence value. This function is available in the graphical user interface (GUI) under the "segments" tab or via the "segments.py" script in the command line.
-- | **GUI Usage**: In the GUI, you can select audio, result, and output directories. You can also set additional parameters such as the minimum confidence value, the maximum number of segments per species, the audio speed, and the segment length.
+    The output format "audacity" is not supported for the segments tool since it is missing certain columns. Use "table", "kaleidoscope", or "csv" formats instead.
 
-3. Setting Parameters
----------------------
+Using the "Segments" Tool in the GUI or Command Line
+-----------------------------------------------------
 
-- | **Minimum Confidence (min_conf)**: Set a minimum confidence value for predictions to be considered. Note that this value may vary by species. It is recommended to determine the threshold by reviewing precision and recall.
-- | **Maximum Number of Segments (num_seq)**: Specify how many segments per species should be extracted.
-- | **Audio Speed (audio_speed)**: Adjust the playback speed. Extracted segments will be saved with the adjusted speed (e.g., to listen to ultrsonic calls).
-- | **Segment Length (seq_length)**: Define how long the extracted audio segments should be. If you set to more than 3 seconds, each segment will be padded with audio from the source recording. For example, for 5-second segment length, 1 second of audio before and after each extracted segment will be included. For 7 seconds, 2 seconds will be included, and so on. The first and last segment of each audio file might be shorter than the specified length.
+The BirdNET Analyzer provides the "segments" tool to extract short audio segments from the result files and place them into separate species-specific folders.
+This tool is available in the graphical user interface (GUI) under the "segments" tab or via the :ref:`birdnet_analyzer.segments <cli-segments>` script in the command line.
 
-4. Extracting Segments
-----------------------
+Setting Parameters
+------------------
+
+The GUI and command line tool allow you to set various parameters to customize the segment extraction process:
+
+* **Minimum Confidence** (``min_conf``): Set a minimum confidence value for predictions to be considered. It is recommended to determine the threshold by reviewing precision and recall.
+* **Maximum Number of Segments** (``num_seq``): Specify how many segments per species should be extracted.
+* **Audio Speed** (``audio_speed``): Adjust the playback speed. Extracted segments will be saved with the adjusted speed (e.g., to listen to ultrasonic calls).
+* **Segment Length** (``seq_length``): Define how long the extracted audio segments should be. If you set it to more than 3 seconds, each segment will be padded with audio from the source recording. For example, for a 5-second segment length, 1 second of audio before and after each extracted segment will be included. For 7 seconds, 2 seconds will be included, and so on. The first and last segment of each audio file might be shorter than the specified length.
+
+.. note::
+
+    The desired minimum confidence value can be different for each species.
+
+Extracting Segments
+-------------------
+
+After setting all parameters, start the extraction process. BirdNET will create subfolders for each identified species and save audio clips of the corresponding recordings.
+The progress of the process will be displayed.
+The resulting audio segments will be saved in the following format:
+
+.. code-block::
+
+    {c}_{i}_{fname}_{start}s_{end}s.wav
 
-- | **Start the Extraction Process**: After setting all parameters, start the extraction process. BirdNET will create subfolders for each identified species and save audio clips of the corresponding recordings.
-- | **Progress Display**: The progress of the process will be displayed.
+where:
 
-5. Reviewing Results
---------------------
+* ``{c}``: confidence value of the prediction (e.g., 0.835)
+* ``{i}``: index of the segment inside the file
+* ``{fname}``: name of the original audio file without the extension
+* ``{start}``: start time of the segment inside the file in seconds
+* ``{end}``: end time of the segment inside the file in seconds
 
-- | **Manual Review of Audio Segments**: The resulting audio segments can be manually reviewed to assess the accuracy of the predictions. It is important to note that BirdNET confidence values are not probabilities but a measure of the algorithm's prediction reliability.
-- | **Systematic Review**: It is recommended to start with the highest confidence scores and work down to the lower scores.
-- | **File Naming**: Files are named with confidence values, allowing for sorting by values.
 
-6. Using the Review Tab in the GUI
+Using the Review Tab in the GUI
 ----------------------------------
 
-- | **Review Tab Overview**: The review tab in the GUI allows you to systematically review and label the extracted segments. It provides tools for visualizing spectrograms, listening to audio segments, and categorizing them as positive or negative detections.
-- | **Collect Segments**: Use the review tab to collect segments from the specified directory. You can shuffle the segments for a randomized review process.
-- | **Create Log Plot**: The review tab can generate a logistic regression plot to visualize the relationship between confidence values and the likelihood of correct detections.
-- **Review Process**:
+The resulting audio segments can be manually reviewed to assess the accuracy of the predictions.
+It is important to note that BirdNET *confidence values are not probabilities* but a measure of the algorithm's prediction reliability.
+We recommend starting with the highest confidence scores and working down to the lower scores.
 
-  - | **Select Directory**: Choose the directory containing the segments to be reviewed.
-  - | **Species Dropdown**: Select the species to review from the dropdown menu.
-  - | **File Count Matrix**: View the count of files to be reviewed, positive detections, and negative detections.
-  - | **Spectrogram and Audio**: Visualize the spectrogram and listen to the audio segment.
-  - | **Label Segments**: Use the buttons to label segments as positive or negative detections. You can also use the left and right arrow keys to assign labels.
-  - | **Undo**: Undo the last action if needed.
-  - | **Download Plots**: Download the spectrogram and regression plots for further analysis.
+The review tab in the GUI allows you to systematically review and label the extracted segments.
+It provides tools for visualizing spectrograms, listening to audio segments, and categorizing them as positive or negative detections.
+The review tab can generate a logistic regression plot to visualize the relationship between confidence values and the likelihood of correct detections.
 
-7. Alternative Approaches
--------------------------
+In the GUI, open the "Review" tab and select the segments directory you want to review.
+You can now either select the parent directory containing all the different species subfolders or a specific species subfolder to review.
+If you select the parent directory, the GUI will automatically select the first species subfolder, but you can switch between species via a dropdown menu.
+
+Depending on your selection, the segments will be shuffled or sorted by confidence value.
+Each segment will be displayed with an audio player and its spectrogram.
+After listening to a segment, you can either mark it as a positive detection (if you hear the species) or a negative detection (if you do not hear the species).
+The BirdNET Analyzer will create two directories: one for positive detections and one for negative detections, and move the marked segments accordingly.
+The "Undo" button allows you to revert the last action if needed.
+
+.. note::
+
+    You can also use the up (positive) and down (negative) arrow keys to assign labels. The left arrow key will undo the last action and the right arrow key will skip to the next segment without labeling it.
+
+With the number of segments reviewed, the GUI will also display a logistic regression plot.
+This plot shows the relationship between the confidence values and the likelihood of correct detections.
+All of the plots including the spectrogram can be downloaded as PNG files for further analysis or documentation.
+
+.. note::
+
+    The review tab can be used on any directory containing audio files, not just those created by the segments tool. This allows you to review any set of audio files, including those from other sources.
+
+Alternative Approaches
+----------------------
 
 - | **Raven Pro**: BirdNET result tables can be imported into Raven Pro and reviewed using the selection review function.
 - | **Converting Confidence Values to Probabilities**: Another approach is converting confidence values to probabilities using logistic regression in R. However, this still requires manual evaluation of predictions.
 
-8. Important Notes
-------------------
+Important Notes
+---------------
 
 - | **Non-Transferability of Confidence Values**: BirdNET confidence values are not easily transferable between species.
 - | **Audio Quality**: The accuracy of results heavily depends on the quality of audio recordings, such as sample rate and microphone quality.
diff --git a/docs/best-practices/species-lists.rst b/docs/best-practices/species-lists.rst
@@ -7,7 +7,7 @@ You can find label files in the checkpoints folder, e.g., `checkpoints/V2.4/Bird
 
 Species names need to consist of `scientific name_common name` to be valid.
 
-You can generate a species list for a given location using :ref:`species.py <cli-species>`.
+You can generate a species list for a given location using :ref:`birdnet_analyzer.species <cli-species>`.
 
 Practical Information and Considerations
 ----------------------------------------
@@ -29,7 +29,7 @@ In cases where eBird does not have enough observations (i.e., checklists), the d
 If you know which species to expect in your area, it is recommended to compile your own species list. This can help improve the accuracy of BirdNET-Analyzer for your specific use case.
 
 1. **Collect Species Names**: Use the labels file from the model checkpoints to get the correct species names. Ensure the names are in the format `scientific name_common name`.
-2. **Generate Species List**: Use the `species.py` script to generate a species list for a given location and time. This script uses the GeoModel to predict species occurrence based on latitude, longitude, and week of the year.
+2. **Generate Species List**: Use the `birdnet_analyzer.species` script to generate a species list for a given location and time. This script uses the GeoModel to predict species occurrence based on latitude, longitude, and week of the year.
 
 **Example of Training Data**
 
diff --git a/docs/usage/cli.rst b/docs/usage/cli.rst
diff --git a/docs/usage/gui.rst b/docs/usage/gui.rst
diff --git a/pyproject.toml b/pyproject.toml
diff --git a/tests/analyze/test_analyze.py b/tests/analyze/test_analyze.py

Original file line number	Diff line number	Diff line change
`@@ -119,8 +119,7 @@ def save_labels_file(labels: list[str], locale: str):`
`119`	`119`	`cfg.TRANSLATED_LABELS_PATH, "{}_{}.txt".format(os.path.basename(cfg.LABELS_FILE).rsplit(".", 1)[0], locale)`
`120`	`120`	`)`
`121`	`121`	`with open(fpath, "w", encoding="utf-8") as f:`
`122`		`- for label in labels:`
`123`		`- f.write(label + "\n")`
	`122`	`+ f.writelines(label + "\n" for label in labels)`
`124`	`123`
`125`	`124`
`126`	`125`	`if __name__ == "__main__":`