From c80078feeee954f799fb14762c842e760c02c472 Mon Sep 17 00:00:00 2001
From: mbsantiago
Date: Mon, 25 Aug 2025 17:23:27 +0100
Subject: [PATCH] Remove stale tests

The train tests still exercised the old xarray-based pipeline. Drop the
tests that no longer have a matching implementation and port the rest
to the tensor-based APIs (select_subclip, generate_heatmaps, and
attribute-style encoder outputs). Also switch the spectrogram builder
to center=True and add a per-class roi example to the sample config.
---
 example_data/config.yaml                  |   3 +
 src/batdetect2/preprocess/spectrogram.py  |   2 +-
 tests/test_train/test_augmentations.py    |  35 +--
 tests/test_train/test_clips.py            | 322 +----------------------
 tests/test_train/test_labels.py           |  89 ++-----
 tests/test_train/test_lightning.py        |  23 +-
 tests/test_train/test_preprocessing.py    |  24 +-
 7 files changed, 52 insertions(+), 446 deletions(-)

diff --git a/example_data/config.yaml b/example_data/config.yaml
index 1039163..1e12018 100644
--- a/example_data/config.yaml
+++ b/example_data/config.yaml
@@ -24,6 +24,9 @@ targets:
     - name: rhifer
       tags:
         - value: Rhinolophus ferrumequinum
+      roi:
+        name: anchor_bbox
+        anchor: top-left
   generic_class:
     - key: class
       value: Bat
diff --git a/src/batdetect2/preprocess/spectrogram.py b/src/batdetect2/preprocess/spectrogram.py
index 2fd0ad0..5e0344c 100644
--- a/src/batdetect2/preprocess/spectrogram.py
+++ b/src/batdetect2/preprocess/spectrogram.py
@@ -89,7 +89,7 @@ def build_spectrogram_builder(
         n_fft=n_fft,
         hop_length=hop_length,
         window_fn=get_spectrogram_window(conf.window_fn),
-        center=False,
+        center=True,
         power=1,
     )
 
diff --git a/tests/test_train/test_augmentations.py b/tests/test_train/test_augmentations.py
index 99d4640..c363d0e 100644
--- a/tests/test_train/test_augmentations.py
+++ b/tests/test_train/test_augmentations.py
@@ -1,10 +1,8 @@
 from collections.abc import Callable
 
-import numpy as np
 import pytest
 import torch
-import xarray as xr
-from soundevent import arrays, data
+from soundevent import data
 
 from batdetect2.train.augmentations import (
     add_echo,
@@ -162,29 +160,10 @@ def test_selected_random_subclip_has_the_correct_width(
         labeller=sample_labeller,
     )
 
-    subclip = select_subclip(original, start=0, span=0.513)
-    assert subclip["spectrogram"].shape[1] == 512
-
-
-def test_add_echo_after_subclip(
-    sample_preprocessor: PreprocessorProtocol,
-    sample_audio_loader: AudioLoader,
-    sample_labeller: ClipLabeller,
-    create_recording: Callable[..., data.Recording],
-):
-    recording1 = create_recording(duration=2)
-    clip1 = data.Clip(recording=recording1, start_time=0, end_time=1)
-    clip_annotation_1 = data.ClipAnnotation(clip=clip1)
-    original = generate_train_example(
-        clip_annotation_1,
-        audio_loader=sample_audio_loader,
-        preprocessor=sample_preprocessor,
-        labeller=sample_labeller,
+    subclip = select_subclip(
+        original,
+        samplerate=256_000,
+        start=0,
+        duration=0.512,
     )
-
-    assert original.sizes["time"] > 512
-
-    subclip = select_subclip(original, start=0, span=0.513)
-    with_echo = add_echo(subclip, preprocessor=sample_preprocessor)
-
-    assert with_echo.sizes["time"] == 512
+    assert subclip.spectrogram.shape[1] == 512
diff --git a/tests/test_train/test_clips.py b/tests/test_train/test_clips.py
index 3ab7661..0f4f4f4 100644
--- a/tests/test_train/test_clips.py
+++ b/tests/test_train/test_clips.py
@@ -1,323 +1,3 @@
 import numpy as np
-import pytest
-import xarray as xr
 
-from batdetect2.train.clips import (
-    _compute_expected_width,
-    select_subclip,
-)
-
-AUDIO_SAMPLERATE = 48000
-
-SPEC_SAMPLERATE = 100
-SPEC_FREQS = 64
-CLIP_DURATION = 0.5
-
-
-CLIP_WIDTH_SPEC = int(np.floor(CLIP_DURATION * SPEC_SAMPLERATE))
-CLIP_WIDTH_AUDIO = int(np.floor(CLIP_DURATION * AUDIO_SAMPLERATE))
-MAX_EMPTY = 0.2
-
-
-def create_test_dataset(
-    duration_sec: float,
-    spec_samplerate: int = SPEC_SAMPLERATE,
-    audio_samplerate: int = AUDIO_SAMPLERATE,
-    num_freqs: int = SPEC_FREQS,
-    start_time: float = 0.0,
-) -> xr.Dataset:
-    """Creates a sample xr.Dataset for testing."""
-    time_step = 1 / spec_samplerate
-    audio_time_step = 1 / audio_samplerate
-
-    times = np.arange(start_time, start_time + duration_sec, step=time_step)
-    freqs = np.linspace(0, audio_samplerate / 2, num_freqs)
-    audio_times = np.arange(
-        start_time,
-        start_time + duration_sec,
-        step=audio_time_step,
-    )
-
-    num_time_steps = len(times)
-    num_audio_samples = len(audio_times)
-    spec_shape = (num_freqs, num_time_steps)
-
-    spectrogram_data = np.arange(num_time_steps).reshape(1, -1) * np.ones(
-        (num_freqs, 1)
-    )
-
-    spectrogram = xr.DataArray(
-        spectrogram_data.astype(np.float32),
-        coords=[("frequency", freqs), ("time", times)],
-        name="spectrogram",
-    )
-
-    detection = xr.DataArray(
-        np.ones(spec_shape, dtype=np.float32) * 0.5,
-        coords=spectrogram.coords,
-        name="detection",
-    )
-
-    classes = xr.DataArray(
-        np.ones((3, *spec_shape), dtype=np.float32),
-        coords=[
-            ("category", ["A", "B", "C"]),
-            ("frequency", freqs),
-            ("time", times),
-        ],
-        name="class",
-    )
-
-    size = xr.DataArray(
-        np.ones((2, *spec_shape), dtype=np.float32),
-        coords=[
-            ("dimension", ["height", "width"]),
-            ("frequency", freqs),
-            ("time", times),
-        ],
-        name="size",
-    )
-
-    audio_data = np.arange(num_audio_samples)
-    audio = xr.DataArray(
-        audio_data.astype(np.float32),
-        coords=[("audio_time", audio_times)],
-        name="audio",
-    )
-
-    metadata = xr.DataArray([1, 2, 3], dims=["other_dim"], name="metadata")
-
-    return xr.Dataset(
-        {
-            "audio": audio,
-            "spectrogram": spectrogram,
-            "detection": detection,
-            "class": classes,
-            "size": size,
-            "metadata": metadata,
-        }
-    ).assign_attrs(
-        samplerate=audio_samplerate,
-        spec_samplerate=spec_samplerate,
-    )
-
-
-@pytest.fixture
-def long_dataset() -> xr.Dataset:
-    """Dataset longer than the clip duration."""
-    return create_test_dataset(duration_sec=2.0)
-
-
-@pytest.fixture
-def short_dataset() -> xr.Dataset:
-    """Dataset shorter than the clip duration."""
-    return create_test_dataset(duration_sec=0.3)
-
-
-@pytest.fixture
-def exact_dataset() -> xr.Dataset:
-    """Dataset exactly the clip duration."""
-    return create_test_dataset(duration_sec=CLIP_DURATION - 1e-9)
-
-
-@pytest.fixture
-def offset_dataset() -> xr.Dataset:
-    """Dataset starting at a non-zero time."""
-    return create_test_dataset(duration_sec=1.0, start_time=0.5)
-
-
-def test_select_subclip_within_bounds(long_dataset):
-    start_time = 0.5
-    subclip = select_subclip(
-        long_dataset, span=CLIP_DURATION, start=start_time, dim="time"
-    )
-    expected_width = _compute_expected_width(
-        long_dataset, CLIP_DURATION, "time"
-    )
-
-    assert "time" in subclip.dims
-    assert subclip.dims["time"] == expected_width
-    assert subclip.spectrogram.dims == ("frequency", "time")
-    assert subclip.spectrogram.shape == (SPEC_FREQS, expected_width)
-    assert subclip.detection.shape == (SPEC_FREQS, expected_width)
-    assert subclip["class"].shape == (3, SPEC_FREQS, expected_width)
-    assert subclip.size.shape == (2, SPEC_FREQS, expected_width)
-    assert subclip.time.min() >= start_time
-    assert (
-        subclip.time.max() <= start_time + CLIP_DURATION + 1 / SPEC_SAMPLERATE
-    )
-
-    assert "metadata" in subclip
-    xr.testing.assert_equal(subclip.metadata, long_dataset.metadata)
-
-
-def test_select_subclip_pad_start(long_dataset):
-    start_time = -0.1
-    subclip = select_subclip(
-        long_dataset, span=CLIP_DURATION, start=start_time, dim="time"
-    )
-    expected_width = _compute_expected_width(
-        long_dataset, CLIP_DURATION, "time"
-    )
-    step = 1 / SPEC_SAMPLERATE
-    expected_pad_samples = int(np.floor(abs(start_time) / step))
-
-    assert subclip.dims["time"] == expected_width
-    assert subclip.spectrogram.shape[1] == expected_width
-
-    assert np.all(
-        subclip.spectrogram.isel(time=slice(0, expected_pad_samples)) == 0
-    )
-
-    assert np.any(
-        subclip.spectrogram.isel(time=slice(expected_pad_samples, None)) != 0
-    )
-    assert subclip.time.min() >= start_time
-    assert subclip.time.max() < start_time + CLIP_DURATION + step
-
-
-def test_select_subclip_pad_end(long_dataset):
-    original_duration = long_dataset.time.max() - long_dataset.time.min()
-    start_time = original_duration - 0.1
-    subclip = select_subclip(
-        long_dataset, span=CLIP_DURATION, start=start_time, dim="time"
-    )
-    expected_width = _compute_expected_width(
-        long_dataset, CLIP_DURATION, "time"
-    )
-    step = 1 / SPEC_SAMPLERATE
-    original_width = long_dataset.dims["time"]
-    expected_pad_samples = expected_width - (
-        original_width - int(np.floor(start_time / step))
-    )
-
-    assert subclip.sizes["time"] == expected_width
-    assert subclip.spectrogram.shape[1] == expected_width
-
-    assert np.all(
-        subclip.spectrogram.isel(
-            time=slice(expected_width - expected_pad_samples, None)
-        )
-        == 0
-    )
-
-    assert np.any(
-        subclip.spectrogram.isel(
-            time=slice(0, expected_width - expected_pad_samples)
-        )
-        != 0
-    )
-    assert subclip.time.min() >= start_time
-    assert subclip.time.max() < start_time + CLIP_DURATION + step
-
-
-def test_select_subclip_pad_both_short_dataset(short_dataset):
-    start_time = -0.1
-    subclip = select_subclip(
-        short_dataset, span=CLIP_DURATION, start=start_time, dim="time"
-    )
-    expected_width = _compute_expected_width(
-        short_dataset, CLIP_DURATION, "time"
-    )
-    step = 1 / SPEC_SAMPLERATE
-
-    assert subclip.dims["time"] == expected_width
-    assert subclip.spectrogram.shape[1] == expected_width
-
-    assert subclip.spectrogram.coords["time"][0] == pytest.approx(
-        start_time,
-        abs=step,
-    )
-    assert subclip.spectrogram.coords["time"][-1] == pytest.approx(
-        start_time + CLIP_DURATION - step,
-        abs=2 * step,
-    )
-
-
-def test_select_subclip_width_consistency(long_dataset):
-    expected_width = _compute_expected_width(
-        long_dataset, CLIP_DURATION, "time"
-    )
-    step = 1 / SPEC_SAMPLERATE
-
-    subclip_aligned = select_subclip(
-        long_dataset.copy(deep=True),
-        span=CLIP_DURATION,
-        start=5 * step,
-        dim="time",
-    )
-
-    subclip_offset = select_subclip(
-        long_dataset.copy(deep=True),
-        span=CLIP_DURATION,
-        start=5.3 * step,
-        dim="time",
-    )
-
-    assert subclip_aligned.sizes["time"] == expected_width
-    assert subclip_offset.sizes["time"] == expected_width
-    assert subclip_aligned.spectrogram.shape[1] == expected_width
-    assert subclip_offset.spectrogram.shape[1] == expected_width
-
-
-def test_select_subclip_different_dimension(long_dataset):
-    freq_coords = long_dataset.frequency.values
-    freq_min, freq_max = freq_coords.min(), freq_coords.max()
-    freq_span = (freq_max - freq_min) / 2
-    start_freq = freq_min + freq_span / 2
-
-    subclip = select_subclip(
-        long_dataset, span=freq_span, start=start_freq, dim="frequency"
-    )
-
-    assert "frequency" in subclip.dims
-    assert subclip.spectrogram.shape[0] < long_dataset.spectrogram.shape[0]
-    assert subclip.detection.shape[0] < long_dataset.detection.shape[0]
-    assert subclip["class"].shape[1] < long_dataset["class"].shape[1]
-    assert subclip.size.shape[1] < long_dataset.size.shape[1]
-
-    assert subclip.dims["time"] == long_dataset.dims["time"]
-    assert subclip.spectrogram.shape[1] == long_dataset.spectrogram.shape[1]
-
-    xr.testing.assert_equal(subclip.audio, long_dataset.audio)
-    assert subclip.dims["audio_time"] == long_dataset.dims["audio_time"]
-
-
-def test_select_subclip_fill_value(short_dataset):
-    fill_value = -999.0
-    subclip = select_subclip(
-        short_dataset,
-        span=CLIP_DURATION,
-        start=0,
-        dim="time",
-        fill_value=fill_value,
-    )
-
-    expected_width = _compute_expected_width(
-        short_dataset,
-        CLIP_DURATION,
-        "time",
-    )
-
-    assert subclip.dims["time"] == expected_width
-    assert np.all(subclip.spectrogram.sel(time=slice(0.3, None)) == fill_value)
-
-
-def test_select_subclip_no_overlap_raises_error(long_dataset):
-    original_duration = long_dataset.time.max() - long_dataset.time.min()
-
-    with pytest.raises(ValueError, match="does not overlap"):
-        select_subclip(
-            long_dataset,
-            span=CLIP_DURATION,
-            start=original_duration + 1.0,
-            dim="time",
-        )
-
-    with pytest.raises(ValueError, match="does not overlap"):
-        select_subclip(
-            long_dataset,
-            span=CLIP_DURATION,
-            start=-1.0 * CLIP_DURATION - 1.0,
-            dim="time",
-        )
+from batdetect2.train.clips import select_subclip
diff --git a/tests/test_train/test_labels.py b/tests/test_train/test_labels.py
index 2ce8302..213d7ba 100644
--- a/tests/test_train/test_labels.py
+++ b/tests/test_train/test_labels.py
@@ -1,10 +1,9 @@
 from pathlib import Path
 
-import numpy as np
-import xarray as xr
+import torch
 from soundevent import data
 
-from batdetect2.targets import TargetConfig, TargetProtocol, build_targets
+from batdetect2.targets import TargetConfig, build_targets
 from batdetect2.targets.rois import AnchorBBoxMapperConfig
 from batdetect2.targets.terms import TagInfo
 from batdetect2.train.labels import generate_heatmaps
@@ -21,63 +20,10 @@ recording = data.Recording(
 clip = data.Clip(
     recording=recording,
     start_time=0,
-    end_time=1,
+    end_time=100,
 )
 
 
-def test_generated_heatmaps_have_correct_dimensions(
-    sample_targets: TargetProtocol,
-):
-    spec = xr.DataArray(
-        data=np.random.rand(100, 100),
-        dims=["time", "frequency"],
-        coords={
-            "time": np.linspace(0, 100, 100, endpoint=False),
-            "frequency": np.linspace(0, 100, 100, endpoint=False),
-        },
-    )
-
-    clip_annotation = data.ClipAnnotation(
-        clip=clip,
-        sound_events=[
-            data.SoundEventAnnotation(
-                sound_event=data.SoundEvent(
-                    recording=recording,
-                    geometry=data.BoundingBox(
-                        coordinates=[10, 10, 20, 20],
-                    ),
-                ),
-            )
-        ],
-    )
-
-    detection_heatmap, class_heatmap, size_heatmap = generate_heatmaps(
-        clip_annotation.sound_events,
-        spec,
-        targets=sample_targets,
-    )
-
-    assert isinstance(detection_heatmap, xr.DataArray)
-    assert detection_heatmap.shape == (100, 100)
-    assert detection_heatmap.dims == ("time", "frequency")
-
-    assert isinstance(class_heatmap, xr.DataArray)
-    assert class_heatmap.shape == (2, 100, 100)
-    assert class_heatmap.dims == ("category", "time", "frequency")
-    assert class_heatmap.coords["category"].values.tolist() == [
-        "pippip",
-        "myomyo",
-    ]
-
-    assert isinstance(size_heatmap, xr.DataArray)
-    assert size_heatmap.shape == (2, 100, 100)
-    assert size_heatmap.dims == ("dimension", "time", "frequency")
-    assert size_heatmap.coords["dimension"].values.tolist() == [
-        "width",
-        "height",
-    ]
-
-
 def test_generated_heatmap_are_non_zero_at_correct_positions(
     sample_target_config: TargetConfig,
     pippip_tag: TagInfo,
@@ -93,15 +39,6 @@
 
     targets = build_targets(config)
 
-    spec = xr.DataArray(
-        data=np.random.rand(100, 100),
-        dims=["time", "frequency"],
-        coords={
-            "time": np.linspace(0, 100, 100, endpoint=False),
-            "frequency": np.linspace(0, 100, 100, endpoint=False),
-        },
-    )
-
     clip_annotation = data.ClipAnnotation(
         clip=clip,
         sound_events=[
@@ -109,7 +46,7 @@
                 sound_event=data.SoundEvent(
                     recording=recording,
                     geometry=data.BoundingBox(
-                        coordinates=[10, 10, 20, 20],
+                        coordinates=[10, 10, 20, 30],
                    ),
                 ),
                 tags=[data.Tag(key=pippip_tag.key, value=pippip_tag.value)],  # type: ignore
@@ -118,12 +55,16 @@
     )
 
     detection_heatmap, class_heatmap, size_heatmap = generate_heatmaps(
-        clip_annotation.sound_events,
-        spec,
+        clip_annotation,
+        torch.rand([100, 100]),
+        min_freq=0,
+        max_freq=100,
         targets=targets,
     )
-    assert size_heatmap.sel(time=10, frequency=10, dimension="width") == 10
-    assert size_heatmap.sel(time=10, frequency=10, dimension="height") == 10
-    assert class_heatmap.sel(time=10, frequency=10, category="pippip") == 1.0
-    assert class_heatmap.sel(time=10, frequency=10, category="myomyo") == 0.0
-    assert detection_heatmap.sel(time=10, frequency=10) == 1.0
+    pippip_index = targets.class_names.index("pippip")
+    myomyo_index = targets.class_names.index("myomyo")
+    assert size_heatmap[0, 10, 10] == 10
+    assert size_heatmap[1, 10, 10] == 20
+    assert class_heatmap[pippip_index, 10, 10] == 1.0
+    assert class_heatmap[myomyo_index, 10, 10] == 0.0
+    assert detection_heatmap[10, 10] == 1.0
diff --git a/tests/test_train/test_lightning.py b/tests/test_train/test_lightning.py
index 13da352..af4bcad 100644
--- a/tests/test_train/test_lightning.py
+++ b/tests/test_train/test_lightning.py
@@ -2,11 +2,11 @@ from pathlib import Path
 
 import lightning as L
 import torch
-import xarray as xr
 from soundevent import data
 
 from batdetect2.train import FullTrainingConfig, TrainingModule
 from batdetect2.train.train import build_training_module
+from batdetect2.typing.preprocess import AudioLoader
 
 
 def build_default_module():
@@ -19,7 +19,11 @@ def test_can_initialize_default_module():
     assert isinstance(module, L.LightningModule)
 
 
-def test_can_save_checkpoint(tmp_path: Path, clip: data.Clip):
+def test_can_save_checkpoint(
+    tmp_path: Path,
+    clip: data.Clip,
+    sample_audio_loader: AudioLoader,
+):
     module = build_default_module()
     trainer = L.Trainer()
     path = tmp_path / "example.ckpt"
@@ -28,15 +32,14 @@
 
     recovered = TrainingModule.load_from_checkpoint(path)
 
-    spec1 = module.model.preprocessor.preprocess_clip(clip)
-    spec2 = recovered.model.preprocessor.preprocess_clip(clip)
+    wav = torch.tensor(sample_audio_loader.load_clip(clip))
 
-    xr.testing.assert_equal(spec1, spec2)
+    spec1 = module.model.preprocessor(wav)
+    spec2 = recovered.model.preprocessor(wav)
 
-    input1 = torch.tensor([spec1.values]).unsqueeze(0)
-    input2 = torch.tensor([spec2.values]).unsqueeze(0)
+    torch.testing.assert_close(spec1, spec2, rtol=0, atol=0)
 
-    output1 = module(input1)
-    output2 = recovered(input2)
+    output1 = module(spec1.unsqueeze(0).unsqueeze(0))
+    output2 = recovered(spec2.unsqueeze(0).unsqueeze(0))
 
-    torch.testing.assert_close(output1, output2)
+    torch.testing.assert_close(output1, output2, rtol=0, atol=0)
diff --git a/tests/test_train/test_preprocessing.py b/tests/test_train/test_preprocessing.py
index bf52eed..6e74348 100644
--- a/tests/test_train/test_preprocessing.py
+++ b/tests/test_train/test_preprocessing.py
@@ -88,12 +88,12 @@ def test_encoding_decoding_roundtrip_recovers_object(
     )
     predictions = postprocessor.get_predictions(
         ModelOutput(
-            detection_probs=encoded["detection_heatmap"]
-            .unsqueeze(0)
-            .unsqueeze(0),
-            size_preds=encoded["size_heatmap"].unsqueeze(0),
-            class_probs=encoded["class_heatmap"].unsqueeze(0),
-            features=encoded["spectrogram"].unsqueeze(0).unsqueeze(0),
+            detection_probs=encoded.detection_heatmap.unsqueeze(0).unsqueeze(
+                0
+            ),
+            size_preds=encoded.size_heatmap.unsqueeze(0),
+            class_probs=encoded.class_heatmap.unsqueeze(0),
+            features=encoded.spectrogram.unsqueeze(0).unsqueeze(0),
         ),
         [clip],
     )[0]
@@ -182,12 +182,12 @@ def test_encoding_decoding_roundtrip_recovers_object_with_roi_override(
     )
     predictions = postprocessor.get_predictions(
         ModelOutput(
-            detection_probs=encoded["detection_heatmap"]
-            .unsqueeze(0)
-            .unsqueeze(0),
-            size_preds=encoded["size_heatmap"].unsqueeze(0),
-            class_probs=encoded["class_heatmap"].unsqueeze(0),
-            features=encoded["spectrogram"].unsqueeze(0).unsqueeze(0),
+            detection_probs=encoded.detection_heatmap.unsqueeze(0).unsqueeze(
+                0
+            ),
+            size_preds=encoded.size_heatmap.unsqueeze(0),
+            class_probs=encoded.class_heatmap.unsqueeze(0),
+            features=encoded.spectrogram.unsqueeze(0).unsqueeze(0),
         ),
         [clip],
     )[0]
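
Note on the center=False -> center=True change in
src/batdetect2/preprocess/spectrogram.py: with
torchaudio.transforms.Spectrogram, center controls whether the input is
padded by n_fft // 2 on each side before the STFT, which changes the
number of time frames the updated width assertions see. A minimal sketch
of the frame-count arithmetic (n_fft and hop_length here are illustrative
values, not taken from the batdetect2 config):

    import torch
    import torchaudio

    n_fft, hop = 512, 256  # assumed values, for illustration only
    wav = torch.randn(1, 131_072)  # 0.512 s at 256 kHz, as in the subclip test

    for center in (False, True):
        spec = torchaudio.transforms.Spectrogram(
            n_fft=n_fft,
            hop_length=hop,
            center=center,
            power=1,
        )(wav)
        # center=False: 1 + (n - n_fft) // hop frames -> 511
        # center=True:  1 + n // hop frames           -> 513
        print(center, spec.shape[-1])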