Expanded cli tests

2026-07-07 21:00:10 +02:00 · 2026-03-18 20:35:08 +00:00 · 2026-03-18 20:35:08 +00:00 · 0163a572cb
commit 0163a572cb
parent f0af5dd79e
9 changed files with 607 additions and 185 deletions
--- a/src/batdetect2/cli/inference.py
+++ b/src/batdetect2/cli/inference.py
@@ -164,6 +164,7 @@ def inference_file_list_command(
    num_workers: int,
    format_name: str | None,
 ) -> None:
+    file_list = Path(file_list)
    audio_files = [
        Path(line.strip())
        for line in file_list.read_text().splitlines()
@@ -207,6 +208,7 @@ def inference_dataset_command(
    num_workers: int,
    format_name: str | None,
 ) -> None:
+    dataset_path = Path(dataset_path)
    dataset = io.load(dataset_path, type="annotation_set")
    audio_files = sorted(
        {
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -3,6 +3,7 @@ from pathlib import Path
 from typing import Callable, List, Optional
 from uuid import uuid4

+import lightning as L
 import numpy as np
 import pytest
 import soundfile as sf
@@ -12,6 +13,7 @@ from soundevent import data, terms
 from batdetect2.audio import build_audio_loader
 from batdetect2.audio.clips import build_clipper
 from batdetect2.audio.types import AudioLoader, ClipperProtocol
+from batdetect2.config import BatDetect2Config
 from batdetect2.data import DatasetConfig, load_dataset
 from batdetect2.data.annotations.batdetect2 import BatDetect2FilesAnnotations
 from batdetect2.preprocess import build_preprocessor
@@ -24,6 +26,7 @@ from batdetect2.targets import (
 from batdetect2.targets.classes import TargetClassConfig
 from batdetect2.targets.types import TargetProtocol
 from batdetect2.train.labels import build_clip_labeler
+from batdetect2.train.lightning import build_training_module
 from batdetect2.train.types import ClipLabeller


@@ -452,3 +455,23 @@ def create_temp_yaml(tmp_path: Path) -> Callable[[str], Path]:
        return temp_file

    return factory
+
+
+@pytest.fixture
+def tiny_checkpoint_path(tmp_path: Path) -> Path:
+    module = build_training_module(model_config=BatDetect2Config().model)
+    trainer = L.Trainer(enable_checkpointing=False, logger=False)
+    checkpoint_path = tmp_path / "model.ckpt"
+    trainer.strategy.connect(module)
+    trainer.save_checkpoint(checkpoint_path)
+    return checkpoint_path
+
+
+@pytest.fixture
+def single_audio_dir(tmp_path: Path, example_audio_files: List[Path]) -> Path:
+    audio_dir = tmp_path / "audio"
+    audio_dir.mkdir()
+    source = example_audio_files[0]
+    target = audio_dir / source.name
+    target.write_bytes(source.read_bytes())
+    return audio_dir
--- a/tests/test_cli.py
+++ b/tests/test_cli.py
@@ -1,185 +0,0 @@
-"""Test the command line interface."""
-
-import shutil
-from pathlib import Path
-
-import lightning as L
-import pandas as pd
-from click.testing import CliRunner
-
-from batdetect2.cli import cli
-from batdetect2.config import BatDetect2Config
-from batdetect2.train.lightning import build_training_module
-
-runner = CliRunner()
-
-
-def test_cli_base_command():
-    """Test the base command."""
-    result = runner.invoke(cli, ["--help"])
-    assert result.exit_code == 0
-    assert (
-        "BatDetect2 - Bat Call Detection and Classification" in result.output
-    )
-
-
-def test_cli_detect_command_help():
-    """Test the detect command help."""
-    result = runner.invoke(cli, ["detect", "--help"])
-    assert result.exit_code == 0
-    assert "Detect bat calls in files in AUDIO_DIR" in result.output
-
-
-def test_cli_predict_command_help():
-    """Test the predict command help."""
-    result = runner.invoke(cli, ["predict", "--help"])
-    assert result.exit_code == 0
-    assert "directory" in result.output
-    assert "file_list" in result.output
-    assert "dataset" in result.output
-
-
-def test_cli_predict_directory_runs_on_real_audio(tmp_path: Path):
-    """User story: run prediction from CLI on a small directory."""
-
-    source_audio = Path("example_data/audio")
-    source_file = next(source_audio.glob("*.wav"))
-    audio_dir = tmp_path / "audio"
-    audio_dir.mkdir()
-    target_file = audio_dir / source_file.name
-    shutil.copy(source_file, target_file)
-
-    module = build_training_module(model_config=BatDetect2Config().model)
-    trainer = L.Trainer(enable_checkpointing=False, logger=False)
-    model_path = tmp_path / "model.ckpt"
-    trainer.strategy.connect(module)
-    trainer.save_checkpoint(model_path)
-    output_path = tmp_path / "predictions"
-
-    result = runner.invoke(
-        cli,
-        [
-            "predict",
-            "directory",
-            str(model_path),
-            str(audio_dir),
-            str(output_path),
-            "--batch-size",
-            "1",
-            "--workers",
-            "0",
-            "--format",
-            "batdetect2",
-        ],
-    )
-
-    assert result.exit_code == 0
-    assert output_path.exists()
-    output_files = list(output_path.glob("*.json"))
-    assert len(output_files) == 1
-
-
-def test_cli_detect_command_on_test_audio(tmp_path):
-    """Test the detect command on test audio."""
-    results_dir = tmp_path / "results"
-
-    # Remove results dir if it exists
-    if results_dir.exists():
-        results_dir.rmdir()
-
-    result = runner.invoke(
-        cli,
-        [
-            "detect",
-            "example_data/audio",
-            str(results_dir),
-            "0.3",
-        ],
-    )
-    assert result.exit_code == 0
-    assert results_dir.exists()
-    assert len(list(results_dir.glob("*.csv"))) == 3
-    assert len(list(results_dir.glob("*.json"))) == 3
-
-
-def test_cli_detect_command_with_non_trivial_time_expansion(tmp_path):
-    """Test the detect command with a non-trivial time expansion factor."""
-    results_dir = tmp_path / "results"
-
-    # Remove results dir if it exists
-    if results_dir.exists():
-        results_dir.rmdir()
-
-    result = runner.invoke(
-        cli,
-        [
-            "detect",
-            "example_data/audio",
-            str(results_dir),
-            "0.3",
-            "--time_expansion_factor",
-            "10",
-        ],
-    )
-
-    assert result.exit_code == 0
-    assert "Time Expansion Factor: 10" in result.stdout
-
-
-def test_cli_detect_command_with_the_spec_feature_flag(tmp_path: Path):
-    """Test the detect command with the spec feature flag."""
-    results_dir = tmp_path / "results"
-
-    # Remove results dir if it exists
-    if results_dir.exists():
-        results_dir.rmdir()
-
-    result = runner.invoke(
-        cli,
-        [
-            "detect",
-            "example_data/audio",
-            str(results_dir),
-            "0.3",
-            "--spec_features",
-        ],
-    )
-    assert result.exit_code == 0
-    assert results_dir.exists()
-
-    csv_files = [path.name for path in results_dir.glob("*.csv")]
-
-    expected_files = [
-        "20170701_213954-MYOMYS-LR_0_0.5.wav_spec_features.csv",
-        "20180530_213516-EPTSER-LR_0_0.5.wav_spec_features.csv",
-        "20180627_215323-RHIFER-LR_0_0.5.wav_spec_features.csv",
-    ]
-
-    for expected_file in expected_files:
-        assert expected_file in csv_files
-
-        df = pd.read_csv(results_dir / expected_file)
-        assert not (df.duration == -1).any()
-
-
-def test_cli_detect_fails_gracefully_on_empty_file(tmp_path: Path):
-    results_dir = tmp_path / "results"
-    target = tmp_path / "audio"
-    target.mkdir()
-
-    # Create an empty file with the .wav extension
-    empty_file = target / "empty.wav"
-    empty_file.touch()
-
-    result = runner.invoke(
-        cli,
-        args=[
-            "detect",
-            str(target),
-            str(results_dir),
-            "0.3",
-            "--spec_features",
-        ],
-    )
-    assert result.exit_code == 0
-    assert f"Error processing file {empty_file}" in result.output
--- a/tests/test_cli/test_base.py
+++ b/tests/test_cli/test_base.py
@@ -0,0 +1,18 @@
+"""Behavior-focused tests for top-level CLI command discovery."""
+
+from click.testing import CliRunner
+
+from batdetect2.cli import cli
+
+
+def test_cli_base_help_lists_main_commands() -> None:
+    """User story: discover available workflows from top-level help."""
+
+    result = CliRunner().invoke(cli, ["--help"])
+
+    assert result.exit_code == 0
+    assert "predict" in result.output
+    assert "train" in result.output
+    assert "evaluate" in result.output
+    assert "data" in result.output
+    assert "detect" in result.output
--- a/tests/test_cli/test_data.py
+++ b/tests/test_cli/test_data.py
@@ -0,0 +1,60 @@
+"""Behavior tests for data CLI command group."""
+
+from pathlib import Path
+
+from click.testing import CliRunner
+
+from batdetect2.cli import cli
+
+
+def test_cli_data_help() -> None:
+    """User story: discover data subcommands."""
+
+    result = CliRunner().invoke(cli, ["data", "--help"])
+
+    assert result.exit_code == 0
+    assert "summary" in result.output
+    assert "convert" in result.output
+
+
+def test_cli_data_convert_creates_annotation_set(tmp_path: Path) -> None:
+    """User story: convert dataset config into a soundevent annotation set."""
+
+    output = tmp_path / "annotations.json"
+
+    result = CliRunner().invoke(
+        cli,
+        [
+            "data",
+            "convert",
+            "example_data/dataset.yaml",
+            "--base-dir",
+            ".",
+            "--output",
+            str(output),
+        ],
+    )
+
+    assert result.exit_code == 0
+    assert output.exists()
+
+
+def test_cli_data_convert_fails_with_invalid_field(tmp_path: Path) -> None:
+    """User story: invalid nested field in dataset config fails clearly."""
+
+    output = tmp_path / "annotations.json"
+
+    result = CliRunner().invoke(
+        cli,
+        [
+            "data",
+            "convert",
+            "example_data/dataset.yaml",
+            "--field",
+            "does.not.exist",
+            "--output",
+            str(output),
+        ],
+    )
+
+    assert result.exit_code != 0
--- a/tests/test_cli/test_detect.py
+++ b/tests/test_cli/test_detect.py
@@ -0,0 +1,119 @@
+"""Behavior tests for legacy detect command."""
+
+from pathlib import Path
+
+import pandas as pd
+from click.testing import CliRunner
+
+from batdetect2.cli import cli
+
+
+def test_cli_detect_help() -> None:
+    """User story: get usage help for legacy detect command."""
+
+    result = CliRunner().invoke(cli, ["detect", "--help"])
+
+    assert result.exit_code == 0
+    assert "Detect bat calls in files in AUDIO_DIR" in result.output
+
+
+def test_cli_detect_command_on_test_audio(tmp_path: Path) -> None:
+    """User story: run legacy detect on example audio directory."""
+
+    results_dir = tmp_path / "results"
+
+    result = CliRunner().invoke(
+        cli,
+        [
+            "detect",
+            "example_data/audio",
+            str(results_dir),
+            "0.3",
+        ],
+    )
+
+    assert result.exit_code == 0
+    assert results_dir.exists()
+    assert len(list(results_dir.glob("*.csv"))) == 3
+    assert len(list(results_dir.glob("*.json"))) == 3
+
+
+def test_cli_detect_command_with_non_trivial_time_expansion(
+    tmp_path: Path,
+) -> None:
+    """User story: set time expansion in legacy detect command."""
+
+    results_dir = tmp_path / "results"
+
+    result = CliRunner().invoke(
+        cli,
+        [
+            "detect",
+            "example_data/audio",
+            str(results_dir),
+            "0.3",
+            "--time_expansion_factor",
+            "10",
+        ],
+    )
+
+    assert result.exit_code == 0
+    assert "Time Expansion Factor: 10" in result.stdout
+
+
+def test_cli_detect_command_with_spec_feature_flag(tmp_path: Path) -> None:
+    """User story: request extra spectral features in output CSV."""
+
+    results_dir = tmp_path / "results"
+
+    result = CliRunner().invoke(
+        cli,
+        [
+            "detect",
+            "example_data/audio",
+            str(results_dir),
+            "0.3",
+            "--spec_features",
+        ],
+    )
+
+    assert result.exit_code == 0
+    assert results_dir.exists()
+
+    csv_files = [path.name for path in results_dir.glob("*.csv")]
+
+    expected_files = [
+        "20170701_213954-MYOMYS-LR_0_0.5.wav_spec_features.csv",
+        "20180530_213516-EPTSER-LR_0_0.5.wav_spec_features.csv",
+        "20180627_215323-RHIFER-LR_0_0.5.wav_spec_features.csv",
+    ]
+
+    for expected_file in expected_files:
+        assert expected_file in csv_files
+        df = pd.read_csv(results_dir / expected_file)
+        assert not (df.duration == -1).any()
+
+
+def test_cli_detect_fails_gracefully_on_empty_file(tmp_path: Path) -> None:
+    """User story: bad/empty input file reports error but command survives."""
+
+    results_dir = tmp_path / "results"
+    target = tmp_path / "audio"
+    target.mkdir()
+
+    empty_file = target / "empty.wav"
+    empty_file.touch()
+
+    result = CliRunner().invoke(
+        cli,
+        args=[
+            "detect",
+            str(target),
+            str(results_dir),
+            "0.3",
+            "--spec_features",
+        ],
+    )
+
+    assert result.exit_code == 0
+    assert f"Error processing file {empty_file}" in result.output
--- a/tests/test_cli/test_evaluate.py
+++ b/tests/test_cli/test_evaluate.py
@@ -0,0 +1,47 @@
+"""CLI tests for evaluate command."""
+
+from pathlib import Path
+
+from click.testing import CliRunner
+
+from batdetect2.cli import cli
+
+BASE_DIR = Path(__file__).parent.parent.parent
+
+
+def test_cli_evaluate_help() -> None:
+    """User story: inspect evaluate command interface and options."""
+
+    result = CliRunner().invoke(cli, ["evaluate", "--help"])
+
+    assert result.exit_code == 0
+    assert "MODEL_PATH" in result.output
+    assert "TEST_DATASET" in result.output
+    assert "--evaluation-config" in result.output
+
+
+def test_cli_evaluate_writes_metrics_for_small_dataset(
+    tmp_path: Path,
+    tiny_checkpoint_path: Path,
+) -> None:
+    """User story: evaluate a checkpoint and get metrics artifacts."""
+
+    output_dir = tmp_path / "eval_out"
+
+    result = CliRunner().invoke(
+        cli,
+        [
+            "evaluate",
+            str(tiny_checkpoint_path),
+            str(BASE_DIR / "example_data" / "dataset.yaml"),
+            "--base-dir",
+            str(BASE_DIR),
+            "--workers",
+            "0",
+            "--output-dir",
+            str(output_dir),
+        ],
+    )
+
+    assert result.exit_code == 0
+    assert len(list(output_dir.rglob("metrics.csv"))) >= 1
--- a/tests/test_cli/test_predict.py
+++ b/tests/test_cli/test_predict.py
@@ -0,0 +1,257 @@
+"""Behavior tests for predict CLI workflows."""
+
+from pathlib import Path
+
+import pytest
+from click.testing import CliRunner
+from soundevent import data, io
+
+from batdetect2.cli import cli
+
+
+def test_cli_predict_help() -> None:
+    """User story: discover available predict modes."""
+
+    result = CliRunner().invoke(cli, ["predict", "--help"])
+
+    assert result.exit_code == 0
+    assert "directory" in result.output
+    assert "file_list" in result.output
+    assert "dataset" in result.output
+
+
+def test_cli_predict_directory_runs_on_real_audio(
+    tmp_path: Path,
+    tiny_checkpoint_path: Path,
+    single_audio_dir: Path,
+) -> None:
+    """User story: run prediction for all files in a directory."""
+
+    output_path = tmp_path / "predictions"
+
+    result = CliRunner().invoke(
+        cli,
+        [
+            "predict",
+            "directory",
+            str(tiny_checkpoint_path),
+            str(single_audio_dir),
+            str(output_path),
+            "--batch-size",
+            "1",
+            "--workers",
+            "0",
+            "--format",
+            "batdetect2",
+        ],
+    )
+
+    assert result.exit_code == 0
+    assert output_path.exists()
+    assert len(list(output_path.glob("*.json"))) == 1
+
+
+def test_cli_predict_file_list_runs_on_real_audio(
+    tmp_path: Path,
+    tiny_checkpoint_path: Path,
+    single_audio_dir: Path,
+) -> None:
+    """User story: run prediction from an explicit list of files."""
+
+    audio_file = next(single_audio_dir.glob("*.wav"))
+    file_list = tmp_path / "files.txt"
+    file_list.write_text(f"{audio_file}\n")
+
+    output_path = tmp_path / "predictions"
+
+    result = CliRunner().invoke(
+        cli,
+        [
+            "predict",
+            "file_list",
+            str(tiny_checkpoint_path),
+            str(file_list),
+            str(output_path),
+            "--batch-size",
+            "1",
+            "--workers",
+            "0",
+            "--format",
+            "batdetect2",
+        ],
+    )
+
+    assert result.exit_code == 0
+    assert output_path.exists()
+    assert len(list(output_path.glob("*.json"))) == 1
+
+
+def test_cli_predict_dataset_runs_on_aoef_metadata(
+    tmp_path: Path,
+    tiny_checkpoint_path: Path,
+    single_audio_dir: Path,
+) -> None:
+    """User story: predict from AOEF dataset metadata file."""
+
+    audio_file = next(single_audio_dir.glob("*.wav"))
+    recording = data.Recording.from_file(audio_file)
+    clip = data.Clip(
+        recording=recording,
+        start_time=0,
+        end_time=recording.duration,
+    )
+    annotation_set = data.AnnotationSet(
+        name="test",
+        description="predict dataset test",
+        clip_annotations=[data.ClipAnnotation(clip=clip, sound_events=[])],
+    )
+
+    dataset_path = tmp_path / "dataset.json"
+    io.save(annotation_set, dataset_path)
+
+    output_path = tmp_path / "predictions"
+
+    result = CliRunner().invoke(
+        cli,
+        [
+            "predict",
+            "dataset",
+            str(tiny_checkpoint_path),
+            str(dataset_path),
+            str(output_path),
+            "--batch-size",
+            "1",
+            "--workers",
+            "0",
+            "--format",
+            "batdetect2",
+        ],
+    )
+
+    assert result.exit_code == 0
+    assert output_path.exists()
+    assert len(list(output_path.glob("*.json"))) == 1
+
+
+@pytest.mark.parametrize(
+    ("format_name", "expected_pattern", "writes_single_file"),
+    [
+        ("batdetect2", "*.json", False),
+        ("raw", "*.nc", False),
+        ("soundevent", "*.json", True),
+    ],
+)
+def test_cli_predict_directory_supports_output_format_override(
+    tmp_path: Path,
+    tiny_checkpoint_path: Path,
+    single_audio_dir: Path,
+    format_name: str,
+    expected_pattern: str,
+    writes_single_file: bool,
+) -> None:
+    """User story: change output format via --format only."""
+
+    output_path = tmp_path / f"predictions_{format_name}"
+
+    result = CliRunner().invoke(
+        cli,
+        [
+            "predict",
+            "directory",
+            str(tiny_checkpoint_path),
+            str(single_audio_dir),
+            str(output_path),
+            "--batch-size",
+            "1",
+            "--workers",
+            "0",
+            "--format",
+            format_name,
+        ],
+    )
+
+    assert result.exit_code == 0
+
+    if writes_single_file:
+        assert output_path.with_suffix(".json").exists()
+    else:
+        assert output_path.exists()
+        assert len(list(output_path.glob(expected_pattern))) >= 1
+
+
+def test_cli_predict_dataset_deduplicates_recordings(
+    tmp_path: Path,
+    tiny_checkpoint_path: Path,
+    single_audio_dir: Path,
+) -> None:
+    """User story: duplicated recording entries are predicted once."""
+
+    audio_file = next(single_audio_dir.glob("*.wav"))
+    recording = data.Recording.from_file(audio_file)
+    first_clip = data.Clip(
+        recording=recording,
+        start_time=0,
+        end_time=recording.duration,
+    )
+    second_clip = data.Clip(
+        recording=recording,
+        start_time=0,
+        end_time=recording.duration,
+    )
+    annotation_set = data.AnnotationSet(
+        name="dupe-recording-dataset",
+        description="contains same recording twice",
+        clip_annotations=[
+            data.ClipAnnotation(clip=first_clip, sound_events=[]),
+            data.ClipAnnotation(clip=second_clip, sound_events=[]),
+        ],
+    )
+
+    dataset_path = tmp_path / "dupes.json"
+    io.save(annotation_set, dataset_path)
+
+    output_path = tmp_path / "predictions"
+    result = CliRunner().invoke(
+        cli,
+        [
+            "predict",
+            "dataset",
+            str(tiny_checkpoint_path),
+            str(dataset_path),
+            str(output_path),
+            "--batch-size",
+            "1",
+            "--workers",
+            "0",
+            "--format",
+            "raw",
+        ],
+    )
+
+    assert result.exit_code == 0
+    assert output_path.exists()
+    assert len(list(output_path.glob("*.nc"))) == 1
+
+
+def test_cli_predict_rejects_unknown_output_format(
+    tmp_path: Path,
+    tiny_checkpoint_path: Path,
+    single_audio_dir: Path,
+) -> None:
+    """User story: invalid output format fails with error."""
+
+    output_path = tmp_path / "predictions"
+    result = CliRunner().invoke(
+        cli,
+        [
+            "predict",
+            "directory",
+            str(tiny_checkpoint_path),
+            str(single_audio_dir),
+            str(output_path),
+            "--format",
+            "not_a_real_format",
+        ],
+    )
+
+    assert result.exit_code != 0
--- a/tests/test_cli/test_train.py
+++ b/tests/test_cli/test_train.py
@@ -0,0 +1,81 @@
+"""CLI tests for train command."""
+
+from pathlib import Path
+
+from click.testing import CliRunner
+
+from batdetect2.cli import cli
+from batdetect2.models import ModelConfig
+
+
+def test_cli_train_help() -> None:
+    """User story: inspect train command interface and options."""
+
+    result = CliRunner().invoke(cli, ["train", "--help"])
+
+    assert result.exit_code == 0
+    assert "TRAIN_DATASET" in result.output
+    assert "--training-config" in result.output
+    assert "--model" in result.output
+
+
+def test_cli_train_from_checkpoint_runs_on_small_dataset(
+    tmp_path: Path,
+    tiny_checkpoint_path: Path,
+) -> None:
+    """User story: continue training from checkpoint via CLI."""
+
+    ckpt_dir = tmp_path / "checkpoints"
+    log_dir = tmp_path / "logs"
+    ckpt_dir.mkdir()
+    log_dir.mkdir()
+
+    result = CliRunner().invoke(
+        cli,
+        [
+            "train",
+            "example_data/dataset.yaml",
+            "--val-dataset",
+            "example_data/dataset.yaml",
+            "--model",
+            str(tiny_checkpoint_path),
+            "--num-epochs",
+            "1",
+            "--train-workers",
+            "0",
+            "--val-workers",
+            "0",
+            "--ckpt-dir",
+            str(ckpt_dir),
+            "--log-dir",
+            str(log_dir),
+        ],
+    )
+
+    assert result.exit_code == 0
+    assert len(list(ckpt_dir.rglob("*.ckpt"))) >= 1
+
+
+def test_cli_train_rejects_model_and_model_config_together(
+    tmp_path: Path,
+    tiny_checkpoint_path: Path,
+) -> None:
+    """User story: invalid train flags fail with clear usage error."""
+
+    model_config_path = tmp_path / "model.yaml"
+    model_config_path.write_text(ModelConfig().to_yaml_string())
+
+    result = CliRunner().invoke(
+        cli,
+        [
+            "train",
+            "example_data/dataset.yaml",
+            "--model",
+            str(tiny_checkpoint_path),
+            "--model-config",
+            str(model_config_path),
+        ],
+    )
+
+    assert result.exit_code != 0
+    assert "--model-config cannot be used with --model" in result.output