Change inference command to predict

2026-05-22 22:32:18 +02:00 · 2026-03-18 20:07:53 +00:00 · 2026-03-18 20:07:53 +00:00 · f0af5dd79e
commit f0af5dd79e
parent 2f03abe8f6
3 changed files with 284 additions and 0 deletions
--- a/src/batdetect2/cli/init.py
+++ b/src/batdetect2/cli/init.py
@ -2,6 +2,7 @@ from batdetect2.cli.base import cli
 from batdetect2.cli.compat import detect
 from batdetect2.cli.data import data
 from batdetect2.cli.evaluate import evaluate_command
 from batdetect2.cli.inference import predict
 from batdetect2.cli.train import train_command
 __all__ = [
@ -10,6 +11,7 @@ __all__ = [
    "data",
    "train_command",
    "evaluate_command",
    "predict",
 ]
--- a/src/batdetect2/cli/inference.py
+++ b/src/batdetect2/cli/inference.py
@ -0,0 +1,229 @@
 from pathlib import Path
 import click
 from loguru import logger
 from soundevent import io
 from soundevent.audio.files import get_audio_files
 from batdetect2.cli.base import cli
 __all__ = ["predict"]
@cli.group(name="predict")
 def predict() -> None:
    """Run prediction with BatDetect2 API v2."""
 def _build_api(
    model_path: Path,
    audio_config: Path | None,
    inference_config: Path | None,
    outputs_config: Path | None,
    logging_config: Path | None,
 ):
    from batdetect2.api_v2 import BatDetect2API
    from batdetect2.audio import AudioConfig
    from batdetect2.inference import InferenceConfig
    from batdetect2.logging import AppLoggingConfig
    from batdetect2.outputs import OutputsConfig
    audio_conf = (
        AudioConfig.load(audio_config) if audio_config is not None else None
    )
    inference_conf = (
        InferenceConfig.load(inference_config)
        if inference_config is not None
        else None
    )
    outputs_conf = (
        OutputsConfig.load(outputs_config)
        if outputs_config is not None
        else None
    )
    logging_conf = (
        AppLoggingConfig.load(logging_config)
        if logging_config is not None
        else None
    )
    api = BatDetect2API.from_checkpoint(
        model_path,
        audio_config=audio_conf,
        inference_config=inference_conf,
        outputs_config=outputs_conf,
        logging_config=logging_conf,
    )
    return api, audio_conf, inference_conf, outputs_conf
 def _run_inference(
    model_path: Path,
    audio_files: list[Path],
    output_path: Path,
    audio_config: Path | None,
    inference_config: Path | None,
    outputs_config: Path | None,
    logging_config: Path | None,
    batch_size: int | None,
    num_workers: int,
    format_name: str | None,
 ) -> None:
    logger.info("Initiating prediction process...")
    api, audio_conf, inference_conf, outputs_conf = _build_api(
        model_path,
        audio_config,
        inference_config,
        outputs_config,
        logging_config,
    )
    logger.info("Found {num_files} audio files", num_files=len(audio_files))
    predictions = api.process_files(
        audio_files,
        batch_size=batch_size,
        num_workers=num_workers,
        audio_config=audio_conf,
        inference_config=inference_conf,
        output_config=outputs_conf,
    )
    common_path = audio_files[0].parent if audio_files else None
    api.save_predictions(
        predictions,
        path=output_path,
        audio_dir=common_path,
        format=format_name,
    )
    logger.info(
        "Inference complete. Results saved to {path}", path=output_path
    )
@predict.command(name="directory")
@click.argument("model_path", type=click.Path(exists=True))
@click.argument("audio_dir", type=click.Path(exists=True))
@click.argument("output_path", type=click.Path())
@click.option("--audio-config", type=click.Path(exists=True))
@click.option("--inference-config", type=click.Path(exists=True))
@click.option("--outputs-config", type=click.Path(exists=True))
@click.option("--logging-config", type=click.Path(exists=True))
@click.option("--batch-size", type=int)
@click.option("--workers", "num_workers", type=int, default=0)
@click.option("--format", "format_name", type=str)
 def inference_directory_command(
    model_path: Path,
    audio_dir: Path,
    output_path: Path,
    audio_config: Path | None,
    inference_config: Path | None,
    outputs_config: Path | None,
    logging_config: Path | None,
    batch_size: int | None,
    num_workers: int,
    format_name: str | None,
 ) -> None:
    audio_files = list(get_audio_files(audio_dir))
    _run_inference(
        model_path=model_path,
        audio_files=audio_files,
        output_path=output_path,
        audio_config=audio_config,
        inference_config=inference_config,
        outputs_config=outputs_config,
        logging_config=logging_config,
        batch_size=batch_size,
        num_workers=num_workers,
        format_name=format_name,
    )
@predict.command(name="file_list")
@click.argument("model_path", type=click.Path(exists=True))
@click.argument("file_list", type=click.Path(exists=True))
@click.argument("output_path", type=click.Path())
@click.option("--audio-config", type=click.Path(exists=True))
@click.option("--inference-config", type=click.Path(exists=True))
@click.option("--outputs-config", type=click.Path(exists=True))
@click.option("--logging-config", type=click.Path(exists=True))
@click.option("--batch-size", type=int)
@click.option("--workers", "num_workers", type=int, default=0)
@click.option("--format", "format_name", type=str)
 def inference_file_list_command(
    model_path: Path,
    file_list: Path,
    output_path: Path,
    audio_config: Path | None,
    inference_config: Path | None,
    outputs_config: Path | None,
    logging_config: Path | None,
    batch_size: int | None,
    num_workers: int,
    format_name: str | None,
 ) -> None:
    audio_files = [
        Path(line.strip())
        for line in file_list.read_text().splitlines()
        if line.strip()
    ]
    _run_inference(
        model_path=model_path,
        audio_files=audio_files,
        output_path=output_path,
        audio_config=audio_config,
        inference_config=inference_config,
        outputs_config=outputs_config,
        logging_config=logging_config,
        batch_size=batch_size,
        num_workers=num_workers,
        format_name=format_name,
    )
@predict.command(name="dataset")
@click.argument("model_path", type=click.Path(exists=True))
@click.argument("dataset_path", type=click.Path(exists=True))
@click.argument("output_path", type=click.Path())
@click.option("--audio-config", type=click.Path(exists=True))
@click.option("--inference-config", type=click.Path(exists=True))
@click.option("--outputs-config", type=click.Path(exists=True))
@click.option("--logging-config", type=click.Path(exists=True))
@click.option("--batch-size", type=int)
@click.option("--workers", "num_workers", type=int, default=0)
@click.option("--format", "format_name", type=str)
 def inference_dataset_command(
    model_path: Path,
    dataset_path: Path,
    output_path: Path,
    audio_config: Path | None,
    inference_config: Path | None,
    outputs_config: Path | None,
    logging_config: Path | None,
    batch_size: int | None,
    num_workers: int,
    format_name: str | None,
 ) -> None:
    dataset = io.load(dataset_path, type="annotation_set")
    audio_files = sorted(
        {
            Path(clip_annotation.clip.recording.path)
            for clip_annotation in dataset.clip_annotations
        }
    )
    _run_inference(
        model_path=model_path,
        audio_files=audio_files,
        output_path=output_path,
        audio_config=audio_config,
        inference_config=inference_config,
        outputs_config=outputs_config,
        logging_config=logging_config,
        batch_size=batch_size,
        num_workers=num_workers,
        format_name=format_name,
    )
--- a/tests/test_cli.py
+++ b/tests/test_cli.py
@ -1,11 +1,15 @@
 """Test the command line interface."""
 import shutil
 from pathlib import Path
 import lightning as L
 import pandas as pd
 from click.testing import CliRunner
 from batdetect2.cli import cli
 from batdetect2.config import BatDetect2Config
 from batdetect2.train.lightning import build_training_module
 runner = CliRunner()
@ -26,6 +30,55 @@ def test_cli_detect_command_help():
    assert "Detect bat calls in files in AUDIO_DIR" in result.output
 def test_cli_predict_command_help():
    """Test the predict command help."""
    result = runner.invoke(cli, ["predict", "--help"])
    assert result.exit_code == 0
    assert "directory" in result.output
    assert "file_list" in result.output
    assert "dataset" in result.output
 def test_cli_predict_directory_runs_on_real_audio(tmp_path: Path):
    """User story: run prediction from CLI on a small directory."""
    source_audio = Path("example_data/audio")
    source_file = next(source_audio.glob("*.wav"))
    audio_dir = tmp_path / "audio"
    audio_dir.mkdir()
    target_file = audio_dir / source_file.name
    shutil.copy(source_file, target_file)
    module = build_training_module(model_config=BatDetect2Config().model)
    trainer = L.Trainer(enable_checkpointing=False, logger=False)
    model_path = tmp_path / "model.ckpt"
    trainer.strategy.connect(module)
    trainer.save_checkpoint(model_path)
    output_path = tmp_path / "predictions"
    result = runner.invoke(
        cli,
        [
            "predict",
            "directory",
            str(model_path),
            str(audio_dir),
            str(output_path),
            "--batch-size",
            "1",
            "--workers",
            "0",
            "--format",
            "batdetect2",
        ],
    )
    assert result.exit_code == 0
    assert output_path.exists()
    output_files = list(output_path.glob("*.json"))
    assert len(output_files) == 1
 def test_cli_detect_command_on_test_audio(tmp_path):
    """Test the detect command on test audio."""
    results_dir = tmp_path / "results"