Change inference command to predict

This commit is contained in:
mbsantiago 2026-03-18 20:07:53 +00:00
parent 2f03abe8f6
commit f0af5dd79e
3 changed files with 284 additions and 0 deletions

View File

@ -2,6 +2,7 @@ from batdetect2.cli.base import cli
from batdetect2.cli.compat import detect
from batdetect2.cli.data import data
from batdetect2.cli.evaluate import evaluate_command
from batdetect2.cli.inference import predict
from batdetect2.cli.train import train_command
__all__ = [
@ -10,6 +11,7 @@ __all__ = [
"data",
"train_command",
"evaluate_command",
"predict",
]

View File

@ -0,0 +1,229 @@
from pathlib import Path
import click
from loguru import logger
from soundevent import io
from soundevent.audio.files import get_audio_files
from batdetect2.cli.base import cli
__all__ = ["predict"]
@cli.group(name="predict")
def predict() -> None:
"""Run prediction with BatDetect2 API v2."""
def _build_api(
model_path: Path,
audio_config: Path | None,
inference_config: Path | None,
outputs_config: Path | None,
logging_config: Path | None,
):
from batdetect2.api_v2 import BatDetect2API
from batdetect2.audio import AudioConfig
from batdetect2.inference import InferenceConfig
from batdetect2.logging import AppLoggingConfig
from batdetect2.outputs import OutputsConfig
audio_conf = (
AudioConfig.load(audio_config) if audio_config is not None else None
)
inference_conf = (
InferenceConfig.load(inference_config)
if inference_config is not None
else None
)
outputs_conf = (
OutputsConfig.load(outputs_config)
if outputs_config is not None
else None
)
logging_conf = (
AppLoggingConfig.load(logging_config)
if logging_config is not None
else None
)
api = BatDetect2API.from_checkpoint(
model_path,
audio_config=audio_conf,
inference_config=inference_conf,
outputs_config=outputs_conf,
logging_config=logging_conf,
)
return api, audio_conf, inference_conf, outputs_conf
def _run_inference(
model_path: Path,
audio_files: list[Path],
output_path: Path,
audio_config: Path | None,
inference_config: Path | None,
outputs_config: Path | None,
logging_config: Path | None,
batch_size: int | None,
num_workers: int,
format_name: str | None,
) -> None:
logger.info("Initiating prediction process...")
api, audio_conf, inference_conf, outputs_conf = _build_api(
model_path,
audio_config,
inference_config,
outputs_config,
logging_config,
)
logger.info("Found {num_files} audio files", num_files=len(audio_files))
predictions = api.process_files(
audio_files,
batch_size=batch_size,
num_workers=num_workers,
audio_config=audio_conf,
inference_config=inference_conf,
output_config=outputs_conf,
)
common_path = audio_files[0].parent if audio_files else None
api.save_predictions(
predictions,
path=output_path,
audio_dir=common_path,
format=format_name,
)
logger.info(
"Inference complete. Results saved to {path}", path=output_path
)
@predict.command(name="directory")
@click.argument("model_path", type=click.Path(exists=True))
@click.argument("audio_dir", type=click.Path(exists=True))
@click.argument("output_path", type=click.Path())
@click.option("--audio-config", type=click.Path(exists=True))
@click.option("--inference-config", type=click.Path(exists=True))
@click.option("--outputs-config", type=click.Path(exists=True))
@click.option("--logging-config", type=click.Path(exists=True))
@click.option("--batch-size", type=int)
@click.option("--workers", "num_workers", type=int, default=0)
@click.option("--format", "format_name", type=str)
def inference_directory_command(
model_path: Path,
audio_dir: Path,
output_path: Path,
audio_config: Path | None,
inference_config: Path | None,
outputs_config: Path | None,
logging_config: Path | None,
batch_size: int | None,
num_workers: int,
format_name: str | None,
) -> None:
audio_files = list(get_audio_files(audio_dir))
_run_inference(
model_path=model_path,
audio_files=audio_files,
output_path=output_path,
audio_config=audio_config,
inference_config=inference_config,
outputs_config=outputs_config,
logging_config=logging_config,
batch_size=batch_size,
num_workers=num_workers,
format_name=format_name,
)
@predict.command(name="file_list")
@click.argument("model_path", type=click.Path(exists=True))
@click.argument("file_list", type=click.Path(exists=True))
@click.argument("output_path", type=click.Path())
@click.option("--audio-config", type=click.Path(exists=True))
@click.option("--inference-config", type=click.Path(exists=True))
@click.option("--outputs-config", type=click.Path(exists=True))
@click.option("--logging-config", type=click.Path(exists=True))
@click.option("--batch-size", type=int)
@click.option("--workers", "num_workers", type=int, default=0)
@click.option("--format", "format_name", type=str)
def inference_file_list_command(
model_path: Path,
file_list: Path,
output_path: Path,
audio_config: Path | None,
inference_config: Path | None,
outputs_config: Path | None,
logging_config: Path | None,
batch_size: int | None,
num_workers: int,
format_name: str | None,
) -> None:
audio_files = [
Path(line.strip())
for line in file_list.read_text().splitlines()
if line.strip()
]
_run_inference(
model_path=model_path,
audio_files=audio_files,
output_path=output_path,
audio_config=audio_config,
inference_config=inference_config,
outputs_config=outputs_config,
logging_config=logging_config,
batch_size=batch_size,
num_workers=num_workers,
format_name=format_name,
)
@predict.command(name="dataset")
@click.argument("model_path", type=click.Path(exists=True))
@click.argument("dataset_path", type=click.Path(exists=True))
@click.argument("output_path", type=click.Path())
@click.option("--audio-config", type=click.Path(exists=True))
@click.option("--inference-config", type=click.Path(exists=True))
@click.option("--outputs-config", type=click.Path(exists=True))
@click.option("--logging-config", type=click.Path(exists=True))
@click.option("--batch-size", type=int)
@click.option("--workers", "num_workers", type=int, default=0)
@click.option("--format", "format_name", type=str)
def inference_dataset_command(
model_path: Path,
dataset_path: Path,
output_path: Path,
audio_config: Path | None,
inference_config: Path | None,
outputs_config: Path | None,
logging_config: Path | None,
batch_size: int | None,
num_workers: int,
format_name: str | None,
) -> None:
dataset = io.load(dataset_path, type="annotation_set")
audio_files = sorted(
{
Path(clip_annotation.clip.recording.path)
for clip_annotation in dataset.clip_annotations
}
)
_run_inference(
model_path=model_path,
audio_files=audio_files,
output_path=output_path,
audio_config=audio_config,
inference_config=inference_config,
outputs_config=outputs_config,
logging_config=logging_config,
batch_size=batch_size,
num_workers=num_workers,
format_name=format_name,
)

View File

@ -1,11 +1,15 @@
"""Test the command line interface."""
import shutil
from pathlib import Path
import lightning as L
import pandas as pd
from click.testing import CliRunner
from batdetect2.cli import cli
from batdetect2.config import BatDetect2Config
from batdetect2.train.lightning import build_training_module
runner = CliRunner()
@ -26,6 +30,55 @@ def test_cli_detect_command_help():
assert "Detect bat calls in files in AUDIO_DIR" in result.output
def test_cli_predict_command_help():
"""Test the predict command help."""
result = runner.invoke(cli, ["predict", "--help"])
assert result.exit_code == 0
assert "directory" in result.output
assert "file_list" in result.output
assert "dataset" in result.output
def test_cli_predict_directory_runs_on_real_audio(tmp_path: Path):
"""User story: run prediction from CLI on a small directory."""
source_audio = Path("example_data/audio")
source_file = next(source_audio.glob("*.wav"))
audio_dir = tmp_path / "audio"
audio_dir.mkdir()
target_file = audio_dir / source_file.name
shutil.copy(source_file, target_file)
module = build_training_module(model_config=BatDetect2Config().model)
trainer = L.Trainer(enable_checkpointing=False, logger=False)
model_path = tmp_path / "model.ckpt"
trainer.strategy.connect(module)
trainer.save_checkpoint(model_path)
output_path = tmp_path / "predictions"
result = runner.invoke(
cli,
[
"predict",
"directory",
str(model_path),
str(audio_dir),
str(output_path),
"--batch-size",
"1",
"--workers",
"0",
"--format",
"batdetect2",
],
)
assert result.exit_code == 0
assert output_path.exists()
output_files = list(output_path.glob("*.json"))
assert len(output_files) == 1
def test_cli_detect_command_on_test_audio(tmp_path):
"""Test the detect command on test audio."""
results_dir = tmp_path / "results"