mirror of
https://github.com/macaodha/batdetect2.git
synced 2026-05-22 22:32:18 +02:00
164 lines
4.7 KiB
Python
164 lines
4.7 KiB
Python
import sys
|
|
import types
|
|
from pathlib import Path
|
|
|
|
import pytest
|
|
from soundevent import data
|
|
|
|
from batdetect2.train import TrainingConfig, run_train
|
|
from batdetect2.train.checkpoints import resolve_checkpoint_path
|
|
|
|
pytestmark = pytest.mark.slow
|
|
|
|
|
|
def _build_fast_train_config() -> TrainingConfig:
|
|
config = TrainingConfig()
|
|
config.trainer.limit_train_batches = 1
|
|
config.trainer.limit_val_batches = 1
|
|
config.trainer.log_every_n_steps = 1
|
|
config.trainer.check_val_every_n_epoch = 1
|
|
config.train_loader.batch_size = 1
|
|
config.train_loader.augmentations.enabled = False
|
|
return config
|
|
|
|
|
|
def test_train_saves_checkpoint_in_requested_experiment_run_dir(
|
|
tmp_path: Path,
|
|
example_annotations: list[data.ClipAnnotation],
|
|
) -> None:
|
|
config = _build_fast_train_config()
|
|
|
|
run_train(
|
|
train_annotations=example_annotations[:1],
|
|
val_annotations=example_annotations[:1],
|
|
train_config=config,
|
|
num_epochs=1,
|
|
train_workers=0,
|
|
val_workers=0,
|
|
checkpoint_dir=tmp_path,
|
|
experiment_name="exp_a",
|
|
run_name="run_b",
|
|
seed=0,
|
|
)
|
|
|
|
checkpoints = list((tmp_path / "exp_a" / "run_b").rglob("*.ckpt"))
|
|
assert checkpoints
|
|
|
|
|
|
def test_train_without_validation_can_still_save_last_checkpoint(
|
|
tmp_path: Path,
|
|
example_annotations: list[data.ClipAnnotation],
|
|
) -> None:
|
|
config = _build_fast_train_config()
|
|
config.checkpoints.save_last = True
|
|
|
|
run_train(
|
|
train_annotations=example_annotations[:1],
|
|
val_annotations=None,
|
|
train_config=config,
|
|
num_epochs=1,
|
|
train_workers=0,
|
|
val_workers=0,
|
|
checkpoint_dir=tmp_path,
|
|
seed=0,
|
|
)
|
|
|
|
assert list(tmp_path.rglob("last*.ckpt"))
|
|
|
|
|
|
def test_train_controls_which_checkpoints_are_kept(
|
|
tmp_path: Path,
|
|
example_annotations: list[data.ClipAnnotation],
|
|
) -> None:
|
|
config = _build_fast_train_config()
|
|
config.checkpoints.save_top_k = 1
|
|
config.checkpoints.save_last = True
|
|
config.checkpoints.filename = "epoch{epoch}"
|
|
|
|
run_train(
|
|
train_annotations=example_annotations[:1],
|
|
val_annotations=example_annotations[:1],
|
|
train_config=config,
|
|
num_epochs=3,
|
|
train_workers=0,
|
|
val_workers=0,
|
|
checkpoint_dir=tmp_path,
|
|
seed=0,
|
|
)
|
|
|
|
all_checkpoints = list(tmp_path.rglob("*.ckpt"))
|
|
last_checkpoints = list(tmp_path.rglob("last*.ckpt"))
|
|
best_checkpoints = [
|
|
path for path in all_checkpoints if not path.name.startswith("last")
|
|
]
|
|
|
|
assert last_checkpoints
|
|
assert len(best_checkpoints) == 1
|
|
assert "epoch" in best_checkpoints[0].name
|
|
|
|
|
|
def test_resolve_checkpoint_path_returns_local_path_unchanged(
|
|
tmp_path: Path,
|
|
) -> None:
|
|
local_path = tmp_path / "model.ckpt"
|
|
local_path.write_bytes(b"checkpoint")
|
|
|
|
assert resolve_checkpoint_path(local_path) == local_path
|
|
assert resolve_checkpoint_path(str(local_path)) == local_path
|
|
|
|
|
|
def test_resolve_checkpoint_path_downloads_huggingface_checkpoint(
|
|
monkeypatch: pytest.MonkeyPatch,
|
|
tmp_path: Path,
|
|
) -> None:
|
|
expected_path = tmp_path / "downloaded.ckpt"
|
|
|
|
def fake_hf_hub_download(repo_id: str, filename: str) -> str:
|
|
assert repo_id == "owner/repo"
|
|
assert filename == "weights/model.ckpt"
|
|
return str(expected_path)
|
|
|
|
class FakeHuggingFaceHub(types.ModuleType):
|
|
hf_hub_download = staticmethod(fake_hf_hub_download)
|
|
|
|
fake_module = FakeHuggingFaceHub("huggingface_hub")
|
|
monkeypatch.setitem(
|
|
sys.modules,
|
|
"huggingface_hub",
|
|
fake_module,
|
|
)
|
|
|
|
resolved = resolve_checkpoint_path("hf://owner/repo/weights/model.ckpt")
|
|
|
|
assert resolved == expected_path
|
|
|
|
|
|
def test_resolve_checkpoint_path_requires_huggingface_dependency(
|
|
monkeypatch: pytest.MonkeyPatch,
|
|
) -> None:
|
|
monkeypatch.delitem(sys.modules, "huggingface_hub", raising=False)
|
|
|
|
import builtins
|
|
|
|
original_import = builtins.__import__
|
|
|
|
def fake_import(name, globals=None, locals=None, fromlist=(), level=0):
|
|
if name == "huggingface_hub":
|
|
raise ImportError("missing")
|
|
return original_import(name, globals, locals, fromlist, level)
|
|
|
|
monkeypatch.setattr(builtins, "__import__", fake_import)
|
|
|
|
with pytest.raises(ValueError, match="Hugging Face checkpoint support"):
|
|
resolve_checkpoint_path("hf://owner/repo/weights/model.ckpt")
|
|
|
|
|
|
def test_resolve_checkpoint_path_rejects_incomplete_huggingface_uri() -> None:
|
|
with pytest.raises(ValueError, match="hf://owner/repo/path/to"):
|
|
resolve_checkpoint_path("hf://owner/repo")
|
|
|
|
|
|
def test_resolve_checkpoint_path_rejects_missing_local_path() -> None:
|
|
with pytest.raises(FileNotFoundError, match="Checkpoint not found"):
|
|
resolve_checkpoint_path("missing.ckpt")
|