bipolaroidbipolaroid/src/models/__init__.py

76 lines
2.3 KiB
Python

from typing import Any, Dict, Tuple
from .simple_cnn import SimpleCNN
from .residual import Residual
from .histogram_net import HistogramNet
from .dummy import Dummy
import torch
import torch.nn as nn
from pathlib import Path
import logging
import json
MODELS = {
"Dummy": Dummy,
"SimpleCNN": SimpleCNN,
"Residual": Residual,
"HistogramNet": HistogramNet,
}
def create_model(
type: str, hyperparameters: Dict[str, Any], device: torch.device
) -> nn.Module:
return MODELS[type](**hyperparameters).to(device)
def save_model(model: nn.Module, hyperparameters: Dict[str, Any], path: Path):
model_path = path.with_suffix(".pth")
params_path = path.with_suffix(".json")
logging.info(f"Saving model to {model_path}")
logging.info(f"Parameter count: {sum(p.numel() for p in model.parameters())}")
with open(model_path, "wb") as f:
torch.save(model.state_dict(), f)
with open(params_path, "w") as f:
json.dump(hyperparameters, f, indent=2)
def load_model(path: Path, device: torch.device) -> Tuple[nn.Module, Dict[str, Any]]:
logging.info(f"Loading model from {path}")
params_path = path.with_suffix(".json")
with open(params_path) as f:
hyperparameters = json.load(f)
logging.info(f"Hyperparameters: {hyperparameters}")
model_path = path.with_suffix(".pth")
model = create_model(
type=hyperparameters["model_type"],
hyperparameters=hyperparameters,
device=device,
)
model.load_state_dict(torch.load(model_path))
logging.info(f"Parameter count: {sum(p.numel() for p in model.parameters())}")
return model, hyperparameters
def test_models():
for model_name, model_constructor in MODELS.items():
logging.info(f"Testing model {model_name}")
_test_network_dimensions(model_constructor)
def _test_network_dimensions(constructor):
for bin_count in [16, 32, 64]:
model = constructor()
# Create a dummy input tensor of the correct shape, the mini-batch size is 4
input_tensor = torch.rand(4, 1, bin_count, bin_count, bin_count)
output = model(input_tensor)
assert (
input_tensor.shape == output.shape
), f"Expected output shape {input_tensor.shape}, but got {output.shape}"
logging.info("Test passed! Output shape matches input shape.")