Source code for starling.inference.model_loading

import os

import torch

import starling
from starling import configs

# local imports
from starling.configs import DEFAULT_DDPM_WEIGHTS_PATH, DEFAULT_ENCODER_WEIGHTS_PATH
from starling.models.diffusion import DiffusionModel
from starling.models.transformer import SequenceEncoder
from starling.models.vae import VAE
from starling.models.vit import ViT



[docs]
class ModelManager:

[docs]
    def __init__(self):
        """Create a manager that does not hold any loaded models yet."""
        # Both slots stay None until the models are actually loaded.
        self.encoder_model, self.diffusion_model = None, None



[docs]
    def load_models(self, encoder_path, ddpm_path, device):
        """
        Load the encoder and diffusion models from local files or URLs.

        Parameters
        ----------
        encoder_path : str or os.PathLike or None
            Local path or http(s) URL of the encoder checkpoint. A falsy
            value selects ``DEFAULT_ENCODER_WEIGHTS_PATH``.
        ddpm_path : str or os.PathLike or None
            Local path or http(s) URL of the DDPM checkpoint. A falsy
            value selects ``DEFAULT_DDPM_WEIGHTS_PATH``.
        device
            Forwarded as ``map_location`` when both checkpoints are loaded.

        Returns
        -------
        encoder_model, diffusion_model
            The loaded encoder and diffusion models.

        Raises
        ------
        FileNotFoundError
            If either resolved checkpoint file does not exist locally.
        """

        def resolve_checkpoint(location):
            """Return a local file path for ``location``, downloading URLs once."""
            # Accept pathlib.Path and other path-like objects as well as str.
            location = os.fspath(location)

            # Only genuine http(s) URLs are downloaded; a local path that
            # merely begins with the letters "http" is left untouched.
            if not location.lower().startswith(("http://", "https://")):
                return location

            # Downloads are cached under torch.hub's checkpoint directory.
            cache_dir = os.path.join(torch.hub.get_dir(), "checkpoints")
            os.makedirs(cache_dir, exist_ok=True)

            # The cached file keeps the last URL segment as its name so that
            # previously downloaded checkpoints are found again.
            cached_path = os.path.join(cache_dir, os.path.basename(location))
            if not os.path.exists(cached_path):
                torch.hub.download_url_to_file(location, cached_path)
            return cached_path

        # Fall back to the packaged defaults, then make sure each checkpoint
        # is available as a local file.
        encoder_path = resolve_checkpoint(encoder_path or DEFAULT_ENCODER_WEIGHTS_PATH)
        ddpm_path = resolve_checkpoint(ddpm_path or DEFAULT_DDPM_WEIGHTS_PATH)

        # Fail early with an explicit message instead of deep inside the
        # checkpoint loaders.
        if not os.path.exists(encoder_path):
            raise FileNotFoundError(f"Encoder model {encoder_path} not found.")
        if not os.path.exists(ddpm_path):
            raise FileNotFoundError(f"DDPM model {ddpm_path} not found.")

        # Load the diffusion model.
        # NOTE(review): the architecture arguments below are hard-coded;
        # presumably they must match the released checkpoints - confirm
        # before changing them.
        sequence_encoder = SequenceEncoder(12, 512, 8)
        diffusion_model = DiffusionModel.load_from_checkpoint(
            ddpm_path,
            model=ViT(12, 512, 8, 512),
            sequence_encoder=sequence_encoder,
            # The diffusion model is handed the encoder checkpoint *path*;
            # the encoder itself is loaded separately below.
            distance_map_encoder=encoder_path,
            map_location=device,
        )

        # Load the encoder model.
        encoder_model = VAE.load_from_checkpoint(
            encoder_path,
            map_location=device,
        )
        return encoder_model, diffusion_model



[docs]
    def get_models(
        self,
        encoder_path=DEFAULT_ENCODER_WEIGHTS_PATH,
        ddpm_path=DEFAULT_DDPM_WEIGHTS_PATH,
        device="cpu",
    ):
        """
        Return the encoder and diffusion models, loading them on first use.

        If both models are already held by this manager they are returned
        as-is and the arguments are ignored. Otherwise the models are loaded
        with ``load_models`` and, when ``configs.TORCH_COMPILATION["enabled"]``
        is truthy, passed through ``compile`` before being returned.

        Parameters
        ----------
        encoder_path : str
            The path to the encoder model.
            Default is ``DEFAULT_ENCODER_WEIGHTS_PATH``.
        ddpm_path : str
            The path to the DDPM model.
            Default is ``DEFAULT_DDPM_WEIGHTS_PATH``.
        device : str
            The device on which to load the models. Default is ``"cpu"``.

        Returns
        -------
        encoder_model, diffusion_model
            The loaded encoder and diffusion models.
        """
        models_ready = (
            self.encoder_model is not None and self.diffusion_model is not None
        )
        if models_ready:
            # Nothing to do: hand back the models loaded earlier.
            return self.encoder_model, self.diffusion_model

        # First request (or a previous load left a slot empty): load now.
        loaded = self.load_models(encoder_path, ddpm_path, device)
        self.encoder_model, self.diffusion_model = loaded

        if configs.TORCH_COMPILATION["enabled"]:
            # Compilation was requested in the configuration.
            compiled = self.compile()
            self.encoder_model, self.diffusion_model = compiled

        return self.encoder_model, self.diffusion_model



[docs]
    def compile(self):
        """
        Wrap parts of the loaded models with ``torch.compile``.

        The diffusion model's ``model`` attribute and the encoder model's
        ``decoder`` attribute are replaced by their ``torch.compile``-wrapped
        counterparts. A copy of ``configs.TORCH_COMPILATION["options"]`` is
        passed as keyword arguments, and the options used are printed.

        Returns
        -------
        encoder_model, diffusion_model
            The same model objects, now holding the wrapped submodules.

        Raises
        ------
        RuntimeError
            If the models have not been loaded yet.
        """
        # Without this guard the attribute access below fails with an opaque
        # "'NoneType' object has no attribute ..." error.
        if self.encoder_model is None or self.diffusion_model is None:
            raise RuntimeError(
                "Models must be loaded (e.g. via get_models) before calling compile()."
            )

        # Copy so the shared configuration dictionary is never mutated.
        compile_kwargs = configs.TORCH_COMPILATION["options"].copy()

        self.diffusion_model.model = torch.compile(
            self.diffusion_model.model, **compile_kwargs
        )
        self.encoder_model.decoder = torch.compile(
            self.encoder_model.decoder, **compile_kwargs
        )
        # NOTE: diffusion_model.sequence_encoder is not compiled here.

        print(
            "\nCompiling the diffusion model for faster inference, this may take a while..."
        )
        print(
            "This is a one-time operation, subsequent inferences will be MUCH faster.\n"
        )
        print("Compiling with the following options:")
        for key, value in compile_kwargs.items():
            print(f"  {key}: {value}")

        return self.encoder_model, self.diffusion_model