imaginAIry/imaginairy/utils.py

import importlib
import logging
import platform
from contextlib import contextmanager
from functools import lru_cache
from typing import List, Optional

import numpy as np
import torch
from PIL import Image
from torch import Tensor

logger = logging.getLogger(__name__)


@lru_cache()
def get_device():
    """Return the name of the preferred torch device: "cuda", "mps" or "cpu".

    CUDA is checked first, then the MPS backend; "cpu" is the fallback.
    The result is cached by ``lru_cache``, so availability is probed only on
    the first call.
    """
    if torch.cuda.is_available():
        return "cuda"
    # torch builds without the MPS backend have no ``torch.backends.mps``
    # attribute; treat that as "not available" instead of raising.
    mps_backend = getattr(torch.backends, "mps", None)
    if mps_backend is not None and mps_backend.is_available():
        return "mps"
    return "cpu"


@lru_cache()
def get_device_name(device_type):
    """Return a hardware name for ``device_type``.

    For "cuda" this is the name torch reports for CUDA device 0; for any
    other value it is whatever ``platform.processor()`` returns. Results are
    cached per ``device_type`` by ``lru_cache``.
    """
    if device_type != "cuda":
        return platform.processor()
    return torch.cuda.get_device_name(0)


def log_params(model):
    """Log, at debug level, the parameter count of ``model`` in millions.

    ``model`` must expose ``parameters()`` yielding objects with ``numel()``.
    """
    total_params = 0
    for param in model.parameters():
        total_params += param.numel()
    logger.debug(f"{model.__class__.__name__} has {total_params * 1.e-6:.2f} M params.")


def instantiate_from_config(config):
    """Build the object described by ``config``.

    ``config`` is normally a mapping with a ``target`` key (dotted path to a
    callable) and an optional ``params`` key (keyword arguments for it).
    The sentinel values "__is_first_stage__" and "__is_unconditional__"
    yield ``None``.

    Raises:
        KeyError: if ``config`` has no ``target`` and is not a sentinel.
    """
    if "target" in config:
        factory = get_obj_from_str(config["target"])
        kwargs = config.get("params", {})
        return factory(**kwargs)
    # No target: only the two sentinel markers are acceptable.
    if config in ("__is_first_stage__", "__is_unconditional__"):
        return None
    raise KeyError("Expected key `target` to instantiate.")


def get_obj_from_str(string, reload=False):
    """Resolve a dotted path such as ``"pkg.module.Name"`` to the named object.

    The text after the last dot is looked up as an attribute of the module
    named by the text before it. When ``reload`` is true the module is
    re-executed with ``importlib.reload`` before the lookup.
    """
    module_path, attr_name = string.rsplit(".", 1)
    if reload:
        importlib.reload(importlib.import_module(module_path))
    module_obj = importlib.import_module(module_path, package=None)
    return getattr(module_obj, attr_name)


from torch.overrides import handle_torch_function, has_torch_function_variadic


def _fixed_layer_norm(
    input: Tensor,
    normalized_shape: List[int],
    weight: Optional[Tensor] = None,
    bias: Optional[Tensor] = None,
    eps: float = 1e-5,
) -> Tensor:
    r"""Layer normalization over the trailing ``normalized_shape`` dimensions.

    Same call signature as ``torch.nn.functional.layer_norm``; the difference
    visible here is that ``input`` is made contiguous before being handed to
    ``torch.layer_norm``.
    See :class:`~torch.nn.LayerNorm` for details.
    """
    tensor_args = (input, weight, bias)
    # Defer to __torch_function__ overrides when any tensor argument has one.
    if has_torch_function_variadic(*tensor_args):
        return handle_torch_function(
            _fixed_layer_norm,
            tensor_args,
            input,
            normalized_shape,
            weight=weight,
            bias=bias,
            eps=eps,
        )
    # NOTE(review): the contiguous copy is presumably the actual workaround
    # (non-contiguous inputs failing on some backends) - confirm against the
    # issue linked from fix_torch_nn_layer_norm.
    contiguous_input = input.contiguous()
    cudnn_enabled = torch.backends.cudnn.enabled
    return torch.layer_norm(
        contiguous_input, normalized_shape, weight, bias, eps, cudnn_enabled
    )


@contextmanager
def fix_torch_nn_layer_norm():
    """Temporarily swap ``torch.nn.functional.layer_norm`` for ``_fixed_layer_norm``.

    The function that was installed on entry is put back when the ``with``
    block exits, whether it exits normally or by raising.

    Background:
    https://github.com/CompVis/stable-diffusion/issues/25#issuecomment-1221416526
    """
    import torch.nn.functional as nn_functional

    saved_layer_norm = nn_functional.layer_norm
    nn_functional.layer_norm = _fixed_layer_norm
    try:
        yield
    finally:
        # Always restore, so the patch never outlives the with-block.
        nn_functional.layer_norm = saved_layer_norm


def img_path_to_torch_image(path, max_height=512, max_width=512):
    """Open the image at ``path`` as RGB and convert it to a torch tensor.

    The loaded size is logged at info level; resizing and tensor conversion
    are delegated to ``pillow_img_to_torch_image``, whose return value is
    passed through unchanged.
    """
    image = Image.open(path)
    image = image.convert("RGB")
    logger.info(f"Loaded input 🖼 of size {image.size} from {path}")
    return pillow_img_to_torch_image(
        image,
        max_height=max_height,
        max_width=max_width,
    )


def pillow_img_to_torch_image(image, max_height=512, max_width=512):
    """Resize a Pillow image to fit the given bounds and convert it to a tensor.

    The image is scaled by one ratio so that it fits inside
    ``max_width`` x ``max_height``, then each side is rounded down to a
    multiple of 64 before a LANCZOS resize.

    Returns:
        A ``(tensor, w, h)`` tuple: the pixel data as a float32 tensor with a
        leading axis of length 1 and the channel axis moved ahead of the two
        spatial axes, rescaled from 0..255 to -1..1, plus the final width and
        height.
    """
    src_w, src_h = image.size
    scale = min(max_width / src_w, max_height / src_h)
    w = int(src_w * scale)
    h = int(src_h * scale)
    # Snap each side down to a multiple of 64.
    # NOTE: a scaled side shorter than 64 px becomes 0 here.
    w -= w % 64
    h -= h % 64
    resized = image.resize((w, h), resample=Image.Resampling.LANCZOS)
    pixels = np.array(resized).astype(np.float32) / 255.0
    # Add a leading axis, then reorder axes (0, 1, 2, 3) -> (0, 3, 1, 2).
    batched = np.transpose(pixels[None], (0, 3, 1, 2))
    tensor = torch.from_numpy(batched)
    return 2.0 * tensor - 1.0, w, h
first commit 2022-09-08 03:59:30 +00:00			`import importlib`
refactor: use logging instead of prints 2022-09-09 04:51:25 +00:00			`import logging`
feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2022-09-11 06:27:22 +00:00			`import platform`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2022-09-10 07:32:31 +00:00			`from contextlib import contextmanager`
first commit 2022-09-08 03:59:30 +00:00			`from functools import lru_cache`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2022-09-10 07:32:31 +00:00			`from typing import List, Optional`
first commit 2022-09-08 03:59:30 +00:00
feature: (wip) better image to image I tried it with the DDIM sampler and it didn't work. Probably need to use the k-diffusion sampler with it from https://gist.githubusercontent.com/trygvebw/c71334dd127d537a15e9d59790f7f5e1/raw/a846393251f5be8289d4febc75a19f1f962aabcc/find_noise.py needs https://github.com/crowsonkb/k-diffusion 2022-09-12 01:00:40 +00:00			`import numpy as np`
first commit 2022-09-08 03:59:30 +00:00			`import torch`
feature: (wip) better image to image I tried it with the DDIM sampler and it didn't work. Probably need to use the k-diffusion sampler with it from https://gist.githubusercontent.com/trygvebw/c71334dd127d537a15e9d59790f7f5e1/raw/a846393251f5be8289d4febc75a19f1f962aabcc/find_noise.py needs https://github.com/crowsonkb/k-diffusion 2022-09-12 01:00:40 +00:00			`from PIL import Image`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2022-09-10 07:32:31 +00:00			`from torch import Tensor`
first commit 2022-09-08 03:59:30 +00:00
refactor: use logging instead of prints 2022-09-09 04:51:25 +00:00			`logger = logging.getLogger(__name__)`

first commit 2022-09-08 03:59:30 +00:00
			`@lru_cache()`
			`def get_device():`
			`if torch.cuda.is_available():`
			`return "cuda"`
			`elif torch.backends.mps.is_available():`
			`return "mps"`
			`else:`
			`return "cpu"`


feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2022-09-11 06:27:22 +00:00			`@lru_cache()`
			`def get_device_name(device_type):`
			`if device_type == "cuda":`
			`return torch.cuda.get_device_name(0)`
			`return platform.processor()`


refactor: use logging instead of prints 2022-09-09 04:51:25 +00:00			`def log_params(model):`
first commit 2022-09-08 03:59:30 +00:00			`total_params = sum(p.numel() for p in model.parameters())`
feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2022-09-11 06:27:22 +00:00			`logger.debug(f"{model.__class__.__name__} has {total_params * 1.e-6:.2f} M params.")`
first commit 2022-09-08 03:59:30 +00:00

			`def instantiate_from_config(config):`
			`if not "target" in config:`
			`if config == "__is_first_stage__":`
			`return None`
			`elif config == "__is_unconditional__":`
			`return None`
			raise KeyError("Expected key `target` to instantiate.")
			`return get_obj_from_str(config["target"])(**config.get("params", dict()))`


			`def get_obj_from_str(string, reload=False):`
			`module, cls = string.rsplit(".", 1)`
			`if reload:`
			`module_imp = importlib.import_module(module)`
			`importlib.reload(module_imp)`
			`return getattr(importlib.import_module(module, package=None), cls)`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2022-09-10 07:32:31 +00:00

refactor: run import sorter 2022-09-11 20:58:14 +00:00			`from torch.overrides import handle_torch_function, has_torch_function_variadic`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2022-09-10 07:32:31 +00:00

			`def _fixed_layer_norm(`
			`input: Tensor,`
			`normalized_shape: List[int],`
			`weight: Optional[Tensor] = None,`
			`bias: Optional[Tensor] = None,`
			`eps: float = 1e-5,`
			`) -> Tensor:`
			`r"""Applies Layer Normalization for last certain number of dimensions.`
			See :class:`~torch.nn.LayerNorm` for details.
			`"""`
			`if has_torch_function_variadic(input, weight, bias):`
			`return handle_torch_function(`
			`_fixed_layer_norm,`
			`(input, weight, bias),`
			`input,`
			`normalized_shape,`
			`weight=weight,`
			`bias=bias,`
			`eps=eps,`
			`)`
			`return torch.layer_norm(`
			`input.contiguous(),`
			`normalized_shape,`
			`weight,`
			`bias,`
			`eps,`
			`torch.backends.cudnn.enabled,`
			`)`


			`@contextmanager`
			`def fix_torch_nn_layer_norm():`
			`"""https://github.com/CompVis/stable-diffusion/issues/25#issuecomment-1221416526"""`
			`from torch.nn import functional`

			`orig_function = functional.layer_norm`
			`functional.layer_norm = _fixed_layer_norm`
			`try:`
			`yield`
			`finally:`
			`functional.layer_norm = orig_function`
feature: (wip) better image to image I tried it with the DDIM sampler and it didn't work. Probably need to use the k-diffusion sampler with it from https://gist.githubusercontent.com/trygvebw/c71334dd127d537a15e9d59790f7f5e1/raw/a846393251f5be8289d4febc75a19f1f962aabcc/find_noise.py needs https://github.com/crowsonkb/k-diffusion 2022-09-12 01:00:40 +00:00

			`def img_path_to_torch_image(path, max_height=512, max_width=512):`
			`image = Image.open(path).convert("RGB")`
perf: get "half" mode working when running on cuda 2022-09-12 04:32:11 +00:00			`logger.info(f"Loaded input 🖼 of size {image.size} from {path}")`
feature: (wip) better image to image I tried it with the DDIM sampler and it didn't work. Probably need to use the k-diffusion sampler with it from https://gist.githubusercontent.com/trygvebw/c71334dd127d537a15e9d59790f7f5e1/raw/a846393251f5be8289d4febc75a19f1f962aabcc/find_noise.py needs https://github.com/crowsonkb/k-diffusion 2022-09-12 01:00:40 +00:00			`return pillow_img_to_torch_image(image, max_height=max_height, max_width=max_width)`


			`def pillow_img_to_torch_image(image, max_height=512, max_width=512):`
			`w, h = image.size`
			`resize_ratio = min(max_width / w, max_height / h)`
			`w, h = int(w * resize_ratio), int(h * resize_ratio)`
			`w, h = map(lambda x: x - x % 64, (w, h)) # resize to integer multiple of 32`
perf: get "half" mode working when running on cuda 2022-09-12 04:32:11 +00:00			`image = image.resize((w, h), resample=Image.Resampling.LANCZOS)`
feature: (wip) better image to image I tried it with the DDIM sampler and it didn't work. Probably need to use the k-diffusion sampler with it from https://gist.githubusercontent.com/trygvebw/c71334dd127d537a15e9d59790f7f5e1/raw/a846393251f5be8289d4febc75a19f1f962aabcc/find_noise.py needs https://github.com/crowsonkb/k-diffusion 2022-09-12 01:00:40 +00:00			`image = np.array(image).astype(np.float32) / 255.0`
			`image = image[None].transpose(0, 3, 1, 2)`
			`image = torch.from_numpy(image)`
			`return 2.0 * image - 1.0, w, h`