imaginAIry/imaginairy/utils.py

import importlib
import logging
import os.path
import platform
from contextlib import contextmanager, nullcontext
from functools import lru_cache
from typing import List, Optional

import requests
import torch
from torch import Tensor, autocast
from torch.nn import functional
from torch.overrides import handle_torch_function, has_torch_function_variadic
from transformers import cached_path

# Module-level logger, named after this module's import path.
logger = logging.getLogger(__name__)


@lru_cache()
def get_device():
    """
    Pick the torch device string to run on.

    CUDA wins when available, then the MPS backend, and the CPU is the
    fallback.  The result is memoized, so the backends are only probed on
    the first call.
    """
    if not torch.cuda.is_available():
        mps_ready = torch.backends.mps.is_available()
        return "mps:0" if mps_ready else "cpu"
    return "cuda"


@lru_cache()
def get_device_name(device_type):
    """
    Return a human-readable name for the hardware behind ``device_type``.

    For ``"cuda"`` this is the name of CUDA device 0; for every other value
    it is whatever ``platform.processor()`` reports.  Results are memoized
    per ``device_type``.
    """
    is_cuda = device_type == "cuda"
    return torch.cuda.get_device_name(0) if is_cuda else platform.processor()


def log_params(model):
    """
    Emit a debug log line with the parameter count of ``model`` in millions.

    ``model`` must expose ``parameters()`` yielding objects with ``numel()``.
    """
    total_params = 0
    for param in model.parameters():
        total_params += param.numel()
    logger.debug(f"{model.__class__.__name__} has {total_params * 1.e-6:.2f} M params.")


def instantiate_from_config(config):
    """
    Build the object described by ``config``.

    When ``config`` contains a ``"target"`` entry, that dotted path is
    resolved with ``get_obj_from_str`` and called with the optional
    ``"params"`` mapping as keyword arguments.

    The sentinel strings ``"__is_first_stage__"`` and
    ``"__is_unconditional__"`` yield ``None``.

    Raises:
        KeyError: ``config`` has no ``"target"`` and is not a sentinel.
    """
    if "target" in config:
        factory = get_obj_from_str(config["target"])
        kwargs = config.get("params", {})
        return factory(**kwargs)

    # No target: only the two sentinel values are acceptable.
    if config == "__is_first_stage__" or config == "__is_unconditional__":
        return None
    raise KeyError("Expected key `target` to instantiate.")


def get_obj_from_str(string, reload=False):
    """
    Resolve a dotted path such as ``"package.module.Name"`` to the object it names.

    Everything before the last dot is imported as a module and the final
    component is looked up as an attribute on it.  With ``reload=True`` the
    module is reloaded before the lookup.

    Raises:
        ValueError: ``string`` contains no dot.
    """
    module_name, attr_name = string.rsplit(".", 1)
    if reload:
        importlib.reload(importlib.import_module(module_name))
    resolved_module = importlib.import_module(module_name, package=None)
    return getattr(resolved_module, attr_name)


@contextmanager
def platform_appropriate_autocast(precision="autocast"):
    """
    Allow calculations to run in mixed precision, which can be faster.

    ``torch.autocast`` is entered only when ``precision`` is ``"autocast"``
    and the active device is ``"cuda"`` or ``"cpu"``; in every other case
    the body runs inside a no-op context.
    """
    device = get_device()
    wants_autocast = precision == "autocast" and device in ("cuda", "cpu")
    scope_factory = autocast if wants_autocast else nullcontext
    with scope_factory(device):
        yield


def _fixed_layer_norm(
    input: Tensor,  # noqa
    normalized_shape: List[int],
    weight: Optional[Tensor] = None,
    bias: Optional[Tensor] = None,
    eps: float = 1e-5,
) -> Tensor:
    """
    Layer-normalize ``input`` over its trailing ``normalized_shape`` dimensions.

    Same call signature as ``torch.nn.functional.layer_norm``; the difference
    is that ``input`` is made contiguous before ``torch.layer_norm`` runs.

    See :class:`~torch.nn.LayerNorm` for details.
    """
    tensor_args = (input, weight, bias)
    if not has_torch_function_variadic(*tensor_args):
        contiguous_input = input.contiguous()
        use_cudnn = torch.backends.cudnn.enabled
        return torch.layer_norm(
            contiguous_input, normalized_shape, weight, bias, eps, use_cudnn
        )

    # At least one argument overrides __torch_function__: defer to its handler.
    return handle_torch_function(
        _fixed_layer_norm,
        tensor_args,
        input,
        normalized_shape,
        weight=weight,
        bias=bias,
        eps=eps,
    )


@contextmanager
def fix_torch_nn_layer_norm():
    """
    Temporarily replace ``functional.layer_norm`` with ``_fixed_layer_norm``.

    The previous function is put back when the context exits, including
    when the body raises.

    https://github.com/CompVis/stable-diffusion/issues/25#issuecomment-1221416526
    """
    saved_layer_norm = functional.layer_norm
    try:
        functional.layer_norm = _fixed_layer_norm
        yield
    finally:
        functional.layer_norm = saved_layer_norm


@contextmanager
def fix_torch_group_norm():
    """
    Temporarily patch ``functional.group_norm`` so weights match the input dtype.

    While the context is active, ``weight`` and ``bias`` are cast to the
    dtype of ``input`` (when they differ) before the real ``group_norm`` is
    called.  The original function is restored on exit, including when the
    body raises.

    From what I can understand all the other repos just switch to full
    precision instead of addressing this.  I think this would make things
    slower but I'm not sure.

    https://github.com/pytorch/pytorch/pull/81852
    """
    wrapped_group_norm = functional.group_norm

    def _as_input_dtype(param, reference):
        # ``None`` and already-matching tensors pass through untouched.
        if param is None or param.dtype == reference.dtype:
            return param
        return param.to(reference.dtype)

    def _group_norm_wrapper(
        input: Tensor,  # noqa
        num_groups: int,
        weight: Optional[Tensor] = None,
        bias: Optional[Tensor] = None,
        eps: float = 1e-5,
    ) -> Tensor:
        return wrapped_group_norm(
            input=input,
            num_groups=num_groups,
            weight=_as_input_dtype(weight, input),
            bias=_as_input_dtype(bias, input),
            eps=eps,
        )

    functional.group_norm = _group_norm_wrapper
    try:
        yield
    finally:
        functional.group_norm = wrapped_group_norm


def get_cache_dir():
    """
    Return the directory in which downloaded weights are cached.

    Resolution order:

    1. ``$XDG_CACHE_HOME/imaginairy/weights``
    2. ``$HOME/.cache/imaginairy/weights``
    3. ``.cached-downloads`` next to this module, when neither variable
       holds a usable value.

    An empty ``XDG_CACHE_HOME`` is treated the same as an unset one, as the
    XDG Base Directory Specification requires; otherwise the result would be
    the relative path ``imaginairy/weights`` under the current directory.

    The directory is not created by this function.
    """
    # ``or None`` folds the empty string into the "unset" case.
    xdg_cache_home = os.getenv("XDG_CACHE_HOME") or None
    if xdg_cache_home is None:
        user_home = os.getenv("HOME")
        if user_home:
            xdg_cache_home = os.path.join(user_home, ".cache")

    if xdg_cache_home is None:
        # No usable home directory: keep the cache beside the package.
        return os.path.join(os.path.dirname(__file__), ".cached-downloads")

    return os.path.join(xdg_cache_home, "imaginairy", "weights")


def get_cached_url_path(url):
    """
    Return a local filesystem path holding the content of ``url``.

    ``transformers.cached_path`` is tried first.  If it raises ``OSError``
    the file is looked up in (and, when missing, downloaded into) the
    directory returned by ``get_cache_dir()``, using the last path segment
    of ``url`` as the file name.

    The download is streamed to a ``.part`` file and only renamed to its
    final name once it has completed successfully, so a failed or
    interrupted transfer never leaves a file that a later call would mistake
    for a valid cache entry.

    Raises:
        requests.HTTPError: the server answered with an error status.
        requests.RequestException: the download failed or timed out.
    """
    try:
        return cached_path(url)
    except OSError as exc:
        # cached_path could not provide the file; fall back to our own cache.
        logger.debug("cached_path failed for %s (%s); using local cache", url, exc)

    filename = url.split("/")[-1]
    dest = get_cache_dir()
    os.makedirs(dest, exist_ok=True)
    dest_path = os.path.join(dest, filename)
    if os.path.exists(dest_path):
        return dest_path

    partial_path = f"{dest_path}.part"
    try:
        # stream=True keeps large weight files out of memory; the timeout is
        # (connect, per-read) seconds so a stalled server cannot hang forever.
        with requests.get(url, stream=True, timeout=(10, 60)) as response:
            # Without this an HTML error page would be cached as the weights.
            response.raise_for_status()
            with open(partial_path, "wb") as f:
                for chunk in response.iter_content(chunk_size=1024 * 1024):
                    f.write(chunk)
        os.replace(partial_path, dest_path)
    except BaseException:
        # Remove the incomplete download (also on Ctrl-C) before re-raising.
        if os.path.exists(partial_path):
            os.remove(partial_path)
        raise
    return dest_path
first commit 2022-09-08 03:59:30 +00:00			`import importlib`
refactor: use logging instead of prints 2022-09-09 04:51:25 +00:00			`import logging`
feature: face enhancement and upscaling!! 2022-09-13 07:27:53 +00:00			`import os.path`
feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2022-09-11 06:27:22 +00:00			`import platform`
fix: try to address #13 BFloat16 issue Seems to be caused by incompatible types in group_norm when we use autocast. Patch group_norm to cast the weights to the same type as the inputs From what I can understand all the other repos just switch to full precision instead of addressing this. I think this would make things slower but I'm not sure. So maybe the patching solution I'm doing is better? https://github.com/pytorch/pytorch/pull/81852 2022-09-22 05:03:12 +00:00			`from contextlib import contextmanager, nullcontext`
first commit 2022-09-08 03:59:30 +00:00			`from functools import lru_cache`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2022-09-10 07:32:31 +00:00			`from typing import List, Optional`
first commit 2022-09-08 03:59:30 +00:00
feature: face enhancement and upscaling!! 2022-09-13 07:27:53 +00:00			`import requests`
first commit 2022-09-08 03:59:30 +00:00			`import torch`
fix: try to address #13 BFloat16 issue Seems to be caused by incompatible types in group_norm when we use autocast. Patch group_norm to cast the weights to the same type as the inputs From what I can understand all the other repos just switch to full precision instead of addressing this. I think this would make things slower but I'm not sure. So maybe the patching solution I'm doing is better? https://github.com/pytorch/pytorch/pull/81852 2022-09-22 05:03:12 +00:00			`from torch import Tensor, autocast`
style: lint fixes. remove unused code 2022-09-16 16:24:24 +00:00			`from torch.nn import functional`
docs and lint 2022-09-13 07:46:37 +00:00			`from torch.overrides import handle_torch_function, has_torch_function_variadic`
feature: face enhancement and upscaling!! 2022-09-13 07:27:53 +00:00			`from transformers import cached_path`
first commit 2022-09-08 03:59:30 +00:00
refactor: use logging instead of prints 2022-09-09 04:51:25 +00:00			`logger = logging.getLogger(__name__)`

first commit 2022-09-08 03:59:30 +00:00
			`@lru_cache()`
			`def get_device():`
			`if torch.cuda.is_available():`
			`return "cuda"`
style: lint fixes. remove unused code 2022-09-16 16:24:24 +00:00
			`if torch.backends.mps.is_available():`
refactor: cleanup ddim 2022-09-17 19:24:27 +00:00			`return "mps:0"`
style: lint fixes. remove unused code 2022-09-16 16:24:24 +00:00
			`return "cpu"`
first commit 2022-09-08 03:59:30 +00:00

feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2022-09-11 06:27:22 +00:00			`@lru_cache()`
			`def get_device_name(device_type):`
			`if device_type == "cuda":`
			`return torch.cuda.get_device_name(0)`
			`return platform.processor()`


refactor: use logging instead of prints 2022-09-09 04:51:25 +00:00			`def log_params(model):`
first commit 2022-09-08 03:59:30 +00:00			`total_params = sum(p.numel() for p in model.parameters())`
feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2022-09-11 06:27:22 +00:00			`logger.debug(f"{model.__class__.__name__} has {total_params * 1.e-6:.2f} M params.")`
first commit 2022-09-08 03:59:30 +00:00

			`def instantiate_from_config(config):`
style: lint fixes. remove unused code 2022-09-16 16:24:24 +00:00			`if "target" not in config:`
first commit 2022-09-08 03:59:30 +00:00			`if config == "__is_first_stage__":`
			`return None`
style: lint fixes. remove unused code 2022-09-16 16:24:24 +00:00			`if config == "__is_unconditional__":`
first commit 2022-09-08 03:59:30 +00:00			`return None`
			raise KeyError("Expected key `target` to instantiate.")
style: lint fixes. remove unused code 2022-09-16 16:24:24 +00:00			`return get_obj_from_str(config["target"])(**config.get("params", {}))`
first commit 2022-09-08 03:59:30 +00:00

			`def get_obj_from_str(string, reload=False):`
			`module, cls = string.rsplit(".", 1)`
			`if reload:`
			`module_imp = importlib.import_module(module)`
			`importlib.reload(module_imp)`
			`return getattr(importlib.import_module(module, package=None), cls)`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2022-09-10 07:32:31 +00:00

tests: add docker image for testing environment. minor test improvements 2022-09-22 05:38:44 +00:00			`@contextmanager`
			`def platform_appropriate_autocast(precision="autocast"):`
			`"""`
feature: boolean logic masks Specify advanced text based masks using boolean logic and strength modifiers. Mask descriptions must be lowercase. Keywords uppercase. Valid symbols: `AND`, `OR`, `NOT`, `()`, and mask strength modifier `{1.5}` where `+` can be any of `+ - /`. Single-character boolean operators also work. When writing strength modifies know that pixel values are between 0 and 1. - feature: apply mask edits to original files - feature: auto-rotate images if exif data specifies to do so - fix: accept mask images in command line 2022-09-24 05:58:48 +00:00			`Allow calculations to run in mixed precision, which can be faster`
tests: add docker image for testing environment. minor test improvements 2022-09-22 05:38:44 +00:00			`"""`
			`precision_scope = nullcontext`
			`if precision == "autocast" and get_device() in ("cuda", "cpu"):`
			`precision_scope = autocast`
			`with precision_scope(get_device()):`
			`yield`


feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2022-09-10 07:32:31 +00:00			`def _fixed_layer_norm(`
style: lint fixes. remove unused code 2022-09-16 16:24:24 +00:00			`input: Tensor, # noqa`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2022-09-10 07:32:31 +00:00			`normalized_shape: List[int],`
			`weight: Optional[Tensor] = None,`
			`bias: Optional[Tensor] = None,`
			`eps: float = 1e-5,`
			`) -> Tensor:`
style: lint fixes. remove unused code 2022-09-16 16:24:24 +00:00			`"""`
			`Applies Layer Normalization for last certain number of dimensions.`

feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2022-09-10 07:32:31 +00:00			See :class:`~torch.nn.LayerNorm` for details.
			`"""`
			`if has_torch_function_variadic(input, weight, bias):`
			`return handle_torch_function(`
			`_fixed_layer_norm,`
			`(input, weight, bias),`
			`input,`
			`normalized_shape,`
			`weight=weight,`
			`bias=bias,`
			`eps=eps,`
			`)`
			`return torch.layer_norm(`
			`input.contiguous(),`
			`normalized_shape,`
			`weight,`
			`bias,`
			`eps,`
			`torch.backends.cudnn.enabled,`
			`)`


			`@contextmanager`
			`def fix_torch_nn_layer_norm():`
			`"""https://github.com/CompVis/stable-diffusion/issues/25#issuecomment-1221416526"""`
			`orig_function = functional.layer_norm`
			`functional.layer_norm = _fixed_layer_norm`
			`try:`
			`yield`
			`finally:`
			`functional.layer_norm = orig_function`
feature: (wip) better image to image I tried it with the DDIM sampler and it didn't work. Probably need to use the k-diffusion sampler with it from https://gist.githubusercontent.com/trygvebw/c71334dd127d537a15e9d59790f7f5e1/raw/a846393251f5be8289d4febc75a19f1f962aabcc/find_noise.py needs https://github.com/crowsonkb/k-diffusion 2022-09-12 01:00:40 +00:00

fix: try to address #13 BFloat16 issue Seems to be caused by incompatible types in group_norm when we use autocast. Patch group_norm to cast the weights to the same type as the inputs From what I can understand all the other repos just switch to full precision instead of addressing this. I think this would make things slower but I'm not sure. So maybe the patching solution I'm doing is better? https://github.com/pytorch/pytorch/pull/81852 2022-09-22 05:03:12 +00:00			`@contextmanager`
			`def fix_torch_group_norm():`
			`"""`
			`Patch group_norm to cast the weights to the same type as the inputs`

			`From what I can understand all the other repos just switch to full precision instead`
			`of addressing this. I think this would make things slower but I'm not sure.`

			`https://github.com/pytorch/pytorch/pull/81852`

			`"""`

			`orig_group_norm = functional.group_norm`

			`def _group_norm_wrapper(`
tests: add docker image for testing environment. minor test improvements 2022-09-22 05:38:44 +00:00			`input: Tensor, # noqa`
fix: try to address #13 BFloat16 issue Seems to be caused by incompatible types in group_norm when we use autocast. Patch group_norm to cast the weights to the same type as the inputs From what I can understand all the other repos just switch to full precision instead of addressing this. I think this would make things slower but I'm not sure. So maybe the patching solution I'm doing is better? https://github.com/pytorch/pytorch/pull/81852 2022-09-22 05:03:12 +00:00			`num_groups: int,`
			`weight: Optional[Tensor] = None,`
			`bias: Optional[Tensor] = None,`
			`eps: float = 1e-5,`
			`) -> Tensor:`
			`if weight is not None and weight.dtype != input.dtype:`
			`weight = weight.to(input.dtype)`
			`if bias is not None and bias.dtype != input.dtype:`
			`bias = bias.to(input.dtype)`

			`return orig_group_norm(`
			`input=input, num_groups=num_groups, weight=weight, bias=bias, eps=eps`
			`)`

			`functional.group_norm = _group_norm_wrapper`
			`try:`
			`yield`
			`finally:`
			`functional.group_norm = orig_group_norm`


feature: face enhancement and upscaling!! 2022-09-13 07:27:53 +00:00			`def get_cache_dir():`
			`xdg_cache_home = os.getenv("XDG_CACHE_HOME", None)`
			`if xdg_cache_home is None:`
			`user_home = os.getenv("HOME", None)`
			`if user_home:`
			`xdg_cache_home = os.path.join(user_home, ".cache")`

			`if xdg_cache_home is not None:`
			`return os.path.join(xdg_cache_home, "imaginairy", "weights")`

			`return os.path.join(os.path.dirname(__file__), ".cached-downloads")`


			`def get_cached_url_path(url):`
			`try:`
			`return cached_path(url)`
			`except OSError:`
			`pass`
			`filename = url.split("/")[-1]`
			`dest = get_cache_dir()`
			`os.makedirs(dest, exist_ok=True)`
			`dest_path = os.path.join(dest, filename)`
			`if os.path.exists(dest_path):`
			`return dest_path`
style: lint fixes. remove unused code 2022-09-16 16:24:24 +00:00			`r = requests.get(url) # noqa`
feature: face enhancement and upscaling!! 2022-09-13 07:27:53 +00:00
			`with open(dest_path, "wb") as f:`
			`f.write(r.content)`
			`return dest_path`