imaginAIry/imaginairy/modules/sgm/autoencoding/lpips/util.py

"""Utilities for model checkpoint management and normalization layers"""

import hashlib
import os

import requests
import torch
import torch.nn as nn
from tqdm import tqdm

URL_MAP = {"vgg_lpips": "https://heibox.uni-heidelberg.de/f/607503859c864bc1b30b/?dl=1"}

CKPT_MAP = {"vgg_lpips": "vgg.pth"}

MD5_MAP = {"vgg_lpips": "d507d7349b931f0638a25a48a722f98a"}


def download(url, local_path, chunk_size=1024):
    os.makedirs(os.path.split(local_path)[0], exist_ok=True)
    with requests.get(url, stream=True) as r, tqdm(
        total=int(r.headers.get("content-length", 0)), unit="B", unit_scale=True
    ) as pbar, open(local_path, "wb") as f:
        for data in r.iter_content(chunk_size=chunk_size):
            if data:
                f.write(data)
                pbar.update(chunk_size)


def md5_hash(path):
    with open(path, "rb") as f:
        content = f.read()
    return hashlib.md5(content).hexdigest()


def get_ckpt_path(name, root, check=False):
    assert name in URL_MAP
    path = os.path.join(root, CKPT_MAP[name])
    if not os.path.exists(path) or (check and md5_hash(path) != MD5_MAP[name]):
        print(f"Downloading {name} model from {URL_MAP[name]} to {path}")
        download(URL_MAP[name], path)
        md5 = md5_hash(path)
        assert md5 == MD5_MAP[name], md5
    return path


class ActNorm(nn.Module):
    def __init__(
        self, num_features, logdet=False, affine=True, allow_reverse_init=False
    ):
        assert affine
        super().__init__()
        self.logdet = logdet
        self.loc = nn.Parameter(torch.zeros(1, num_features, 1, 1))
        self.scale = nn.Parameter(torch.ones(1, num_features, 1, 1))
        self.allow_reverse_init = allow_reverse_init

        self.register_buffer("initialized", torch.tensor(0, dtype=torch.uint8))

    def initialize(self, input_tensor):
        with torch.no_grad():
            flatten = (
                input_tensor.permute(1, 0, 2, 3)
                .contiguous()
                .view(input_tensor.shape[1], -1)
            )
            mean = (
                flatten.mean(1)
                .unsqueeze(1)
                .unsqueeze(2)
                .unsqueeze(3)
                .permute(1, 0, 2, 3)
            )
            std = (
                flatten.std(1)
                .unsqueeze(1)
                .unsqueeze(2)
                .unsqueeze(3)
                .permute(1, 0, 2, 3)
            )

            self.loc.data.copy_(-mean)
            self.scale.data.copy_(1 / (std + 1e-6))

    def forward(self, input_tensor, reverse=False):
        if reverse:
            return self.reverse(input_tensor)
        if len(input_tensor.shape) == 2:
            input_tensor = input_tensor[:, :, None, None]
            squeeze = True
        else:
            squeeze = False

        _, _, height, width = input_tensor.shape

        if self.training and self.initialized.item() == 0:
            self.initialize(input_tensor)
            self.initialized.fill_(1)

        h = self.scale * (input_tensor + self.loc)

        if squeeze:
            h = h.squeeze(-1).squeeze(-1)

        if self.logdet:
            log_abs = torch.log(torch.abs(self.scale))
            logdet = height * width * torch.sum(log_abs)
            logdet = logdet * torch.ones(input_tensor.shape[0]).to(input_tensor)
            return h, logdet

        return h

    def reverse(self, output):
        if self.training and self.initialized.item() == 0:
            if not self.allow_reverse_init:
                msg = "Initializing ActNorm in reverse direction is disabled by default. Use allow_reverse_init=True to enable."
                raise RuntimeError(msg)
            else:
                self.initialize(output)
                self.initialized.fill_(1)

        if len(output.shape) == 2:
            output = output[:, :, None, None]
            squeeze = True
        else:
            squeeze = False

        h = output / self.scale - self.loc

        if squeeze:
            h = h.squeeze(-1).squeeze(-1)
        return h
docs: add docstrings Wrote an openai script and custom prompt to generate them. 2023-12-15 20:31:28 +00:00			`"""Utilities for model checkpoint management and normalization layers"""`

feature: stable diffusion video (SVD) 2023-11-22 18:33:58 +00:00			`import hashlib`
			`import os`

			`import requests`
			`import torch`
			`import torch.nn as nn`
			`from tqdm import tqdm`

			`URL_MAP = {"vgg_lpips": "https://heibox.uni-heidelberg.de/f/607503859c864bc1b30b/?dl=1"}`

			`CKPT_MAP = {"vgg_lpips": "vgg.pth"}`

			`MD5_MAP = {"vgg_lpips": "d507d7349b931f0638a25a48a722f98a"}`


			`def download(url, local_path, chunk_size=1024):`
			`os.makedirs(os.path.split(local_path)[0], exist_ok=True)`
			`with requests.get(url, stream=True) as r, tqdm(`
			`total=int(r.headers.get("content-length", 0)), unit="B", unit_scale=True`
			`) as pbar, open(local_path, "wb") as f:`
			`for data in r.iter_content(chunk_size=chunk_size):`
			`if data:`
			`f.write(data)`
			`pbar.update(chunk_size)`


			`def md5_hash(path):`
			`with open(path, "rb") as f:`
			`content = f.read()`
			`return hashlib.md5(content).hexdigest()`


			`def get_ckpt_path(name, root, check=False):`
			`assert name in URL_MAP`
			`path = os.path.join(root, CKPT_MAP[name])`
			`if not os.path.exists(path) or (check and md5_hash(path) != MD5_MAP[name]):`
			`print(f"Downloading {name} model from {URL_MAP[name]} to {path}")`
			`download(URL_MAP[name], path)`
			`md5 = md5_hash(path)`
			`assert md5 == MD5_MAP[name], md5`
			`return path`


			`class ActNorm(nn.Module):`
			`def __init__(`
			`self, num_features, logdet=False, affine=True, allow_reverse_init=False`
			`):`
			`assert affine`
			`super().__init__()`
			`self.logdet = logdet`
			`self.loc = nn.Parameter(torch.zeros(1, num_features, 1, 1))`
			`self.scale = nn.Parameter(torch.ones(1, num_features, 1, 1))`
			`self.allow_reverse_init = allow_reverse_init`

			`self.register_buffer("initialized", torch.tensor(0, dtype=torch.uint8))`

			`def initialize(self, input_tensor):`
			`with torch.no_grad():`
			`flatten = (`
			`input_tensor.permute(1, 0, 2, 3)`
			`.contiguous()`
			`.view(input_tensor.shape[1], -1)`
			`)`
			`mean = (`
			`flatten.mean(1)`
			`.unsqueeze(1)`
			`.unsqueeze(2)`
			`.unsqueeze(3)`
			`.permute(1, 0, 2, 3)`
			`)`
			`std = (`
			`flatten.std(1)`
			`.unsqueeze(1)`
			`.unsqueeze(2)`
			`.unsqueeze(3)`
			`.permute(1, 0, 2, 3)`
			`)`

			`self.loc.data.copy_(-mean)`
			`self.scale.data.copy_(1 / (std + 1e-6))`

			`def forward(self, input_tensor, reverse=False):`
			`if reverse:`
			`return self.reverse(input_tensor)`
			`if len(input_tensor.shape) == 2:`
			`input_tensor = input_tensor[:, :, None, None]`
			`squeeze = True`
			`else:`
			`squeeze = False`

			`_, _, height, width = input_tensor.shape`

			`if self.training and self.initialized.item() == 0:`
			`self.initialize(input_tensor)`
			`self.initialized.fill_(1)`

			`h = self.scale * (input_tensor + self.loc)`

			`if squeeze:`
			`h = h.squeeze(-1).squeeze(-1)`

			`if self.logdet:`
			`log_abs = torch.log(torch.abs(self.scale))`
			`logdet = height * width * torch.sum(log_abs)`
			`logdet = logdet * torch.ones(input_tensor.shape[0]).to(input_tensor)`
			`return h, logdet`

			`return h`

			`def reverse(self, output):`
			`if self.training and self.initialized.item() == 0:`
			`if not self.allow_reverse_init:`
			`msg = "Initializing ActNorm in reverse direction is disabled by default. Use allow_reverse_init=True to enable."`
			`raise RuntimeError(msg)`
			`else:`
			`self.initialize(output)`
			`self.initialized.fill_(1)`

			`if len(output.shape) == 2:`
			`output = output[:, :, None, None]`
			`squeeze = True`
			`else:`
			`squeeze = False`

			`h = output / self.scale - self.loc`

			`if squeeze:`
			`h = h.squeeze(-1).squeeze(-1)`
			`return h`