imaginAIry/imaginairy/img_utils.py

from typing import Sequence

import numpy as np
import PIL
import torch
from einops import rearrange, repeat
from PIL import Image

from imaginairy.utils import get_device


def pillow_fit_image_within(
    image: PIL.Image.Image, max_height=512, max_width=512, convert="RGB", snap_size=8
):
    """Convert an image's mode and rescale it toward the target bounds.

    The image is first converted to the ``convert`` mode.  If either side is
    larger than its limit, the image is scaled down so both sides fit.  If
    both sides are strictly smaller than their limits, the image is scaled
    up.  Finally each side is rounded down to a multiple of ``snap_size``
    (but never below ``snap_size`` itself).

    Args:
        image: source Pillow image; it is not modified in place.
        max_height: height limit in pixels.
        max_width: width limit in pixels.
        convert: Pillow mode name passed to ``image.convert``.
        snap_size: output width and height are multiples of this value.

    Returns:
        The converted image, resized with LANCZOS resampling when its size
        differs from the computed target size.
    """
    image = image.convert(convert)
    w, h = image.size
    resize_ratio = 1
    if w > max_width or h > max_height:
        resize_ratio = min(max_width / w, max_height / h)
    elif w < max_width and h < max_height:
        # It's smaller than our target on both axes: enlarge.
        # NOTE(review): this takes the larger of the two ratios, so for a
        # non-matching aspect ratio one side ends up beyond its limit --
        # confirm that "cover" rather than "fit" is intended here.
        resize_ratio = max(max_width / w, max_height / h)

    if resize_ratio != 1:
        w, h = int(w * resize_ratio), int(h * resize_ratio)
    # Snap down to an integer multiple of snap_size.  Clamp to one snap unit
    # so that a very thin image (a side smaller than snap_size after scaling)
    # does not produce a zero-sized target, which cannot be resized to.
    w = max(snap_size, w - w % snap_size)
    h = max(snap_size, h - h % snap_size)

    if (w, h) != image.size:
        image = image.resize((w, h), resample=Image.Resampling.LANCZOS)
    return image


def pillow_img_to_torch_image(img: PIL.Image.Image):
    """Turn a Pillow image into a float32 torch tensor scaled to [-1, 1].

    The image is converted to RGB, its 0-255 pixel values are divided by 255,
    a leading batch axis of size 1 is added and the channel axis is moved
    ahead of the spatial axes, giving a ``(1, 3, height, width)`` tensor.
    """
    rgb_pixels = np.array(img.convert("RGB"))
    unit_scaled = rgb_pixels.astype(np.float32) / 255.0
    # (h, w, c) -> (1, h, w, c) -> (1, c, h, w)
    batched_chw = np.expand_dims(unit_scaled, 0).transpose(0, 3, 1, 2)
    tensor = torch.from_numpy(batched_chw)
    # Map [0, 1] onto [-1, 1].
    return 2.0 * tensor - 1.0


def pillow_img_to_opencv_img(img: PIL.Image.Image):
    """Return the image's pixels as a numpy array in BGR channel order.

    The image is converted to RGB before the channels are reversed, so the
    result always has three channels regardless of the input mode.  Without
    that step an RGBA image would come out as ABGR and a single-channel
    image (2-D array) would fail on the three-axis slice.

    Returns:
        A new ``height x width x 3`` array (a copy, not a view of the
        image's data).
    """
    rgb_pixels = np.array(img.convert("RGB"))
    # Reverse the last axis (RGB -> BGR); copy so callers get a standalone
    # array rather than a reversed view.
    return rgb_pixels[:, :, ::-1].copy()


def model_latents_to_pillow_imgs(latents: torch.Tensor) -> Sequence[PIL.Image.Image]:
    """Decode a batch of latents into a list of Pillow images.

    The latents are decoded with the current diffusion model's
    ``decode_first_stage``; the result is mapped through ``(x + 1) / 2``,
    clamped to [0, 1], scaled by 255 and cast to uint8 (the cast truncates).
    One image is produced per item along the first axis.
    """
    # Imported lazily inside the function, as in the original layout.
    from imaginairy.model_manager import get_current_diffusion_model  # noqa

    decoded = get_current_diffusion_model().decode_first_stage(latents)
    unit_range = ((decoded + 1.0) / 2.0).clamp(min=0.0, max=1.0)

    def _to_pillow(sample):
        # Channels-first tensor -> channels-last array that Pillow accepts.
        hwc = rearrange(sample.cpu().numpy(), "c h w -> h w c")
        return Image.fromarray((255.0 * hwc).astype(np.uint8))

    return [_to_pillow(sample) for sample in unit_range]


def pillow_img_to_model_latent(model, img, batch_size=1, half=True):
    """Encode a Pillow image into the model's first-stage latent.

    The image is turned into a tensor with ``pillow_img_to_torch_image``,
    moved to the device returned by ``get_device()`` and repeated
    ``batch_size`` times along the leading axis.  When ``half`` is true the
    batch is cast with ``.half()`` before being encoded.

    Returns:
        ``model.get_first_stage_encoding(model.encode_first_stage(batch))``.
    """
    single = pillow_img_to_torch_image(img).to(get_device())
    batch = repeat(single, "1 ... -> b ...", b=batch_size)
    if half:
        batch = batch.half()
    encoded = model.encode_first_stage(batch)
    return model.get_first_stage_encoding(encoded)


def make_gif_image(filepath, imgs, duration=1000, loop=0):
    """Save a sequence of images to ``filepath`` as one multi-frame file.

    The first image's ``save`` method is called with ``save_all=True`` and
    the remaining images passed as ``append_images``; ``duration`` and
    ``loop`` are forwarded unchanged and ``optimize`` is disabled.
    """
    first_frame = imgs[0]
    later_frames = imgs[1:]
    save_options = {
        "save_all": True,
        "append_images": later_frames,
        "duration": duration,
        "loop": loop,
        "optimize": False,
    }
    first_frame.save(filepath, **save_options)
feature: boolean logic masks Specify advanced text based masks using boolean logic and strength modifiers. Mask descriptions must be lowercase. Keywords uppercase. Valid symbols: `AND`, `OR`, `NOT`, `()`, and mask strength modifier `{1.5}` where `+` can be any of `+ - /`. Single-character boolean operators also work. When writing strength modifies know that pixel values are between 0 and 1. - feature: apply mask edits to original files - feature: auto-rotate images if exif data specifies to do so - fix: accept mask images in command line 2022-09-24 05:58:48 +00:00			`from typing import Sequence`

			`import numpy as np`
			`import PIL`
			`import torch`
			`from einops import rearrange, repeat`
			`from PIL import Image`

			`from imaginairy.utils import get_device`


feature: finetuning - feature: finetuning your own image models - feature: image prep command. crops to face or other interesting parts of photo - fix: back-compat for hf_hub_download - feature: add prune-ckpt command - feature: allow specification of model config file 2023-01-01 22:54:49 +00:00			`def pillow_fit_image_within(`
feature: image sizes can now be multiples of 8 instead of 64 from https://github.com/CompVis/stable-diffusion/issues/60#issuecomment-1240294667 2023-01-24 06:25:56 +00:00			`image: PIL.Image.Image, max_height=512, max_width=512, convert="RGB", snap_size=8`
feature: finetuning - feature: finetuning your own image models - feature: image prep command. crops to face or other interesting parts of photo - fix: back-compat for hf_hub_download - feature: add prune-ckpt command - feature: allow specification of model config file 2023-01-01 22:54:49 +00:00			`):`
			`image = image.convert(convert)`
feature: boolean logic masks Specify advanced text based masks using boolean logic and strength modifiers. Mask descriptions must be lowercase. Keywords uppercase. Valid symbols: `AND`, `OR`, `NOT`, `()`, and mask strength modifier `{1.5}` where `+` can be any of `+ - /`. Single-character boolean operators also work. When writing strength modifies know that pixel values are between 0 and 1. - feature: apply mask edits to original files - feature: auto-rotate images if exif data specifies to do so - fix: accept mask images in command line 2022-09-24 05:58:48 +00:00			`w, h = image.size`
fix: handle small input images If input images didn't need resizing because they were already smaller than max width/height then they didn't get normalized to a multiple of 64. This caused an exception like the following: ```Sizes of tensors must match except in dimension 1. Expected size 4 but got size 3 for tensor number 1 in the list. ``` 2022-10-06 06:13:48 +00:00			`resize_ratio = 1`
fix: masking now works properly at strengths 0 and 1 2022-09-24 21:41:25 +00:00			`if w > max_width or h > max_height:`
			`resize_ratio = min(max_width / w, max_height / h)`
fix: handle small input images If input images didn't need resizing because they were already smaller than max width/height then they didn't get normalized to a multiple of 64. This caused an exception like the following: ```Sizes of tensors must match except in dimension 1. Expected size 4 but got size 3 for tensor number 1 in the list. ``` 2022-10-06 06:13:48 +00:00			`elif w < max_width and h < max_height:`
			`# it's smaller than our target image, enlarge`
			`resize_ratio = max(max_width / w, max_height / h)`

			`if resize_ratio != 1:`
fix: masking now works properly at strengths 0 and 1 2022-09-24 21:41:25 +00:00			`w, h = int(w * resize_ratio), int(h * resize_ratio)`
feature: image sizes can now be multiples of 8 instead of 64 from https://github.com/CompVis/stable-diffusion/issues/60#issuecomment-1240294667 2023-01-24 06:25:56 +00:00			`# resize to integer multiple of snap_size`
			`w -= w % snap_size`
			`h -= h % snap_size`
lint: new ruff linter 2023-01-02 04:14:22 +00:00
fix: handle small input images If input images didn't need resizing because they were already smaller than max width/height then they didn't get normalized to a multiple of 64. This caused an exception like the following: ```Sizes of tensors must match except in dimension 1. Expected size 4 but got size 3 for tensor number 1 in the list. ``` 2022-10-06 06:13:48 +00:00			`if (w, h) != image.size:`
fix: masking now works properly at strengths 0 and 1 2022-09-24 21:41:25 +00:00			`image = image.resize((w, h), resample=Image.Resampling.LANCZOS)`
style: fix lint issues 2022-09-24 07:29:45 +00:00			`return image`
feature: boolean logic masks Specify advanced text based masks using boolean logic and strength modifiers. Mask descriptions must be lowercase. Keywords uppercase. Valid symbols: `AND`, `OR`, `NOT`, `()`, and mask strength modifier `{1.5}` where `+` can be any of `+ - /`. Single-character boolean operators also work. When writing strength modifies know that pixel values are between 0 and 1. - feature: apply mask edits to original files - feature: auto-rotate images if exif data specifies to do so - fix: accept mask images in command line 2022-09-24 05:58:48 +00:00

			`def pillow_img_to_torch_image(img: PIL.Image.Image):`
			`img = img.convert("RGB")`
			`img = np.array(img).astype(np.float32) / 255.0`
			`img = img[None].transpose(0, 3, 1, 2)`
			`img = torch.from_numpy(img)`
			`return 2.0 * img - 1.0`


			`def pillow_img_to_opencv_img(img: PIL.Image.Image):`
			`open_cv_image = np.array(img)`
			`# Convert RGB to BGR`
			`open_cv_image = open_cv_image[:, :, ::-1].copy()`
			`return open_cv_image`


			`def model_latents_to_pillow_imgs(latents: torch.Tensor) -> Sequence[PIL.Image.Image]:`
feature: inpainting model support; improved model manager 2022-10-23 21:46:45 +00:00			`from imaginairy.model_manager import get_current_diffusion_model # noqa`
feature: boolean logic masks Specify advanced text based masks using boolean logic and strength modifiers. Mask descriptions must be lowercase. Keywords uppercase. Valid symbols: `AND`, `OR`, `NOT`, `()`, and mask strength modifier `{1.5}` where `+` can be any of `+ - /`. Single-character boolean operators also work. When writing strength modifies know that pixel values are between 0 and 1. - feature: apply mask edits to original files - feature: auto-rotate images if exif data specifies to do so - fix: accept mask images in command line 2022-09-24 05:58:48 +00:00
feature: inpainting model support; improved model manager 2022-10-23 21:46:45 +00:00			`model = get_current_diffusion_model()`
feature: boolean logic masks Specify advanced text based masks using boolean logic and strength modifiers. Mask descriptions must be lowercase. Keywords uppercase. Valid symbols: `AND`, `OR`, `NOT`, `()`, and mask strength modifier `{1.5}` where `+` can be any of `+ - /`. Single-character boolean operators also work. When writing strength modifies know that pixel values are between 0 and 1. - feature: apply mask edits to original files - feature: auto-rotate images if exif data specifies to do so - fix: accept mask images in command line 2022-09-24 05:58:48 +00:00			`latents = model.decode_first_stage(latents)`
			`latents = torch.clamp((latents + 1.0) / 2.0, min=0.0, max=1.0)`
			`imgs = []`
			`for latent in latents:`
			`latent = 255.0 * rearrange(latent.cpu().numpy(), "c h w -> h w c")`
			`img = Image.fromarray(latent.astype(np.uint8))`
			`imgs.append(img)`
			`return imgs`


			`def pillow_img_to_model_latent(model, img, batch_size=1, half=True):`
			`# init_image = pil_img_to_torch(img, half=half).to(device)`
			`init_image = pillow_img_to_torch_image(img).to(get_device())`
			`init_image = repeat(init_image, "1 ... -> b ...", b=batch_size)`
			`if half:`
			`return model.get_first_stage_encoding(`
			`model.encode_first_stage(init_image.half())`
			`)`
			`return model.get_first_stage_encoding(model.encode_first_stage(init_image))`
feature: image edit gifs and demo-reels 2023-01-22 01:36:47 +00:00

			`def make_gif_image(filepath, imgs, duration=1000, loop=0):`

			`imgs[0].save(`
			`filepath,`
			`save_all=True,`
			`append_images=imgs[1:],`
			`duration=duration,`
			`loop=loop,`
			`optimize=False,`
			`)`