imaginAIry/imaginairy/api.py

import logging
import os
import re
from contextlib import nullcontext
from functools import lru_cache

import numpy as np
import torch
import torch.nn
from einops import rearrange
from omegaconf import OmegaConf
from PIL import Image, ImageDraw, ImageFilter
from pytorch_lightning import seed_everything
from torch import autocast
from transformers import cached_path

from imaginairy.enhancers.face_restoration_codeformer import enhance_faces
from imaginairy.enhancers.upscale_realesrgan import upscale_image
from imaginairy.img_log import LatentLoggingContext, log_latent
from imaginairy.safety import is_nsfw, safety_models
from imaginairy.samplers.base import get_sampler
from imaginairy.schema import ImaginePrompt, ImagineResult
from imaginairy.utils import (
    fix_torch_nn_layer_norm,
    get_device,
    img_path_to_torch_image,
    instantiate_from_config,
)

LIB_PATH = os.path.dirname(__file__)
logger = logging.getLogger(__name__)

# leave undocumented. I'd ask that no one publicize this flag
IMAGINAIRY_ALLOW_NSFW = os.getenv("IMAGINAIRY_ALLOW_NSFW", "False")
IMAGINAIRY_ALLOW_NSFW = bool(IMAGINAIRY_ALLOW_NSFW == "I AM A RESPONSIBLE ADULT")


def load_model_from_config(config):
    url = "https://www.googleapis.com/storage/v1/b/aai-blog-files/o/sd-v1-4.ckpt?alt=media"
    ckpt_path = cached_path(url)
    logger.info(f"Loading model onto {get_device()} backend...")
    logger.debug(f"Loading model from {ckpt_path}")
    pl_sd = torch.load(ckpt_path, map_location="cpu")
    if "global_step" in pl_sd:
        logger.debug(f"Global Step: {pl_sd['global_step']}")
    sd = pl_sd["state_dict"]
    model = instantiate_from_config(config.model)
    m, u = model.load_state_dict(sd, strict=False)
    if len(m) > 0:
        logger.debug(f"missing keys: {m}")
    if len(u) > 0:
        logger.debug(f"unexpected keys: {u}")

    model.to(get_device())
    model.eval()
    return model


def patch_conv(**patch):
    """
    Patch to enable tiling mode
    https://github.com/replicate/cog-stable-diffusion/compare/main...TomMoore515:material_stable_diffusion:main
    """
    cls = torch.nn.Conv2d
    init = cls.__init__

    def __init__(self, *args, **kwargs):
        return init(self, *args, **kwargs, **patch)

    cls.__init__ = __init__


@lru_cache()
def load_model(tile_mode=False):
    if tile_mode:
        # generated images are tileable
        patch_conv(padding_mode="circular")

    config = "configs/stable-diffusion-v1.yaml"
    config = OmegaConf.load(f"{LIB_PATH}/{config}")
    model = load_model_from_config(config)

    model = model.to(get_device())
    return model


def imagine_image_files(
    prompts,
    outdir,
    latent_channels=4,
    downsampling_factor=8,
    precision="autocast",
    ddim_eta=0.0,
    record_step_images=False,
    output_file_extension="jpg",
    tile_mode=False,
):
    big_path = os.path.join(outdir, "upscaled")
    os.makedirs(outdir, exist_ok=True)

    base_count = len(os.listdir(outdir))
    output_file_extension = output_file_extension.lower()
    if output_file_extension not in {"jpg", "png"}:
        raise ValueError("Must output a png or jpg")

    def _record_step(img, description, step_count, prompt):
        steps_path = os.path.join(outdir, "steps", f"{base_count:08}_S{prompt.seed}")
        os.makedirs(steps_path, exist_ok=True)
        filename = f"{base_count:08}_S{prompt.seed}_step{step_count:04}.jpg"
        destination = os.path.join(steps_path, filename)
        draw = ImageDraw.Draw(img)
        draw.text((10, 10), str(description))
        img.save(destination)

    for result in imagine(
        prompts,
        latent_channels=latent_channels,
        downsampling_factor=downsampling_factor,
        precision=precision,
        ddim_eta=ddim_eta,
        img_callback=_record_step if record_step_images else None,
        tile_mode=tile_mode,
    ):
        prompt = result.prompt
        basefilename = f"{base_count:06}_{prompt.seed}_{prompt.sampler_type}{prompt.steps}_PS{prompt.prompt_strength}_{prompt_normalized(prompt.prompt_text)}"
        filepath = os.path.join(outdir, f"{basefilename}.jpg")

        result.save(filepath)
        logger.info(f"    🖼  saved to: {filepath}")
        if result.upscaled_img:
            os.makedirs(big_path, exist_ok=True)
            bigfilepath = os.path.join(big_path, basefilename) + "_upscaled.jpg"
            result.save_upscaled(bigfilepath)
            logger.info(f"    Upscaled 🖼  saved to: {bigfilepath}")
        base_count += 1


def imagine(
    prompts,
    latent_channels=4,
    downsampling_factor=8,
    precision="autocast",
    ddim_eta=0.0,
    img_callback=None,
    tile_mode=False,
    half_mode=None,
):
    model = load_model(tile_mode=tile_mode)

    if not IMAGINAIRY_ALLOW_NSFW:
        # needs to be loaded before we set default tensor type to half
        safety_models()
    # only run half-mode on cuda. run it by default
    half_mode = half_mode is None and get_device() == "cuda"
    if half_mode:
        model = model.half()
        # needed when model is in half mode, remove if not using half mode
        # torch.set_default_tensor_type(torch.HalfTensor)
    prompts = [ImaginePrompt(prompts)] if isinstance(prompts, str) else prompts
    prompts = [prompts] if isinstance(prompts, ImaginePrompt) else prompts
    _img_callback = None
    step_count = 0

    precision_scope = (
        autocast
        if precision == "autocast" and get_device() in ("cuda", "cpu")
        else nullcontext
    )
    with (torch.no_grad(), precision_scope(get_device()), fix_torch_nn_layer_norm()):
        for prompt in prompts:
            with LatentLoggingContext(
                prompt=prompt, model=model, img_callback=img_callback
            ):
                logger.info(f"Generating {prompt.prompt_description()}")
                seed_everything(prompt.seed)

                uc = None
                if prompt.prompt_strength != 1.0:
                    uc = model.get_learned_conditioning(1 * [""])
                total_weight = sum(wp.weight for wp in prompt.prompts)
                c = sum(
                    [
                        model.get_learned_conditioning(wp.text)
                        * (wp.weight / total_weight)
                        for wp in prompt.prompts
                    ]
                )

                shape = [
                    latent_channels,
                    prompt.height // downsampling_factor,
                    prompt.width // downsampling_factor,
                ]

                start_code = None
                sampler = get_sampler(prompt.sampler_type, model)
                if prompt.init_image:
                    generation_strength = 1 - prompt.init_image_strength
                    ddim_steps = int(prompt.steps / generation_strength)
                    sampler.make_schedule(ddim_num_steps=ddim_steps, ddim_eta=ddim_eta)

                    t_enc = int(generation_strength * ddim_steps)
                    init_image, w, h = img_path_to_torch_image(prompt.init_image)
                    init_image = init_image.to(get_device())
                    init_latent = model.get_first_stage_encoding(
                        model.encode_first_stage(init_image)
                    )
                    log_latent(init_latent, "init_latent")

                    # encode (scaled latent)
                    z_enc = sampler.stochastic_encode(
                        init_latent, torch.tensor([t_enc]).to(get_device())
                    )
                    log_latent(z_enc, "z_enc")

                    # decode it
                    samples = sampler.decode(
                        z_enc,
                        c,
                        t_enc,
                        unconditional_guidance_scale=prompt.prompt_strength,
                        unconditional_conditioning=uc,
                        img_callback=_img_callback,
                    )
                else:

                    samples, _ = sampler.sample(
                        num_steps=prompt.steps,
                        conditioning=c,
                        batch_size=1,
                        shape=shape,
                        unconditional_guidance_scale=prompt.prompt_strength,
                        unconditional_conditioning=uc,
                        eta=ddim_eta,
                        initial_noise_tensor=start_code,
                        img_callback=_img_callback,
                    )

                x_samples = model.decode_first_stage(samples)
                x_samples = torch.clamp((x_samples + 1.0) / 2.0, min=0.0, max=1.0)

                for x_sample in x_samples:
                    x_sample = 255.0 * rearrange(
                        x_sample.cpu().numpy(), "c h w -> h w c"
                    )
                    x_sample_8_orig = x_sample.astype(np.uint8)
                    img = Image.fromarray(x_sample_8_orig)
                    upscaled_img = None
                    if not IMAGINAIRY_ALLOW_NSFW and is_nsfw(
                        img, x_sample, half_mode=half_mode
                    ):
                        logger.info("    ⚠️  Filtering NSFW image")
                        img = img.filter(ImageFilter.GaussianBlur(radius=40))

                    if prompt.fix_faces:
                        logger.info("    Fixing 😊 's in 🖼  using GFPGAN...")
                        img = enhance_faces(img, fidelity=0.2)
                    if prompt.upscale:
                        logger.info("    Upscaling 🖼  using real-ESRGAN...")
                        upscaled_img = upscale_image(img)

                    yield ImagineResult(
                        img=img, prompt=prompt, upscaled_img=upscaled_img
                    )


def prompt_normalized(prompt):
    return re.sub(r"[^a-zA-Z0-9.,]+", "_", prompt)[:130]
refactor: use logging instead of prints 2 years ago			`import logging`
first commit 2 years ago			`import os`
			`import re`
			`from contextlib import nullcontext`
refactor: use logging instead of prints 2 years ago			`from functools import lru_cache`
first commit 2 years ago
			`import numpy as np`
			`import torch`
perf: performance optimizations from Doggettx https://github.com/CompVis/stable-diffusion/compare/main...Doggettx:stable-diffusion:autocast-improvements# https://www.reddit.com/r/StableDiffusion/comments/xalaws/test_update_for_less_memory_usage_and_higher/ 2 years ago			`import torch.nn`
first commit 2 years ago			`from einops import rearrange`
			`from omegaconf import OmegaConf`
feature: face enhancement and upscaling!! 2 years ago			`from PIL import Image, ImageDraw, ImageFilter`
first commit 2 years ago			`from pytorch_lightning import seed_everything`
			`from torch import autocast`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2 years ago			`from transformers import cached_path`
first commit 2 years ago
feature: face enhancement and upscaling!! 2 years ago			`from imaginairy.enhancers.face_restoration_codeformer import enhance_faces`
			`from imaginairy.enhancers.upscale_realesrgan import upscale_image`
feature: k-diffusion samplers - improved image logging functionality. can just stick log_latent wherever you want - improved some variable naming - moved all the samplers together - vendored k-diffusion library 2 years ago			`from imaginairy.img_log import LatentLoggingContext, log_latent`
perf: get "half" mode working when running on cuda 2 years ago			`from imaginairy.safety import is_nsfw, safety_models`
feature: k-diffusion samplers - improved image logging functionality. can just stick log_latent wherever you want - improved some variable naming - moved all the samplers together - vendored k-diffusion library 2 years ago			`from imaginairy.samplers.base import get_sampler`
feature: add ImageResult. step output option remove verbose args 2 years ago			`from imaginairy.schema import ImaginePrompt, ImagineResult`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2 years ago			`from imaginairy.utils import (`
refactor: run import sorter 2 years ago			`fix_torch_nn_layer_norm,`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2 years ago			`get_device,`
feature: (wip) better image to image I tried it with the DDIM sampler and it didn't work. Probably need to use the k-diffusion sampler with it from https://gist.githubusercontent.com/trygvebw/c71334dd127d537a15e9d59790f7f5e1/raw/a846393251f5be8289d4febc75a19f1f962aabcc/find_noise.py needs https://github.com/crowsonkb/k-diffusion 2 years ago			`img_path_to_torch_image,`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2 years ago			`instantiate_from_config,`
			`)`

first commit 2 years ago			`LIB_PATH = os.path.dirname(__file__)`
refactor: use logging instead of prints 2 years ago			`logger = logging.getLogger(__name__)`
first commit 2 years ago
feature: add nsfw image filter 2 years ago			`# leave undocumented. I'd ask that no one publicize this flag`
			`IMAGINAIRY_ALLOW_NSFW = os.getenv("IMAGINAIRY_ALLOW_NSFW", "False")`
			`IMAGINAIRY_ALLOW_NSFW = bool(IMAGINAIRY_ALLOW_NSFW == "I AM A RESPONSIBLE ADULT")`


feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2 years ago			`def load_model_from_config(config):`
feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2 years ago			`url = "https://www.googleapis.com/storage/v1/b/aai-blog-files/o/sd-v1-4.ckpt?alt=media"`
			`ckpt_path = cached_path(url)`
			`logger.info(f"Loading model onto {get_device()} backend...")`
			`logger.debug(f"Loading model from {ckpt_path}")`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2 years ago			`pl_sd = torch.load(ckpt_path, map_location="cpu")`
first commit 2 years ago			`if "global_step" in pl_sd:`
feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2 years ago			`logger.debug(f"Global Step: {pl_sd['global_step']}")`
first commit 2 years ago			`sd = pl_sd["state_dict"]`
			`model = instantiate_from_config(config.model)`
			`m, u = model.load_state_dict(sd, strict=False)`
feature: add ImageResult. step output option remove verbose args 2 years ago			`if len(m) > 0:`
feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2 years ago			`logger.debug(f"missing keys: {m}")`
feature: add ImageResult. step output option remove verbose args 2 years ago			`if len(u) > 0:`
feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2 years ago			`logger.debug(f"unexpected keys: {u}")`
first commit 2 years ago
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2 years ago			`model.to(get_device())`
first commit 2 years ago			`model.eval()`
			`return model`


perf: performance optimizations from Doggettx https://github.com/CompVis/stable-diffusion/compare/main...Doggettx:stable-diffusion:autocast-improvements# https://www.reddit.com/r/StableDiffusion/comments/xalaws/test_update_for_less_memory_usage_and_higher/ 2 years ago			`def patch_conv(**patch):`
feature: k-diffusion samplers - improved image logging functionality. can just stick log_latent wherever you want - improved some variable naming - moved all the samplers together - vendored k-diffusion library 2 years ago			`"""`
			`Patch to enable tiling mode`
			`https://github.com/replicate/cog-stable-diffusion/compare/main...TomMoore515:material_stable_diffusion:main`
			`"""`
perf: performance optimizations from Doggettx https://github.com/CompVis/stable-diffusion/compare/main...Doggettx:stable-diffusion:autocast-improvements# https://www.reddit.com/r/StableDiffusion/comments/xalaws/test_update_for_less_memory_usage_and_higher/ 2 years ago			`cls = torch.nn.Conv2d`
			`init = cls.__init__`

			`def __init__(self, args, *kwargs):`
			`return init(self, args, kwargs, *patch)`

			`cls.__init__ = __init__`


refactor: use logging instead of prints 2 years ago			`@lru_cache()`
perf: performance optimizations from Doggettx https://github.com/CompVis/stable-diffusion/compare/main...Doggettx:stable-diffusion:autocast-improvements# https://www.reddit.com/r/StableDiffusion/comments/xalaws/test_update_for_less_memory_usage_and_higher/ 2 years ago			`def load_model(tile_mode=False):`
			`if tile_mode:`
			`# generated images are tileable`
			`patch_conv(padding_mode="circular")`

feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2 years ago			`config = "configs/stable-diffusion-v1.yaml"`
refactor: use logging instead of prints 2 years ago			`config = OmegaConf.load(f"{LIB_PATH}/{config}")`
feature: Mac M1 Support out of box - auto-downloads checkpoints - fixes bug in torch - autoset environment variable 2 years ago			`model = load_model_from_config(config)`
refactor: use logging instead of prints 2 years ago
			`model = model.to(get_device())`
			`return model`


feature: add ImageResult. step output option remove verbose args 2 years ago			`def imagine_image_files(`
first commit 2 years ago			`prompts,`
feature: add ImageResult. step output option remove verbose args 2 years ago			`outdir,`
first commit 2 years ago			`latent_channels=4,`
			`downsampling_factor=8,`
			`precision="autocast",`
			`ddim_eta=0.0,`
feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2 years ago			`record_step_images=False,`
			`output_file_extension="jpg",`
feature: tile mode from https://github.com/replicate/cog-stable-diffusion/compare/main...TomMoore515:material_stable_diffusion:main 2 years ago			`tile_mode=False,`
first commit 2 years ago			`):`
feature: add ImageResult. step output option remove verbose args 2 years ago			`big_path = os.path.join(outdir, "upscaled")`
first commit 2 years ago			`os.makedirs(outdir, exist_ok=True)`
feature: face enhancement and upscaling!! 2 years ago
feature: add ImageResult. step output option remove verbose args 2 years ago			`base_count = len(os.listdir(outdir))`
feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2 years ago			`output_file_extension = output_file_extension.lower()`
			`if output_file_extension not in {"jpg", "png"}:`
			`raise ValueError("Must output a png or jpg")`
feature: add ImageResult. step output option remove verbose args 2 years ago
feature: k-diffusion samplers - improved image logging functionality. can just stick log_latent wherever you want - improved some variable naming - moved all the samplers together - vendored k-diffusion library 2 years ago			`def _record_step(img, description, step_count, prompt):`
feature: add ImageResult. step output option remove verbose args 2 years ago			`steps_path = os.path.join(outdir, "steps", f"{base_count:08}_S{prompt.seed}")`
			`os.makedirs(steps_path, exist_ok=True)`
feature: k-diffusion samplers - improved image logging functionality. can just stick log_latent wherever you want - improved some variable naming - moved all the samplers together - vendored k-diffusion library 2 years ago			`filename = f"{base_count:08}_S{prompt.seed}_step{step_count:04}.jpg"`
			`destination = os.path.join(steps_path, filename)`
			`draw = ImageDraw.Draw(img)`
			`draw.text((10, 10), str(description))`
			`img.save(destination)`

feature: face enhancement and upscaling!! 2 years ago			`for result in imagine(`
feature: add ImageResult. step output option remove verbose args 2 years ago			`prompts,`
			`latent_channels=latent_channels,`
			`downsampling_factor=downsampling_factor,`
			`precision=precision,`
			`ddim_eta=ddim_eta,`
feature: k-diffusion samplers - improved image logging functionality. can just stick log_latent wherever you want - improved some variable naming - moved all the samplers together - vendored k-diffusion library 2 years ago			`img_callback=_record_step if record_step_images else None,`
feature: tile mode from https://github.com/replicate/cog-stable-diffusion/compare/main...TomMoore515:material_stable_diffusion:main 2 years ago			`tile_mode=tile_mode,`
feature: add ImageResult. step output option remove verbose args 2 years ago			`):`
			`prompt = result.prompt`
			`basefilename = f"{base_count:06}_{prompt.seed}_{prompt.sampler_type}{prompt.steps}_PS{prompt.prompt_strength}_{prompt_normalized(prompt.prompt_text)}"`
			`filepath = os.path.join(outdir, f"{basefilename}.jpg")`

feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2 years ago			`result.save(filepath)`
			`logger.info(f" 🖼 saved to: {filepath}")`
feature: face enhancement and upscaling!! 2 years ago			`if result.upscaled_img:`
			`os.makedirs(big_path, exist_ok=True)`
			`bigfilepath = os.path.join(big_path, basefilename) + "_upscaled.jpg"`
			`result.save_upscaled(bigfilepath)`
			`logger.info(f" Upscaled 🖼 saved to: {bigfilepath}")`
feature: add ImageResult. step output option remove verbose args 2 years ago			`base_count += 1`


feature: face enhancement and upscaling!! 2 years ago			`def imagine(`
feature: add ImageResult. step output option remove verbose args 2 years ago			`prompts,`
			`latent_channels=4,`
			`downsampling_factor=8,`
			`precision="autocast",`
			`ddim_eta=0.0,`
			`img_callback=None,`
feature: tile mode from https://github.com/replicate/cog-stable-diffusion/compare/main...TomMoore515:material_stable_diffusion:main 2 years ago			`tile_mode=False,`
perf: get "half" mode working when running on cuda 2 years ago			`half_mode=None,`
feature: add ImageResult. step output option remove verbose args 2 years ago			`):`
feature: tile mode from https://github.com/replicate/cog-stable-diffusion/compare/main...TomMoore515:material_stable_diffusion:main 2 years ago			`model = load_model(tile_mode=tile_mode)`
feature: face enhancement and upscaling!! 2 years ago
perf: get "half" mode working when running on cuda 2 years ago			`if not IMAGINAIRY_ALLOW_NSFW:`
			`# needs to be loaded before we set default tensor type to half`
			`safety_models()`
			`# only run half-mode on cuda. run it by default`
feature: face enhancement and upscaling!! 2 years ago			`half_mode = half_mode is None and get_device() == "cuda"`
perf: get "half" mode working when running on cuda 2 years ago			`if half_mode:`
			`model = model.half()`
			`# needed when model is in half mode, remove if not using half mode`
feature: face enhancement and upscaling!! 2 years ago			`# torch.set_default_tensor_type(torch.HalfTensor)`
feature: add ImageResult. step output option remove verbose args 2 years ago			`prompts = [ImaginePrompt(prompts)] if isinstance(prompts, str) else prompts`
			`prompts = [prompts] if isinstance(prompts, ImaginePrompt) else prompts`
			`_img_callback = None`
feature: k-diffusion samplers - improved image logging functionality. can just stick log_latent wherever you want - improved some variable naming - moved all the samplers together - vendored k-diffusion library 2 years ago			`step_count = 0`
first commit 2 years ago
feature: cleaned up logging - cleans up all the logging. hide most of it - create better readme. show example images - save metadata into image 2 years ago			`precision_scope = (`
			`autocast`
			`if precision == "autocast" and get_device() in ("cuda", "cpu")`
			`else nullcontext`
			`)`
			`with (torch.no_grad(), precision_scope(get_device()), fix_torch_nn_layer_norm()):`
first commit 2 years ago			`for prompt in prompts:`
feature: k-diffusion samplers - improved image logging functionality. can just stick log_latent wherever you want - improved some variable naming - moved all the samplers together - vendored k-diffusion library 2 years ago			`with LatentLoggingContext(`
			`prompt=prompt, model=model, img_callback=img_callback`
			`):`
			`logger.info(f"Generating {prompt.prompt_description()}")`
			`seed_everything(prompt.seed)`

			`uc = None`
			`if prompt.prompt_strength != 1.0:`
			`uc = model.get_learned_conditioning(1 * [""])`
			`total_weight = sum(wp.weight for wp in prompt.prompts)`
			`c = sum(`
			`[`
			`model.get_learned_conditioning(wp.text)`
			`* (wp.weight / total_weight)`
			`for wp in prompt.prompts`
			`]`
feature: image prompts 2 years ago			`)`
first commit 2 years ago
feature: k-diffusion samplers - improved image logging functionality. can just stick log_latent wherever you want - improved some variable naming - moved all the samplers together - vendored k-diffusion library 2 years ago			`shape = [`
			`latent_channels,`
			`prompt.height // downsampling_factor,`
			`prompt.width // downsampling_factor,`
			`]`
feature: face enhancement and upscaling!! 2 years ago
feature: k-diffusion samplers - improved image logging functionality. can just stick log_latent wherever you want - improved some variable naming - moved all the samplers together - vendored k-diffusion library 2 years ago			`start_code = None`
			`sampler = get_sampler(prompt.sampler_type, model)`
			`if prompt.init_image:`
			`generation_strength = 1 - prompt.init_image_strength`
			`ddim_steps = int(prompt.steps / generation_strength)`
			`sampler.make_schedule(ddim_num_steps=ddim_steps, ddim_eta=ddim_eta)`

			`t_enc = int(generation_strength * ddim_steps)`
			`init_image, w, h = img_path_to_torch_image(prompt.init_image)`
			`init_image = init_image.to(get_device())`
			`init_latent = model.get_first_stage_encoding(`
			`model.encode_first_stage(init_image)`
			`)`
			`log_latent(init_latent, "init_latent")`

			`# encode (scaled latent)`
			`z_enc = sampler.stochastic_encode(`
			`init_latent, torch.tensor([t_enc]).to(get_device())`
			`)`
			`log_latent(z_enc, "z_enc")`

			`# decode it`
			`samples = sampler.decode(`
			`z_enc,`
			`c,`
			`t_enc,`
			`unconditional_guidance_scale=prompt.prompt_strength,`
			`unconditional_conditioning=uc,`
			`img_callback=_img_callback,`
			`)`
			`else:`

			`samples, _ = sampler.sample(`
			`num_steps=prompt.steps,`
			`conditioning=c,`
			`batch_size=1,`
			`shape=shape,`
			`unconditional_guidance_scale=prompt.prompt_strength,`
			`unconditional_conditioning=uc,`
			`eta=ddim_eta,`
			`initial_noise_tensor=start_code,`
			`img_callback=_img_callback,`
			`)`

			`x_samples = model.decode_first_stage(samples)`
			`x_samples = torch.clamp((x_samples + 1.0) / 2.0, min=0.0, max=1.0)`

			`for x_sample in x_samples:`
			`x_sample = 255.0 * rearrange(`
			`x_sample.cpu().numpy(), "c h w -> h w c"`
			`)`
			`x_sample_8_orig = x_sample.astype(np.uint8)`
			`img = Image.fromarray(x_sample_8_orig)`
			`upscaled_img = None`
			`if not IMAGINAIRY_ALLOW_NSFW and is_nsfw(`
			`img, x_sample, half_mode=half_mode`
			`):`
			`logger.info(" ⚠️ Filtering NSFW image")`
			`img = img.filter(ImageFilter.GaussianBlur(radius=40))`

			`if prompt.fix_faces:`
			`logger.info(" Fixing 😊 's in 🖼 using GFPGAN...")`
			`img = enhance_faces(img, fidelity=0.2)`
			`if prompt.upscale:`
			`logger.info(" Upscaling 🖼 using real-ESRGAN...")`
			`upscaled_img = upscale_image(img)`

			`yield ImagineResult(`
			`img=img, prompt=prompt, upscaled_img=upscaled_img`
			`)`
first commit 2 years ago

			`def prompt_normalized(prompt):`
			`return re.sub(r"[^a-zA-Z0-9.,]+", "_", prompt)[:130]`