|
|
from modules.prompt_parser import SdConditioning |
|
|
|
|
|
from base64 import b64decode as decode |
|
|
from io import BytesIO as bIO |
|
|
from PIL import Image |
|
|
import numpy as np |
|
|
import torch |
|
|
|
|
|
from scripts.ui_funcs import parse_mapping |
|
|
|
|
|
|
|
|
def empty_tensor(H: int, W: int): |
|
|
return torch.zeros((H, W)).unsqueeze(0) |
|
|
|
|
|
|
|
|
def advanced_mapping(sd_model, couples: list, WIDTH: int, HEIGHT: int, mapping: list): |
|
|
data = parse_mapping(mapping) |
|
|
assert len(couples) == len(data) |
|
|
|
|
|
ARGs: dict = {} |
|
|
IS_SDXL: bool = hasattr( |
|
|
sd_model.forge_objects.unet.model.diffusion_model, "label_emb" |
|
|
) |
|
|
|
|
|
for tile_index in range(len(data)): |
|
|
mask = torch.zeros((HEIGHT, WIDTH)) |
|
|
|
|
|
(X, Y, W) = data[tile_index] |
|
|
x_from = int(WIDTH * X[0]) |
|
|
x_to = int(WIDTH * X[1]) |
|
|
y_from = int(HEIGHT * Y[0]) |
|
|
y_to = int(HEIGHT * Y[1]) |
|
|
weight = W |
|
|
|
|
|
|
|
|
texts = SdConditioning([couples[tile_index]], False, WIDTH, HEIGHT, None) |
|
|
cond = sd_model.get_learned_conditioning(texts) |
|
|
pos_cond = [[cond["crossattn"]]] if IS_SDXL else [[cond]] |
|
|
|
|
|
|
|
|
|
|
|
mask[y_from:y_to, x_from:x_to] = weight |
|
|
|
|
|
|
|
|
ARGs[f"cond_{tile_index + 1}"] = pos_cond |
|
|
ARGs[f"mask_{tile_index + 1}"] = mask.unsqueeze(0) |
|
|
|
|
|
return ARGs |
|
|
|
|
|
|
|
|
def basic_mapping( |
|
|
sd_model, |
|
|
couples: list, |
|
|
WIDTH: int, |
|
|
HEIGHT: int, |
|
|
LINE_COUNT: int, |
|
|
IS_HORIZONTAL: bool, |
|
|
background: str, |
|
|
TILE_SIZE: int, |
|
|
TILE_WEIGHT: float, |
|
|
BG_WEIGHT: float, |
|
|
): |
|
|
|
|
|
ARGs: dict = {} |
|
|
IS_SDXL: bool = hasattr( |
|
|
sd_model.forge_objects.unet.model.diffusion_model, "label_emb" |
|
|
) |
|
|
|
|
|
for tile in range(LINE_COUNT): |
|
|
mask = torch.zeros((HEIGHT, WIDTH)) |
|
|
|
|
|
|
|
|
texts = SdConditioning([couples[tile]], False, WIDTH, HEIGHT, None) |
|
|
cond = sd_model.get_learned_conditioning(texts) |
|
|
pos_cond = [[cond["crossattn"]]] if IS_SDXL else [[cond]] |
|
|
|
|
|
|
|
|
|
|
|
if background == "First Line": |
|
|
if tile == 0: |
|
|
mask = torch.ones((HEIGHT, WIDTH)) * BG_WEIGHT |
|
|
else: |
|
|
if IS_HORIZONTAL: |
|
|
mask[:, (tile - 1) * TILE_SIZE : tile * TILE_SIZE] = TILE_WEIGHT |
|
|
else: |
|
|
mask[(tile - 1) * TILE_SIZE : tile * TILE_SIZE, :] = TILE_WEIGHT |
|
|
else: |
|
|
if IS_HORIZONTAL: |
|
|
mask[:, tile * TILE_SIZE : (tile + 1) * TILE_SIZE] = TILE_WEIGHT |
|
|
else: |
|
|
mask[tile * TILE_SIZE : (tile + 1) * TILE_SIZE, :] = TILE_WEIGHT |
|
|
|
|
|
|
|
|
ARGs[f"cond_{tile + 1}"] = pos_cond |
|
|
ARGs[f"mask_{tile + 1}"] = mask.unsqueeze(0) |
|
|
|
|
|
if background == "Last Line": |
|
|
ARGs[f"mask_{LINE_COUNT}"] = ( |
|
|
torch.ones((HEIGHT, WIDTH)) * BG_WEIGHT |
|
|
).unsqueeze(0) |
|
|
|
|
|
return ARGs |
|
|
|
|
|
|
|
|
def b64image2tensor(img: str, WIDTH: int, HEIGHT: int) -> torch.Tensor: |
|
|
image_bytes = decode(img) |
|
|
image = Image.open(bIO(image_bytes)).convert("L") |
|
|
|
|
|
if image.width != WIDTH or image.height != HEIGHT: |
|
|
image = image.resize((WIDTH, HEIGHT), resample=Image.Resampling.NEAREST) |
|
|
|
|
|
image = np.array(image).astype(np.float32) / 255.0 |
|
|
image = torch.from_numpy(image).unsqueeze(0) |
|
|
|
|
|
return image |
|
|
|
|
|
|
|
|
def mask_mapping( |
|
|
sd_model, |
|
|
couples: list, |
|
|
WIDTH: int, |
|
|
HEIGHT: int, |
|
|
LINE_COUNT: int, |
|
|
mapping: list[dict], |
|
|
background: str, |
|
|
BG_WEIGHT: float, |
|
|
): |
|
|
|
|
|
mapping = [ |
|
|
b64image2tensor(m["mask"], WIDTH, HEIGHT) * float(m["weight"]) for m in mapping |
|
|
] |
|
|
|
|
|
ARGs: dict = {} |
|
|
IS_SDXL: bool = hasattr( |
|
|
sd_model.forge_objects.unet.model.diffusion_model, "label_emb" |
|
|
) |
|
|
|
|
|
for layer in range(LINE_COUNT): |
|
|
mask = torch.zeros((HEIGHT, WIDTH)) |
|
|
|
|
|
|
|
|
texts = SdConditioning([couples[layer]], False, WIDTH, HEIGHT, None) |
|
|
cond = sd_model.get_learned_conditioning(texts) |
|
|
pos_cond = [[cond["crossattn"]]] if IS_SDXL else [[cond]] |
|
|
|
|
|
|
|
|
|
|
|
if background == "First Line": |
|
|
if layer == 0: |
|
|
mask = torch.ones((HEIGHT, WIDTH)) * BG_WEIGHT |
|
|
else: |
|
|
mask = mapping[layer - 1] |
|
|
else: |
|
|
mask = mapping[layer] |
|
|
|
|
|
|
|
|
ARGs[f"cond_{layer + 1}"] = pos_cond |
|
|
ARGs[f"mask_{layer + 1}"] = mask.unsqueeze(0) if mask.dim() == 2 else mask |
|
|
|
|
|
if background == "Last Line": |
|
|
ARGs[f"mask_{LINE_COUNT}"] = ( |
|
|
torch.ones((HEIGHT, WIDTH)) * BG_WEIGHT |
|
|
).unsqueeze(0) |
|
|
|
|
|
return ARGs |
|
|
|