|
from diffusers import AutoPipelineForImage2Image, AutoPipelineForText2Image |
|
import torch |
|
import os |
|
|
|
try: |
|
import intel_extension_for_pytorch as ipex |
|
except: |
|
pass |
|
|
|
from PIL import Image |
|
import numpy as np |
|
import gradio as gr |
|
import psutil |
|
import time |
|
import math |
|
|
|
SAFETY_CHECKER = os.environ.get("SAFETY_CHECKER", None) |
|
TORCH_COMPILE = os.environ.get("TORCH_COMPILE", None) |
|
HF_TOKEN = os.environ.get("HF_TOKEN", None) |
|
|
|
mps_available = hasattr(torch.backends, "mps") and torch.backends.mps.is_available() |
|
xpu_available = hasattr(torch, "xpu") and torch.xpu.is_available() |
|
device = torch.device( |
|
"cuda" if torch.cuda.is_available() else "xpu" if xpu_available else "cpu" |
|
) |
|
torch_device = device |
|
torch_dtype = torch.float16 |
|
|
|
print(f"SAFETY_CHECKER: {SAFETY_CHECKER}") |
|
print(f"TORCH_COMPILE: {TORCH_COMPILE}") |
|
print(f"device: {device}") |
|
|
|
if mps_available: |
|
device = torch.device("mps") |
|
torch_device = "cpu" |
|
torch_dtype = torch.float32 |
|
|
|
if SAFETY_CHECKER == "True": |
|
i2i_pipe = AutoPipelineForImage2Image.from_pretrained( |
|
"stabilityai/sdxl-turbo", |
|
torch_dtype=torch_dtype, |
|
variant="fp16" if torch_dtype == torch.float16 else "fp32", |
|
) |
|
t2i_pipe = AutoPipelineForText2Image.from_pretrained( |
|
"stabilityai/sdxl-turbo", |
|
torch_dtype=torch_dtype, |
|
variant="fp16" if torch_dtype == torch.float16 else "fp32", |
|
) |
|
else: |
|
i2i_pipe = AutoPipelineForImage2Image.from_pretrained( |
|
"stabilityai/sdxl-turbo", |
|
safety_checker=None, |
|
torch_dtype=torch_dtype, |
|
variant="fp16" if torch_dtype == torch.float16 else "fp32", |
|
) |
|
t2i_pipe = AutoPipelineForText2Image.from_pretrained( |
|
"stabilityai/sdxl-turbo", |
|
safety_checker=None, |
|
torch_dtype=torch_dtype, |
|
variant="fp16" if torch_dtype == torch.float16 else "fp32", |
|
) |
|
|
|
t2i_pipe.to(device=torch_device, dtype=torch_dtype).to(device) |
|
t2i_pipe.set_progress_bar_config(disable=True) |
|
i2i_pipe.to(device=torch_device, dtype=torch_dtype).to(device) |
|
i2i_pipe.set_progress_bar_config(disable=True) |
|
|
|
def resize_crop(image, size=512): |
|
image = image.convert("RGB") |
|
w, h = image.size |
|
image = image.resize((size, int(size * (h / w))), Image.BICUBIC) |
|
return image |
|
|
|
|
|
selected_image_index = None |
|
|
|
|
|
image_folder = 'images' |
|
images = [Image.open(os.path.join(image_folder, img)) for img in sorted(os.listdir(image_folder)) if img.endswith(('.png', '.jpg', '.jpeg'))] |
|
|
|
|
|
assert len(images) == 34, "There should be exactly 34 images in the 'images' folder." |
|
|
|
|
|
async def select_fn(data: gr.SelectData, prompt: str): |
|
global selected_image_index |
|
selected_image_index = data.index |
|
if prompt == "": |
|
print("Prompt is empty, returning original image") |
|
return images[selected_image_index] |
|
return await predict(prompt) |
|
|
|
async def predict(prompt): |
|
global selected_image_index |
|
strength = 0.49999999999999999 |
|
steps = 2 |
|
if selected_image_index is not None: |
|
init_image = images[selected_image_index] |
|
init_image = resize_crop(init_image) |
|
generator = torch.manual_seed(123123) |
|
last_time = time.time() |
|
|
|
if int(steps * strength) < 1: |
|
steps = math.ceil(1 / max(0.10, strength)) |
|
|
|
results = i2i_pipe( |
|
prompt=prompt, |
|
image=init_image, |
|
generator=generator, |
|
num_inference_steps=steps, |
|
guidance_scale=0.0, |
|
strength=strength, |
|
width=512, |
|
height=512, |
|
output_type="pil", |
|
) |
|
|
|
print(f"Pipe took {time.time() - last_time} seconds") |
|
nsfw_content_detected = ( |
|
results.nsfw_content_detected[0] |
|
if "nsfw_content_detected" in results |
|
else False |
|
) |
|
if nsfw_content_detected: |
|
gr.Warning("NSFW content detected.") |
|
return Image.new("RGB", (512, 512)) |
|
return results.images[0] |
|
|
|
|
|
with gr.Blocks() as app: |
|
gr.Markdown('''# Rorschach π |
|
### 1. Select a CRASH REPORT image |
|
### 2. Describe what you see |
|
<small>CRASH REPORT was a self-published, 72-page book by NoPattern Studio released in November, 2019. Limited to an edition of 300, the book contained a year's worth of experimental, exploratory 3D imagery generated entirely in Photoshop. [CRASH REPORT site](https://nopattern.com/CRASH-REPORT) [see this space's lineage graph](https://huggingface.co/spaces/EQTYLab/lineage-explorer?repo=https://huggingface.co/NoPattern/Rorschach)</small>''', elem_id="main_title") |
|
|
|
with gr.Row(): |
|
with gr.Column(): |
|
image_gallery = gr.Gallery(value=images, columns=4) |
|
with gr.Column(): |
|
prompt = gr.Textbox(label="I see...") |
|
output = gr.Image(label="Generation") |
|
|
|
|
|
|
|
image_gallery.select(select_fn, inputs=[prompt], outputs=output, show_progress=False) |
|
|
|
prompt.change(fn=predict, inputs=[prompt], outputs=output, show_progress=False) |
|
|
|
|
|
app.queue() |
|
app.launch() |
|
|