Code-Cooker / app.py
Severian's picture
Update app.py
c952c72 verified
raw
history blame
24.6 kB
import torch
import gradio as gr
from PIL import Image
import qrcode
from pathlib import Path
from multiprocessing import cpu_count
import requests
import io
import os
from PIL import Image
import spaces
import numpy as np
import cv2
from pyzxing import BarCodeReader
from PIL import ImageOps
from diffusers import (
StableDiffusionPipeline,
StableDiffusionControlNetImg2ImgPipeline,
StableDiffusionControlNetPipeline,
ControlNetModel,
DDIMScheduler,
DPMSolverMultistepScheduler,
DEISMultistepScheduler,
HeunDiscreteScheduler,
EulerDiscreteScheduler,
)
qrcode_generator = qrcode.QRCode(
version=1,
error_correction=qrcode.ERROR_CORRECT_H,
box_size=10,
border=4,
)
# Define available models
CONTROLNET_MODELS = {
"QR Code Monster": "monster-labs/control_v1p_sd15_qrcode_monster",
"QR Code": "DionTimmer/controlnet_qrcode-control_v1p_sd15",
# Add more ControlNet models here
}
DIFFUSION_MODELS = {
"Stable Diffusion v1.5": "ckpt/sd15",
"GhostMix": "sinkinai/GhostMix-V2-BakedVae",
"Real-Dream": "stablediffusionapi/edge-of-realism",
# Add more diffusion models here
}
def load_models(controlnet_model, diffusion_model):
controlnet = ControlNetModel.from_pretrained(
CONTROLNET_MODELS[controlnet_model],
torch_dtype=torch.float16
).to("cuda")
pipe = StableDiffusionControlNetImg2ImgPipeline.from_pretrained(
DIFFUSION_MODELS[diffusion_model],
controlnet=controlnet,
torch_dtype=torch.float16,
safety_checker=None,
).to("cuda")
return pipe
def resize_for_condition_image(input_image: Image.Image, resolution: int):
input_image = input_image.convert("RGB")
W, H = input_image.size
k = float(resolution) / min(H, W)
H *= k
W *= k
H = int(round(H / 64.0)) * 64
W = int(round(W / 64.0)) * 64
img = input_image.resize((W, H), resample=Image.LANCZOS)
return img
SAMPLER_MAP = {
"DPM++ Karras SDE": lambda config: DPMSolverMultistepScheduler.from_config(config, use_karras=True, algorithm_type="sde-dpmsolver++"),
"DPM++ Karras": lambda config: DPMSolverMultistepScheduler.from_config(config, use_karras=True),
"Heun": lambda config: HeunDiscreteScheduler.from_config(config),
"Euler": lambda config: EulerDiscreteScheduler.from_config(config),
"DDIM": lambda config: DDIMScheduler.from_config(config),
"DEIS": lambda config: DEISMultistepScheduler.from_config(config),
}
def scan_qr_code(image):
# Convert gradio image to PIL Image if necessary
if isinstance(image, np.ndarray):
image = Image.fromarray(image)
# Convert to grayscale
gray_image = image.convert('L')
# Convert to numpy array
np_image = np.array(gray_image)
# Method 1: Using qrcode library
try:
qr = qrcode.QRCode()
qr.add_data('')
qr.decode(gray_image)
return qr.data.decode('utf-8')
except Exception:
pass
# Method 2: Using OpenCV
try:
qr_detector = cv2.QRCodeDetector()
retval, decoded_info, points, straight_qrcode = qr_detector.detectAndDecodeMulti(np_image)
if retval:
return decoded_info[0]
except Exception:
pass
# Method 3: Fallback to zxing-cpp
try:
reader = BarCodeReader()
results = reader.decode(np_image)
if results:
return results[0].parsed
except Exception:
pass
return None
def invert_image(image):
if image is None:
return None
if isinstance(image, np.ndarray):
return 255 - image
elif isinstance(image, Image.Image):
return ImageOps.invert(image.convert('RGB'))
else:
raise ValueError("Unsupported image type")
def invert_displayed_image(image):
if image is None:
return None
inverted = invert_image(image)
if isinstance(inverted, np.ndarray):
return Image.fromarray(inverted)
return inverted
#@spaces.GPU()
def inference(
qr_code_content: str,
prompt: str,
negative_prompt: str,
guidance_scale: float = 10.0,
controlnet_conditioning_scale: float = 2.0,
strength: float = 0.8,
seed: int = -1,
init_image: Image.Image | None = None,
qrcode_image: Image.Image | None = None,
use_qr_code_as_init_image = True,
sampler = "DPM++ Karras SDE",
bg_color: str = "white",
qr_color: str = "black",
invert_final_image: bool = False,
invert_init_image: bool = False, # New parameter
controlnet_model: str = "QR Code Monster",
diffusion_model: str = "Stable Diffusion v1.5",
):
try:
# Load models based on user selection
pipe = load_models(controlnet_model, diffusion_model)
if prompt is None or prompt == "":
raise gr.Error("Prompt is required")
if qrcode_image is None and qr_code_content == "":
raise gr.Error("QR Code Image or QR Code Content is required")
pipe.scheduler = SAMPLER_MAP[sampler](pipe.scheduler.config)
if seed == -1:
seed = torch.randint(0, 2**32 - 1, (1,)).item()
generator = torch.manual_seed(seed)
if qr_code_content != "" or qrcode_image.size == (1, 1):
print("Generating QR Code from content")
qr = qrcode.QRCode(
version=1,
error_correction=qrcode.constants.ERROR_CORRECT_H,
box_size=10,
border=4,
)
qr.add_data(qr_code_content)
qr.make(fit=True)
qrcode_image = qr.make_image(fill_color=qr_color, back_color=bg_color)
qrcode_image = resize_for_condition_image(qrcode_image, 768)
else:
print("Using QR Code Image")
qrcode_image = resize_for_condition_image(qrcode_image, 768)
# Determine which image to use as init_image and control_image
if use_qr_code_as_init_image:
init_image = qrcode_image
control_image = qrcode_image
else:
control_image = qrcode_image
if init_image is None:
# If no init_image provided, set strength to 1.0 to generate a new image
strength = 1.0
# Adjust strength if using an init_image
if init_image is not None:
strength = min(strength, 0.8) # Cap strength at 0.8 when using init_image
# Invert init_image if requested
if invert_init_image and init_image is not None:
init_image = invert_image(init_image)
out = pipe(
prompt=prompt,
negative_prompt=negative_prompt,
image=init_image,
control_image=control_image,
width=768,
height=768,
guidance_scale=float(guidance_scale),
controlnet_conditioning_scale=float(controlnet_conditioning_scale),
generator=generator,
strength=float(strength),
num_inference_steps=50,
)
final_image = out.images[0]
if invert_final_image:
final_image = invert_image(final_image)
return final_image, seed
except Exception as e:
print(f"Error in inference: {str(e)}")
# Return a blank image and -1 as seed in case of an error
return Image.new('RGB', (768, 768), color='white'), -1
def invert_init_image_display(image):
if image is None:
return None
inverted = invert_image(image)
if isinstance(inverted, np.ndarray):
return Image.fromarray(inverted)
return inverted
with gr.Blocks(theme='Hev832/Applio') as blocks:
gr.Markdown(
"""
![Yamamoto Logo](/static-proxy?url=https%3A%2F%2Fcdn-uploads.huggingface.co%2Fproduction%2Fuploads%2F64740cf7485a7c8e1bd51ac9%2F_VyYxp5qE_nRZ_LJqBxmL.webp)%3C%2Fspan%3E%3C!-- HTML_TAG_END -->
# 🎨 Yamamoto QR Code Art Generator
## Transform Your QR Codes into Brand Masterpieces
Welcome to Yamamoto's innovative QR Code Art Generator! This cutting-edge tool empowers our creative team to craft
visually stunning, on-brand QR codes that perfectly blend functionality with artistic expression.
## 🚀 How It Works:
1. **Enter Your QR Code Content**: Start by inputting the URL or text for your QR code.
2. **Craft Your Prompt**: Describe the artistic style or theme you envision for your QR code.
3. **Fine-tune with Advanced Settings**: Adjust parameters to perfect your creation (see tips below).
4. **Generate and Iterate**: Click 'Run' to create your art, then refine as needed.
## 🌟 Tips for Spectacular Results:
- **Artistic Freedom**: Set between 0.8 and 0.95 for a balance of creativity and scannability.
- **QR Code Visibility**: Aim for 0.6 to 2.0 to ensure your code is both artistic and functional.
- **Prompt Crafting**: Use vivid, specific descriptions that align with your brand identity.
- **Experimentation**: Don't hesitate to try different settings and prompts to find your perfect style!
## 🎭 Prompt Ideas to Spark Your Creativity:
- "A serene Japanese garden with cherry blossoms and a koi pond"
- "A futuristic cityscape with neon lights and flying cars"
- "An abstract painting with swirling colors and geometric shapes"
- "A vintage-style travel poster featuring iconic landmarks"
Remember, the magic lies in the details of your prompt and the fine-tuning of your settings.
Happy creating!
"""
)
with gr.Row():
with gr.Column():
qr_code_content = gr.Textbox(
label="QR Code Content",
placeholder="Enter URL or text for your QR code",
info="This is what your QR code will link to or display when scanned.",
)
with gr.Accordion(label="QR Code Image (Optional)", open=False):
qr_code_image = gr.Image(
label="QR Code Image (Optional). Leave blank to automatically generate QR code",
type="pil",
)
prompt = gr.Textbox(
label="Artistic Prompt",
placeholder="Describe the style or theme for your QR code art",
value="A high-resolution, photo-realistic minimalist rendering of Mount Fuji, depicted as a sharp, semi-realistic silhouette of a mountain range on the horizon. The mountain evokes strength and motion with clean, crisp lines and a sense of natural flow. The scene should feature detailed snow textures, subtle highlights on the mountain ridges, and a powerful yet serene atmosphere. The rendering should emphasize the strength of the mountain with a focus on clarity and precision in both texture and light. (Sharp outlines:1.5), (Photo-realistic:1.4), (Detailed textures:1.3), (Minimalist:1.3), (Semi-realistic:1.3), (Monochrome contrast:1.2), (Crisp detail:1.2), (Evoking strength:1.2), inspired by traditional Japanese woodblock prints, nature photography, and minimalist design principles.",
info="Be specific and creative! This guides the AI in creating your unique QR code art.",
)
negative_prompt = gr.Textbox(
label="Elements to Avoid",
placeholder="Describe what you don't want in the image",
value="ugly, disfigured, low quality, blurry, nsfw, bad_pictures, (bad_prompt_version2:0.8), EasyNegative, 3d, cartoon, anime, sketches, (worst quality:2), (low quality:2), (normal quality:2), lowres, normal quality, ((monochrome)), ((grayscale)), poorly drawn, distorted, overexposed, flat shading, bad proportions, deformed, pixelated, messy details, lack of contrast, unrealistic textures, bad anatomy, rough edges, low resolution, text artifacts.",
info="List elements or styles you want to avoid in your QR code art.",
)
use_qr_code_as_init_image = gr.Checkbox(
label="Use QR code as init image",
value=True,
interactive=True,
info="Whether init image should be QR code. Unclick to pass init image or generate init image with Stable Diffusion 2.1"
)
with gr.Accordion(label="Init Images (Optional)", open=False, visible=True) as init_image_acc:
init_image = gr.Image(label="Init Image (Optional). Leave blank to generate image with AI", type="pil")
with gr.Row():
invert_init_image = gr.Checkbox(
label="Invert Init Image",
value=False,
info="Check this to invert the colors of the init image"
)
invert_init_image_button = gr.Button("Invert Init Image")
with gr.Accordion("Advanced Art Controls", open=True):
controlnet_conditioning_scale = gr.Slider(
minimum=0.0,
maximum=5.0,
step=0.01,
value=1.3,
label="QR Code Visibility",
)
gr.Markdown(
"""
**QR Code Visibility** determines how much the QR code itself stands out in the final design. Think of it like balancing between how "artistic" the image looks and how "functional" the QR code is.
- **Low settings (0.0-0.5)**: If you choose a lower value, the QR code will blend more into the art, and it might be hard to scan with a phone. This setting is great if you want the image to look amazing, but you might lose some of the scannability. Try this if you care more about art and less about the QR code being easily recognized.
- **Medium settings (0.6-1.5)**: This is the sweet spot where the QR code remains clearly visible while still blending in with the art. You can still scan it easily with a phone, but it looks more creative. For most users, setting it around **1.1** is a great start to balance both art and function.
- **High settings (1.6-5.0)**: If you need to make sure that the QR code is super easy to scan, even if it means the image looks less like art and more like a regular QR code, then choose a higher value. This is ideal when functionality is the main goal, and the artistic side can take a backseat.
Start with **1.3** if you're unsure, and adjust up or down depending on whether you want the QR code to be more artistic or more functional.
"""
)
strength = gr.Slider(
minimum=0.0,
maximum=1.0,
step=0.01,
value=0.9,
label="Artistic Freedom",
)
gr.Markdown(
"""
**Artistic Freedom** controls how much the AI is allowed to change the QR code's look to match your description. It's like telling the AI how creative it can get with your QR code:
- **Low settings (0.0-0.3)**: If you set this low, the AI will make small changes and your QR code will look more like a regular, plain QR code. This is useful if you want something that is still creative but not too wild, keeping it simple and easy to scan.
- **Medium settings (0.4-0.7)**: Here, the AI will add more artistic touches but keep the QR code recognizable. You get the best of both worlds—your QR code will have some creative flair, but it will still be easy to scan. For most cases, setting it to **0.6** is a great way to keep the code functional and artistic.
- **High settings (0.8-1.0)**: If you set this high, the AI will go all-out creative. The QR code will look amazing, but it might be difficult to scan because the art can start to take over the code. This setting is perfect if you're aiming for a highly creative piece of art and don't mind if it's a bit harder to scan. Start at **0.9** to explore creative but functional designs.
"""
)
guidance_scale = gr.Slider(
minimum=0.0,
maximum=50.0,
step=0.25,
value=7.5,
label="Follow the Prompt",
)
gr.Markdown(
"""
**Follow the Prompt** tells the AI how closely it should follow your description when creating the QR code art. Think of it like giving the AI instructions on how strict or flexible it can be with your design ideas:
- **Low settings (0-5)**: If you choose a lower value, the AI has more freedom to get creative on its own and may not stick too closely to your description. This is great if you want to see how the AI interprets your ideas in unexpected ways.
- **Medium settings (5-15)**: This is a good balance where the AI will mostly follow your prompt but will also add some of its own creative touches. If you want to see some surprises but still want the design to look like what you described, start at around **7.5**.
- **High settings (15+)**: If you choose a higher value, the AI will stick very closely to what you wrote in the description. This is good if you have a very specific idea and don't want the AI to change much. Just keep in mind that this might limit the AI's creativity.
Start at **7.5** for a balanced approach where the AI follows your ideas but still adds some artistic flair.
"""
)
sampler = gr.Dropdown(
choices=list(SAMPLER_MAP.keys()),
value="DPM++ Karras SDE",
label="Art Style",
)
gr.Markdown(
"""
**Art Style** changes how the AI creates the image, using different methods (or "samplers"). Each method has a different effect on how detailed or artistic the final QR code looks:
- **DPM++ Karras SDE**: This is a great all-around option for creating high-quality, detailed images. It's a good place to start if you want a balance of sharpness and creativity.
- **Euler**: This method creates very sharp, detailed images, making the QR code look crisp and clear. Choose this if you want a precise, well-defined design.
- **DDIM**: This method is better if you want the QR code to have a more artistic, abstract style. It's great for when you want the QR code to look like a piece of modern art.
Feel free to experiment with different samplers to see what works best for the look you're going for!
"""
)
seed = gr.Slider(
minimum=-1,
maximum=9999999999,
step=1,
value=-1,
label="Creative Seed",
randomize=False,
)
gr.Markdown(
"""
**Creative Seed** controls whether the AI creates a completely new design each time or sticks to a specific design. Think of it like a recipe: with the same seed number, you get the same "recipe" for your QR code every time.
- **-1**: This setting makes the AI create something completely new every time you run it. Use this if you want to explore different design ideas with each attempt.
- **Any other number**: If you set a specific number, the AI will always create the same image based on that number. This is useful if you find a design you like and want to recreate it exactly.
Try **-1** if you want to explore and generate different designs. If you find something you really love, write down the seed number and use it again to recreate the same design.
"""
)
with gr.Accordion("QR Code Customization", open=True):
bg_color = gr.ColorPicker(
label="Background Color",
value="#FFFFFF",
info="Choose the background color for the QR code"
)
qr_color = gr.ColorPicker(
label="QR Code Color",
value="#000000",
info="Choose the color for the QR code pattern"
)
invert_final_image = gr.Checkbox(
label="Invert Final Image",
value=False,
info="Check this to invert the colors of the final image"
)
with gr.Accordion("Model Selection", open=True):
controlnet_model_dropdown = gr.Dropdown(
choices=list(CONTROLNET_MODELS.keys()),
value="QR Code Monster",
label="ControlNet Model",
info="Select the ControlNet model for QR code generation"
)
diffusion_model_dropdown = gr.Dropdown(
choices=list(DIFFUSION_MODELS.keys()),
value="Stable Diffusion v1.5",
label="Diffusion Model",
info="Select the main diffusion model for image generation"
)
with gr.Row():
run_btn = gr.Button("🎨 Create Your QR Art", variant="primary")
with gr.Column():
result_image = gr.Image(label="Your Artistic QR Code")
used_seed = gr.Number(label="Seed Used", interactive=False)
with gr.Row():
scan_button = gr.Button("Scan QR Code")
invert_button = gr.Button("Invert Image")
scan_result = gr.Textbox(label="Scan Result", interactive=False)
gr.Markdown(
"""
### 🔍 Analyzing Your Creation
- Is the QR code scannable? Click the 'Scan QR Code' button to test.
- Does the art style match your prompt? If not, try adjusting the 'Prompt Adherence'.
- Want more artistic flair? Increase the 'Artistic Freedom'.
- Need a clearer QR code? Raise the 'QR Code Visibility'.
Remember, creating the perfect QR art is a journey of experimentation and refinement.
Enjoy the process of bringing your unique vision to life!
"""
)
def scan_and_display(image):
if image is None:
return "No image to scan"
scanned_text = scan_qr_code(image)
if scanned_text:
return f"Scanned successfully: {scanned_text}"
else:
return "Failed to scan QR code. Try adjusting the settings for better visibility."
def invert_displayed_image(image):
if image is None:
return None
return invert_image(image)
scan_button.click(
scan_and_display,
inputs=[result_image],
outputs=[scan_result]
)
invert_button.click(
invert_displayed_image,
inputs=[result_image],
outputs=[result_image]
)
invert_init_image_button.click(
invert_init_image_display,
inputs=[init_image],
outputs=[init_image]
)
run_btn.click(
inference,
inputs=[
qr_code_content,
prompt,
negative_prompt,
guidance_scale,
controlnet_conditioning_scale,
strength,
seed,
init_image,
qr_code_image,
use_qr_code_as_init_image,
sampler,
bg_color,
qr_color,
invert_final_image,
invert_init_image,
controlnet_model_dropdown,
diffusion_model_dropdown,
],
outputs=[result_image, used_seed],
concurrency_limit=20
)
blocks.queue(max_size=20)
blocks.launch(share=False, show_api=True)