| from diffusers import AutoPipelineForImage2Image, AutoPipelineForText2Image |
| import torch |
| import os |
|
|
| try: |
| import intel_extension_for_pytorch as ipex |
| except: |
| pass |
|
|
| from PIL import Image |
| import numpy as np |
| import gradio as gr |
| import psutil |
| import time |
| import math |
|
|
| SAFETY_CHECKER = os.environ.get("SAFETY_CHECKER", None) |
| TORCH_COMPILE = os.environ.get("TORCH_COMPILE", None) |
| HF_TOKEN = os.environ.get("HF_TOKEN", None) |
| |
| mps_available = hasattr(torch.backends, "mps") and torch.backends.mps.is_available() |
| xpu_available = hasattr(torch, "xpu") and torch.xpu.is_available() |
| device = torch.device( |
| "cuda" if torch.cuda.is_available() else "xpu" if xpu_available else "cpu" |
| ) |
| torch_device = device |
| torch_dtype = torch.float16 |
|
|
| print(f"SAFETY_CHECKER: {SAFETY_CHECKER}") |
| print(f"TORCH_COMPILE: {TORCH_COMPILE}") |
| print(f"device: {device}") |
|
|
| if mps_available: |
| device = torch.device("mps") |
| torch_device = "cpu" |
| torch_dtype = torch.float32 |
|
|
| if SAFETY_CHECKER == "True": |
| i2i_pipe = AutoPipelineForImage2Image.from_pretrained( |
| "stabilityai/sdxl-turbo", |
| torch_dtype=torch_dtype, |
| variant="fp16" if torch_dtype == torch.float16 else "fp32", |
| ) |
| t2i_pipe = AutoPipelineForText2Image.from_pretrained( |
| "stabilityai/sdxl-turbo", |
| torch_dtype=torch_dtype, |
| variant="fp16" if torch_dtype == torch.float16 else "fp32", |
| ) |
| else: |
| i2i_pipe = AutoPipelineForImage2Image.from_pretrained( |
| "stabilityai/sdxl-turbo", |
| safety_checker=None, |
| torch_dtype=torch_dtype, |
| variant="fp16" if torch_dtype == torch.float16 else "fp32", |
| ) |
| t2i_pipe = AutoPipelineForText2Image.from_pretrained( |
| "stabilityai/sdxl-turbo", |
| safety_checker=None, |
| torch_dtype=torch_dtype, |
| variant="fp16" if torch_dtype == torch.float16 else "fp32", |
| ) |
|
|
| t2i_pipe.to(device=torch_device, dtype=torch_dtype).to(device) |
| t2i_pipe.set_progress_bar_config(disable=True) |
| i2i_pipe.to(device=torch_device, dtype=torch_dtype).to(device) |
| i2i_pipe.set_progress_bar_config(disable=True) |
|
|
| def resize_crop(image, size=512): |
| image = image.convert("RGB") |
| w, h = image.size |
| image = image.resize((size, int(size * (h / w))), Image.BICUBIC) |
| return image |
|
|
| |
| selected_image_index = None |
|
|
| |
| image_folder = 'images' |
| images = [Image.open(os.path.join(image_folder, img)) for img in sorted(os.listdir(image_folder)) if img.endswith(('.png', '.jpg', '.jpeg'))] |
|
|
| |
| assert len(images) == 34, "There should be exactly 34 images in the 'images' folder." |
|
|
| |
| async def select_fn(data: gr.SelectData, prompt: str): |
| global selected_image_index |
| selected_image_index = data.index |
| if prompt == "": |
| print("Prompt is empty, returning original image") |
| return images[selected_image_index] |
| return await predict(prompt) |
| |
| async def predict(prompt): |
| global selected_image_index |
| strength = 0.49999999999999999 |
| steps = 2 |
| if selected_image_index is not None: |
| init_image = images[selected_image_index] |
| init_image = resize_crop(init_image) |
| generator = torch.manual_seed(123123) |
| last_time = time.time() |
| |
| if int(steps * strength) < 1: |
| steps = math.ceil(1 / max(0.10, strength)) |
| |
| results = i2i_pipe( |
| prompt=prompt, |
| image=init_image, |
| generator=generator, |
| num_inference_steps=steps, |
| guidance_scale=0.0, |
| strength=strength, |
| width=512, |
| height=512, |
| output_type="pil", |
| ) |
|
|
| print(f"Pipe took {time.time() - last_time} seconds") |
| nsfw_content_detected = ( |
| results.nsfw_content_detected[0] |
| if "nsfw_content_detected" in results |
| else False |
| ) |
| if nsfw_content_detected: |
| gr.Warning("NSFW content detected.") |
| return Image.new("RGB", (512, 512)) |
| return results.images[0] |
|
|
| |
| with gr.Blocks() as app: |
| gr.Markdown('''# Rorschach 🎭 |
| ### 1. Select a CRASH REPORT image |
| ### 2. Describe what you see |
| <small>CRASH REPORT was a self-published, 72-page book by NoPattern Studio released in November, 2019. Limited to an edition of 300, the book contained a year's worth of experimental, exploratory 3D imagery generated entirely in Photoshop. [CRASH REPORT site](https://nopattern.com/CRASH-REPORT) [see this space's lineage graph](https://huggingface.co/spaces/EQTYLab/lineage-explorer?repo=https://huggingface.co/NoPattern/Rorschach)</small>''', elem_id="main_title") |
| |
| with gr.Row(): |
| with gr.Column(): |
| image_gallery = gr.Gallery(value=images, columns=4) |
| with gr.Column(): |
| prompt = gr.Textbox(label="I see...") |
| output = gr.Image(label="Generation") |
|
|
| |
|
|
| image_gallery.select(select_fn, inputs=[prompt], outputs=output, show_progress=False) |
| |
| prompt.change(fn=predict, inputs=[prompt], outputs=output, show_progress=False) |
|
|
| |
| app.queue() |
| app.launch() |
|
|