Spaces:

jadechoghari
/

flux-kiwi

Runtime error

File size: 2,075 Bytes

import gradio as gr
import torch
import spaces
from diffusers import FluxPipeline


try:
    from torchao.quantization import autoquant
except ImportError:
    raise ImportError("torchao is not installed. Please install it to use the optimized pipeline.")

# normal FluxPipeline
pipeline_normal = FluxPipeline.from_pretrained(
    "sayakpaul/FLUX.1-merged",
    torch_dtype=torch.bfloat16
).to("cuda")

# optimized FluxPipeline
pipeline_optimized = FluxPipeline.from_pretrained(
    "sayakpaul/FLUX.1-merged",
    torch_dtype=torch.bfloat16
).to("cuda")

pipeline_optimized.transformer.to(memory_format=torch.channels_last)
pipeline_optimized.transformer = torch.compile(
    pipeline_optimized.transformer,
    mode="max-autotune",
    fullgraph=True
)

pipeline_optimized.transformer = autoquant(
    pipeline_optimized.transformer,
    error_on_unseen=False
)

@spaces.GPU
def generate_images(prompt, guidance_scale, num_inference_steps):
    # generate image with normal pipeline
    image_normal = pipeline_normal(
        prompt=prompt,
        guidance_scale=guidance_scale,
        num_inference_steps=int(num_inference_steps)
    ).images[0]
    
    # generate image with optimized pipeline
    image_optimized = pipeline_optimized(
        prompt=prompt,
        guidance_scale=guidance_scale,
        num_inference_steps=int(num_inference_steps)
    ).images[0]
    
    return image_normal, image_optimized

# set up Gradio interface
demo = gr.Interface(
    fn=generate_images,
    inputs=[
        gr.Textbox(lines=2, placeholder="Enter your prompt here...", label="Prompt"),
        gr.Slider(1.0, 10.0, step=0.5, value=3.5, label="Guidance Scale"),
        gr.Slider(10, 100, step=1, value=50, label="Number of Inference Steps")
    ],
    outputs=[
        gr.Image(type="pil", label="Normal FluxPipeline"),
        gr.Image(type="pil", label="Optimized FluxPipeline")
    ],
    title="FluxPipeline Comparison",
    description="Compare images generated by the normal FluxPipeline and the optimized one using torchao and torch.compile()."
)

demo.launch()