Spaces:

jadechoghari
/

flux-kiwi

Runtime error

App Files Files Community

flux-kiwi / app.py

jadechoghari

Update app.py

dd7bda3 verified 6 days ago

raw

history blame

2.88 kB

	import gradio as gr
	import torch
	import spaces
	from diffusers import FluxPipeline, DiffusionPipeline
	from torchao.quantization import autoquant



	# # # normal FluxPipeline
	# pipeline_normal = FluxPipeline.from_pretrained(
	# "sayakpaul/FLUX.1-merged",
	# torch_dtype=torch.bfloat16
	# ).to("cuda")
	# pipeline_normal.transformer.to(memory_format=torch.channels_last)
	# pipeline_normal.transformer = torch.compile(pipeline_normal.transformer, mode="max-autotune", fullgraph=True)

	pipeline_normal = DiffusionPipeline.from_pretrained("sayakpaul/FLUX.1-merged")
	pipeline_normal.load_lora_weights("DarkMoonDragon/TurboRender-flux-dev")
	# # optimized FluxPipeline
	# pipeline_optimized = FluxPipeline.from_pretrained(
	# "camenduru/FLUX.1-dev-diffusers",
	# torch_dtype=torch.bfloat16
	# ).to("cuda")
	# pipeline_optimized.transformer.to(memory_format=torch.channels_last)
	# pipeline_optimized.transformer = torch.compile(
	# pipeline_optimized.transformer,
	# mode="max-autotune",
	# fullgraph=True
	# )
	# # wrap the autoquant call in a try-except block to handle unsupported layers
	# for name, layer in pipeline_optimized.transformer.named_children():
	# try:
	# # apply autoquant to each layer
	# pipeline_optimized.transformer._modules[name] = autoquant(layer, error_on_unseen=False)
	# print(f"Successfully quantized {name}")
	# except AttributeError as e:
	# print(f"Skipping layer {name} due to error: {e}")
	# except Exception as e:
	# print(f"Unexpected error while quantizing {name}: {e}")

	# pipeline_optimized.transformer = autoquant(
	# pipeline_optimized.transformer,
	# error_on_unseen=False
	# )
	pipeline_optimized = pipeline_normal

	@spaces.GPU(duration=120)
	def generate_images(prompt, guidance_scale, num_inference_steps):
	# # generate image with normal pipeline
	# image_normal = pipeline_normal(
	# prompt=prompt,
	# guidance_scale=guidance_scale,
	# num_inference_steps=int(num_inference_steps)
	# ).images[0]

	# generate image with optimized pipeline
	image_optimized = pipeline_optimized(
	prompt=prompt,
	guidance_scale=guidance_scale,
	num_inference_steps=int(num_inference_steps)
	).images[0]

	return image_optimized

	# set up Gradio interface
	demo = gr.Interface(
	fn=generate_images,
	inputs=[
	gr.Textbox(lines=2, placeholder="Enter your prompt here...", label="Prompt"),
	gr.Slider(1.0, 10.0, step=0.5, value=3.5, label="Guidance Scale"),
	gr.Slider(10, 100, step=1, value=50, label="Number of Inference Steps")
	],
	outputs=[
	gr.Image(type="pil", label="Optimized FluxPipeline")
	],
	title="FluxPipeline Comparison",
	description="Compare images generated by the normal FluxPipeline and the optimized one using torchao and torch.compile()."
	)

	demo.launch()