Spaces:

baulab
/

SliderSpace

Running on Zero

App Files Files Community

SliderSpace / app.py

RohitGandikota

Update app.py

85c8011 verified 2 days ago

raw

history blame

21.3 kB

	import gradio as gr
	import numpy as np
	import random
	import os
	import spaces #[uncomment to use ZeroGPU]
	from diffusers import DiffusionPipeline
	import torch
	from diffusers import DiffusionPipeline, UNet2DConditionModel, LCMScheduler, AutoencoderTiny, FluxPipeline
	from huggingface_hub import hf_hub_download
	from safetensors.torch import load_file
	import sys
	sys.path.append('.')
	from utils.lora import LoRANetwork, DEFAULT_TARGET_REPLACE, UNET_TARGET_REPLACE_MODULE_CONV



	# Model configurations
	# Concept names offered in the "SliderSpace Concept" dropdown while the
	# SDXL-DMD model is selected.
	SDXL_CONCEPTS = [
	    "alien",
	    "ancient ruins",
	    "animal",
	    "bike",
	    "car",
	    "Citadel",
	    "coral",
	    "cowboy",
	    "face",
	    "futuristic cities",
	    "monster",
	    "mystical creature",
	    "planet",
	    "plant",
	    "robot",
	    "sculpture",
	    "spaceship",
	    "statue",
	    "studio",
	    "video game",
	    "wizard",
	]

	# Concept names offered for any other model choice (FLUX-Schnell). Same order
	# as the SDXL list, without "coral", "cowboy", "monster" and "sculpture".
	FLUX_CONCEPTS = [
	    "alien", "ancient ruins", "animal", "bike", "car", "Citadel",
	    "face", "futuristic cities", "mystical creature", "planet",
	    "plant", "robot", "spaceship", "statue", "studio",
	    "video game", "wizard",
	]




	# Hub identifiers: the SDXL base pipeline, and the repository / file that
	# holds the replacement UNet weights.
	model_repo_id = "stabilityai/stable-diffusion-xl-base-1.0"
	repo_name = "tianweiy/DMD2"
	ckpt_name = "dmd2_sdxl_4step_unet_fp16.bin"

	# bfloat16 when CUDA is available, float32 on CPU.
	device = "cuda" if torch.cuda.is_available() else "cpu"
	torch_dtype = torch.bfloat16 if torch.cuda.is_available() else torch.float32

	# Load model.
	# The UNet is built from the base repo's config only, then filled with the
	# checkpoint downloaded from `repo_name`.
	unet = UNet2DConditionModel.from_config(model_repo_id, subfolder="unet")
	unet = unet.to(device, torch_dtype)
	unet.load_state_dict(torch.load(hf_hub_download(repo_name, ckpt_name)))

	# Assemble the pipeline around that UNet, then swap in the LCM scheduler and
	# the tiny SDXL autoencoder.
	pipe = DiffusionPipeline.from_pretrained(
	    model_repo_id,
	    unet=unet,
	    torch_dtype=torch_dtype,
	).to(device)
	pipe.scheduler = LCMScheduler.from_config(pipe.scheduler.config)
	pipe.vae = AutoencoderTiny.from_pretrained(
	    "madebyollin/taesdxl",
	    torch_dtype=torch_dtype,
	).to(device)

	unet = pipe.unet

	## Change these parameters based on how you trained your sliderspace sliders
	train_method = 'xattn-strict'
	rank = 1
	alpha = 1
	networks = {}
	# NOTE(review): `modules` is not read again in the visible source, but if
	# DEFAULT_TARGET_REPLACE is a list the `+=` below extends the imported object
	# in place. LoRANetwork may rely on that side effect -- confirm in
	# utils/lora.py before simplifying these two lines.
	modules = DEFAULT_TARGET_REPLACE
	modules += UNET_TARGET_REPLACE_MODULE_CONV
	# A single LoRA network, stored under key 0 (the key `infer` uses).
	for i in range(1):
	    networks[i] = LoRANetwork(
	        unet,
	        rank=int(rank),
	        multiplier=1.0,
	        alpha=int(alpha),
	        train_method=train_method,
	        fast_init=True,
	    ).to(device, dtype=torch_dtype)



	# Upper bounds used by the seed slider / random seed and the size sliders.
	MAX_SEED = np.iinfo(np.int32).max
	MAX_IMAGE_SIZE = 1024


	# FLUX pipeline: base model with its VAE replaced by the tiny FLUX autoencoder.
	base_model_id = "black-forest-labs/FLUX.1-schnell"
	max_sequence_length = 256
	flux_pipe = FluxPipeline.from_pretrained(
	    base_model_id,
	    torch_dtype=torch_dtype,
	)
	flux_pipe.vae = AutoencoderTiny.from_pretrained(
	    "madebyollin/taef1",
	    torch_dtype=torch_dtype,
	)
	# The whole pipeline (including the replaced VAE) is moved in one step.
	flux_pipe = flux_pipe.to(device)
	# pipe.enable_sequential_cpu_offload()
	transformer = flux_pipe.transformer

	## Change these parameters based on how you trained your sliderspace sliders
	# These rebind the module-level names already set for the SDXL network.
	train_method = 'flux-attn'
	rank = 1
	alpha = 1

	flux_networks = {}
	# NOTE(review): `modules` is not read again in the visible source, but if
	# DEFAULT_TARGET_REPLACE is a list the `+=` below extends the imported object
	# in place (a second time, after the SDXL setup). Confirm in utils/lora.py
	# whether LoRANetwork depends on this before changing it.
	modules = DEFAULT_TARGET_REPLACE
	modules += UNET_TARGET_REPLACE_MODULE_CONV
	# A single LoRA network on the FLUX transformer, stored under key 0.
	for i in range(1):
	    flux_networks[i] = LoRANetwork(
	        transformer,
	        rank=int(rank),
	        multiplier=1.0,
	        alpha=int(alpha),
	        train_method=train_method,
	        fast_init=True,
	    ).to(device, dtype=torch_dtype)


	def update_sliderspace_choices(model_choice):
	    """Return a concept dropdown matching the selected model.

	    "SDXL-DMD" selects SDXL_CONCEPTS; any other value selects FLUX_CONCEPTS.
	    The first entry of the chosen list becomes the selected value.
	    """
	    if model_choice == "SDXL-DMD":
	        concepts = SDXL_CONCEPTS
	    else:
	        concepts = FLUX_CONCEPTS
	    return gr.Dropdown(
	        choices=concepts,
	        label="SliderSpace Concept",
	        value=concepts[0],
	    )

	def _slider_weights_path(weights_root, slider_space, discovered_directions):
	    """Return the weight-file path for one discovered direction of a concept.

	    ``discovered_directions`` is a dropdown label such as ``"Slider 3"``. The
	    number after the last space is 1-based, while the file name uses that
	    number minus one (``"Slider 1"`` -> ``slider_0.pt``).

	    Raises:
	        ValueError: if the text after the last space is not an integer.
	    """
	    slider_index = int(discovered_directions.split(' ')[-1]) - 1
	    return f"{weights_root}/{slider_space}/slider_{slider_index}.pt"


	def _render_pair(pipeline, lora_networks, weights_path, slider_scale, seed, call_kwargs):
	    """Render the same request twice: outside and inside the LoRA context.

	    Args:
	        pipeline: Callable pipeline whose result exposes ``.images``.
	        lora_networks: Dict of LoRA networks; every entry receives the weights
	            and the scale, entry ``0`` is the one used as context manager.
	        weights_path: File passed to ``torch.load``.
	        slider_scale: Value handed to ``set_lora_slider``.
	        seed: Integer seed; a fresh generator is seeded for each render.
	        call_kwargs: Keyword arguments shared by both pipeline calls.

	    Returns:
	        ``(image, slider_image)`` -- the first image of each render.
	    """
	    # Read the file once; it is the same for every network in the dict.
	    # NOTE(review): torch.load unpickles the file, so the weight directories
	    # must only contain trusted checkpoints.
	    state_dict = torch.load(weights_path)
	    for lora in lora_networks.values():
	        lora.load_state_dict(state_dict)
	        lora.set_lora_slider(slider_scale)

	    active_lora = lora_networks[0]
	    # Enter and immediately leave the context before the baseline render.
	    # NOTE(review): presumably leaving the context switches the LoRA off so the
	    # "original" image is unaffected -- confirm in utils/lora.py; do not remove.
	    with active_lora:
	        pass

	    # original image
	    generator = torch.Generator().manual_seed(seed)
	    image = pipeline(generator=generator, **call_kwargs).images[0]

	    # edited image: same seed, rendered inside the LoRA context
	    generator = torch.Generator().manual_seed(seed)
	    with active_lora:
	        slider_image = pipeline(generator=generator, **call_kwargs).images[0]

	    return image, slider_image


	@spaces.GPU #[uncomment to use ZeroGPU]
	def infer(
	    prompt,
	    negative_prompt,
	    seed,
	    randomize_seed,
	    width,
	    height,
	    guidance_scale,
	    num_inference_steps,
	    slider_space,
	    discovered_directions,
	    slider_scale,
	    model_choice,
	    progress=gr.Progress(track_tqdm=True),
	):
	    """Generate an image and its slider-edited counterpart from one seed.

	    ``model_choice == 'SDXL-DMD'`` uses the SDXL pipeline with weights from
	    ``sliderspace_weights/``; any other value uses the FLUX pipeline with
	    weights from ``flux_sliderspace_weights/``. ``negative_prompt`` is only
	    forwarded to the SDXL pipeline.

	    Returns:
	        ``(image, slider_image, seed)`` where ``seed`` is the seed actually
	        used (freshly drawn when ``randomize_seed`` is true).
	    """
	    if randomize_seed:
	        seed = random.randint(0, MAX_SEED)
	    # manual_seed needs an integer; coerce in case the UI delivers e.g. 42.0.
	    seed = int(seed)

	    # Arguments common to both pipelines and to both renders.
	    call_kwargs = dict(
	        prompt=prompt,
	        guidance_scale=guidance_scale,
	        num_inference_steps=num_inference_steps,
	        width=width,
	        height=height,
	    )

	    if model_choice == 'SDXL-DMD':
	        call_kwargs["negative_prompt"] = negative_prompt
	        pipeline, lora_networks = pipe, networks
	        weights_root = "sliderspace_weights"
	    else:
	        # Module-level constant (256) instead of a repeated literal.
	        call_kwargs["max_sequence_length"] = max_sequence_length
	        pipeline, lora_networks = flux_pipe, flux_networks
	        weights_root = "flux_sliderspace_weights"

	    sliderspace_path = _slider_weights_path(weights_root, slider_space, discovered_directions)
	    image, slider_image = _render_pair(
	        pipeline, lora_networks, sliderspace_path, slider_scale, seed, call_kwargs
	    )

	    return image, slider_image, seed


	# Sample prompts. Only the commented-out gr.Examples(...) line in the UI block
	# refers to this list, so it is currently not shown in the interface.
	examples = [
	    "Astronaut in a jungle, cold color palette, muted colors, detailed, 8k",
	    "An astronaut riding a green horse",
	    "A delicious ceviche cheesecake slice",
	]

	# Stylesheet passed to gr.Blocks(css=...): centers the element with id
	# "col-container" and caps its width at 640px.
	css = """
	#col-container {
	margin: 0 auto;
	max-width: 640px;
	}
	"""

	# Id of the original Space, and the id taken from the SPACE_ID environment
	# variable (None when that variable is not set).
	ORIGINAL_SPACE_ID = 'baulab/SliderSpace'
	SPACE_ID = os.getenv('SPACE_ID')

	# Markdown/HTML banner with a "Duplicate Space" badge that links to
	# https://huggingface.co/spaces/<SPACE_ID>?duplicate=true.
	# NOTE(review): neither this banner nor ORIGINAL_SPACE_ID is referenced in the
	# visible source, and with SPACE_ID unset the link contains the text "None".
	SHARED_UI_WARNING = f'''## You can duplicate and use it with a gpu with at least 24GB, or clone this repository to run on your own machine.
	<center><a class="duplicate-button" style="display:inline-block" target="_blank" href="https://huggingface.co/spaces/{SPACE_ID}?duplicate=true"><img style="margin-top:0;margin-bottom:0" src="https://img.shields.io/badge/-Duplicate%20Space-blue?labelColor=white&style=flat&logo=data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABAAAAAQCAYAAAAf8/9hAAAAAXNSR0IArs4c6QAAAP5JREFUOE+lk7FqAkEURY+ltunEgFXS2sZGIbXfEPdLlnxJyDdYB62sbbUKpLbVNhyYFzbrrA74YJlh9r079973psed0cvUD4A+4HoCjsA85X0Dfn/RBLBgBDxnQPfAEJgBY+A9gALA4tcbamSzS4xq4FOQAJgCDwV2CPKV8tZAJcAjMMkUe1vX+U+SMhfAJEHasQIWmXNN3abzDwHUrgcRGmYcgKe0bxrblHEB4E/pndMazNpSZGcsZdBlYJcEL9Afo75molJyM2FxmPgmgPqlWNLGfwZGG6UiyEvLzHYDmoPkDDiNm9JR9uboiONcBXrpY1qmgs21x1QwyZcpvxt9NS09PlsPAAAAAElFTkSuQmCC&logoWidth=14" alt="Duplicate Space"></a></center>
	'''

	with gr.Blocks(css=css) as demo:
	    # NOTE(review): the nesting of the layout containers below was reconstructed
	    # from a listing that had lost its indentation -- confirm it against the
	    # rendered app. Component creation order is unchanged.
	    with gr.Column(elem_id="col-container"):
	        gr.Markdown(" # SliderSpace: Decomposing Visual Capabilities of Diffusion Models")
	        # Adding links under the title
	        gr.Markdown("""
	🔗 [Project Page](https://sliderspace.baulab.info) \|
	💻 [GitHub Code](https://github.com/rohitgandikota/sliderspace)
	""")

	        # Prompt box and Run button share one row.
	        with gr.Row():
	            prompt = gr.Text(
	                label="Prompt", show_label=False, max_lines=1,
	                placeholder="Enter your prompt", container=False,
	            )
	            run_button = gr.Button("Run", scale=0, variant="primary")

	        # Add model selection dropdown
	        model_choice = gr.Dropdown(
	            choices=["SDXL-DMD", "FLUX-Schnell"], label="Model", value="SDXL-DMD",
	        )

	        # New dropdowns side by side
	        direction_labels = [f"Slider {i}" for i in range(1, 11)]
	        with gr.Row():
	            slider_space = gr.Dropdown(
	                choices=SDXL_CONCEPTS, label="SliderSpace Concept", value=SDXL_CONCEPTS[0],
	            )
	            discovered_directions = gr.Dropdown(
	                choices=direction_labels, label="Discovered Directions", value="Slider 1",
	            )

	        slider_scale = gr.Slider(label="Slider Scale", minimum=-4, maximum=4, step=0.1, value=1)

	        # Baseline render on the left, slider-edited render on the right.
	        with gr.Row():
	            result = gr.Image(label="Original Image", show_label=True)
	            slider_result = gr.Image(label="Discovered Edit Direction", show_label=True)

	        with gr.Accordion("Advanced Settings", open=False):
	            # Created hidden (visible=False) but still passed to `infer`.
	            negative_prompt = gr.Text(
	                label="Negative prompt", max_lines=1,
	                placeholder="Enter a negative prompt", visible=False,
	            )

	            seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)

	            randomize_seed = gr.Checkbox(label="Randomize seed", value=True)

	            # Replace the slider defaults below with values that work for your model.
	            with gr.Row():
	                width = gr.Slider(
	                    label="Width", minimum=256, maximum=MAX_IMAGE_SIZE, step=32, value=1024,
	                )
	                height = gr.Slider(
	                    label="Height", minimum=256, maximum=MAX_IMAGE_SIZE, step=32, value=1024,
	                )

	            with gr.Row():
	                guidance_scale = gr.Slider(
	                    label="Guidance scale", minimum=0.0, maximum=2.0, step=0.1, value=0.0,
	                )
	                num_inference_steps = gr.Slider(
	                    label="Number of inference steps", minimum=1, maximum=50, step=1, value=4,
	                )

	        # Add event handler for model selection
	        model_choice.change(
	            fn=update_sliderspace_choices, inputs=[model_choice], outputs=[slider_space],
	        )
	        # gr.Examples(examples=examples, inputs=[prompt])

	    # Order must match the positional parameters of `infer`.
	    infer_inputs = [
	        prompt, negative_prompt, seed, randomize_seed,
	        width, height, guidance_scale, num_inference_steps,
	        slider_space, discovered_directions, slider_scale, model_choice,
	    ]
	    # Clicking Run or submitting the prompt both run `infer`; the returned seed
	    # is written back into the seed slider.
	    gr.on(
	        triggers=[run_button.click, prompt.submit],
	        fn=infer,
	        inputs=infer_inputs,
	        outputs=[result, slider_result, seed],
	    )

	# Launch the Gradio app only when this file is executed as a script;
	# share=True asks Gradio for a public share link.
	if __name__ == "__main__":
	    demo.launch(share=True)

















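	# --- Earlier SDXL-only version of this app (no FLUX pipeline, no model selector), left commented out below ---
	# import gradio as gr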
	# import numpy as np
	# import random
	# import os
	# import spaces #[uncomment to use ZeroGPU]
	# from diffusers import DiffusionPipeline
	# import torch
	# from diffusers import DiffusionPipeline, UNet2DConditionModel, LCMScheduler
	# from huggingface_hub import hf_hub_download
	# from safetensors.torch import load_file
	# import sys
	# sys.path.append('.')
	# from utils.lora import LoRANetwork, DEFAULT_TARGET_REPLACE, UNET_TARGET_REPLACE_MODULE_CONV

	# model_repo_id = "stabilityai/stable-diffusion-xl-base-1.0"
	# repo_name = "tianweiy/DMD2"
	# ckpt_name = "dmd2_sdxl_4step_unet_fp16.bin"


	# device = "cuda" if torch.cuda.is_available() else "cpu"
	# if torch.cuda.is_available():
	# torch_dtype = torch.bfloat16
	# else:
	# torch_dtype = torch.float32

	# # Load model.
	# unet = UNet2DConditionModel.from_config(model_repo_id, subfolder="unet").to(device, torch_dtype)
	# unet.load_state_dict(torch.load(hf_hub_download(repo_name, ckpt_name)))
	# pipe = DiffusionPipeline.from_pretrained(model_repo_id, unet=unet, torch_dtype=torch_dtype).to(device)
	# pipe.scheduler = LCMScheduler.from_config(pipe.scheduler.config)


	# unet = pipe.unet

	# ## Change these parameters based on how you trained your sliderspace sliders
	# train_method = 'xattn-strict'
	# rank = 1
	# alpha =1
	# networks = {}
	# modules = DEFAULT_TARGET_REPLACE
	# modules += UNET_TARGET_REPLACE_MODULE_CONV
	# for i in range(1):
	# networks[i] = LoRANetwork(
	# unet,
	# rank=int(rank),
	# multiplier=1.0,
	# alpha=int(alpha),
	# train_method=train_method,
	# fast_init=True,
	# ).to(device, dtype=torch_dtype)



	# MAX_SEED = np.iinfo(np.int32).max
	# MAX_IMAGE_SIZE = 1024


	# @spaces.GPU #[uncomment to use ZeroGPU]
	# def infer(
	# prompt,
	# negative_prompt,
	# seed,
	# randomize_seed,
	# width,
	# height,
	# guidance_scale,
	# num_inference_steps,
	# slider_space,
	# discovered_directions,
	# slider_scale,
	# progress=gr.Progress(track_tqdm=True),
	# ):
	# if randomize_seed:
	# seed = random.randint(0, MAX_SEED)

	# sliderspace_path = f"sliderspace_weights/{slider_space}/slider_{int(discovered_directions.split(' ')[-1])-1}.pt"

	# for net in networks:
	# networks[net].load_state_dict(torch.load(sliderspace_path))

	# for net in networks:
	# networks[net].set_lora_slider(slider_scale)

	# with networks[0]:
	# pass

	# # original image
	# generator = torch.Generator().manual_seed(seed)
	# image = pipe(
	# prompt=prompt,
	# negative_prompt=negative_prompt,
	# guidance_scale=guidance_scale,
	# num_inference_steps=num_inference_steps,
	# width=width,
	# height=height,
	# generator=generator,
	# ).images[0]

	# # edited image
	# generator = torch.Generator().manual_seed(seed)
	# with networks[0]:
	# slider_image = pipe(
	# prompt=prompt,
	# negative_prompt=negative_prompt,
	# guidance_scale=guidance_scale,
	# num_inference_steps=num_inference_steps,
	# width=width,
	# height=height,
	# generator=generator,
	# ).images[0]


	# return image, slider_image, seed


	# examples = [
	# "Astronaut in a jungle, cold color palette, muted colors, detailed, 8k",
	# "An astronaut riding a green horse",
	# "A delicious ceviche cheesecake slice",
	# ]

	# css = """
	# #col-container {
	# margin: 0 auto;
	# max-width: 640px;
	# }
	# """

	# ORIGINAL_SPACE_ID = 'baulab/SliderSpace'
	# SPACE_ID = os.getenv('SPACE_ID')

	# SHARED_UI_WARNING = f'''## You can duplicate and use it with a gpu with at least 24GB, or clone this repository to run on your own machine.
	# <center><a class="duplicate-button" style="display:inline-block" target="_blank" href="https://huggingface.co/spaces/{SPACE_ID}?duplicate=true"><img style="margin-top:0;margin-bottom:0" src="https://img.shields.io/badge/-Duplicate%20Space-blue?labelColor=white&style=flat&logo=data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAABAAAAAQCAYAAAAf8/9hAAAAAXNSR0IArs4c6QAAAP5JREFUOE+lk7FqAkEURY+ltunEgFXS2sZGIbXfEPdLlnxJyDdYB62sbbUKpLbVNhyYFzbrrA74YJlh9r079973psed0cvUD4A+4HoCjsA85X0Dfn/RBLBgBDxnQPfAEJgBY+A9gALA4tcbamSzS4xq4FOQAJgCDwV2CPKV8tZAJcAjMMkUe1vX+U+SMhfAJEHasQIWmXNN3abzDwHUrgcRGmYcgKe0bxrblHEB4E/pndMazNpSZGcsZdBlYJcEL9Afo75molJyM2FxmPgmgPqlWNLGfwZGG6UiyEvLzHYDmoPkDDiNm9JR9uboiONcBXrpY1qmgs21x1QwyZcpvxt9NS09PlsPAAAAAElFTkSuQmCC&logoWidth=14" alt="Duplicate Space"></a></center>
	# '''

	# with gr.Blocks(css=css) as demo:
	# with gr.Column(elem_id="col-container"):
	# gr.Markdown(" # SliderSpace: Decomposing Visual Capabilities of Diffusion Models")
	# # Adding links under the title
	# gr.Markdown("""
	# 🔗 [Project Page](https://sliderspace.baulab.info) \|
	# 💻 [GitHub Code](https://github.com/rohitgandikota/sliderspace)
	# """)

	# with gr.Row():
	# prompt = gr.Text(
	# label="Prompt",
	# show_label=False,
	# max_lines=1,
	# placeholder="Enter your prompt",
	# container=False,
	# )

	# run_button = gr.Button("Run", scale=0, variant="primary")


	# # New dropdowns side by side
	# with gr.Row():
	# slider_space = gr.Dropdown(
	# choices= [
	# "alien",
	# "ancient ruins",
	# "animal",
	# "bike",
	# "car",
	# "Citadel",
	# "coral",
	# "cowboy",
	# "face",
	# "futuristic cities",
	# "monster",
	# "mystical creature",
	# "planet",
	# "plant",
	# "robot",
	# "sculpture",
	# "spaceship",
	# "statue",
	# "studio",
	# "video game",
	# "wizard"
	# ],
	# label="SliderSpace",
	# value="spaceship"
	# )
	# discovered_directions = gr.Dropdown(
	# choices=[f"Slider {i}" for i in range(1, 11)],
	# label="Discovered Directions",
	# value="Slider 1"
	# )

	# slider_scale = gr.Slider(
	# label="Slider Scale",
	# minimum=-4,
	# maximum=4,
	# step=0.1,
	# value=1,
	# )

	# with gr.Row():
	# result = gr.Image(label="Original Image", show_label=True)
	# slider_result = gr.Image(label="Discovered Edit Direction", show_label=True)


	# with gr.Accordion("Advanced Settings", open=False):
	# negative_prompt = gr.Text(
	# label="Negative prompt",
	# max_lines=1,
	# placeholder="Enter a negative prompt",
	# visible=False,
	# )

	# seed = gr.Slider(
	# label="Seed",
	# minimum=0,
	# maximum=MAX_SEED,
	# step=1,
	# value=0,
	# )

	# randomize_seed = gr.Checkbox(label="Randomize seed", value=True)

	# with gr.Row():
	# width = gr.Slider(
	# label="Width",
	# minimum=256,
	# maximum=MAX_IMAGE_SIZE,
	# step=32,
	# value=1024, # Replace with defaults that work for your model
	# )

	# height = gr.Slider(
	# label="Height",
	# minimum=256,
	# maximum=MAX_IMAGE_SIZE,
	# step=32,
	# value=1024, # Replace with defaults that work for your model
	# )

	# with gr.Row():
	# guidance_scale = gr.Slider(
	# label="Guidance scale",
	# minimum=0.0,
	# maximum=2.0,
	# step=0.1,
	# value=0.0, # Replace with defaults that work for your model
	# )

	# num_inference_steps = gr.Slider(
	# label="Number of inference steps",
	# minimum=1,
	# maximum=50,
	# step=1,
	# value=4, # Replace with defaults that work for your model
	# )

	# # gr.Examples(examples=examples, inputs=[prompt])
	# gr.on(
	# triggers=[run_button.click, prompt.submit],
	# fn=infer,
	# inputs=[
	# prompt,
	# negative_prompt,
	# seed,
	# randomize_seed,
	# width,
	# height,
	# guidance_scale,
	# num_inference_steps,
	# slider_space,
	# discovered_directions,
	# slider_scale
	# ],
	# outputs=[result, slider_result, seed],
	# )

	# if __name__ == "__main__":
	# demo.launch(share=True)