Spaces:

SaiShailesh
/

stable_diffusion

Build error

App Files Files Community

stable_diffusion / app.py

SaiShailesh

Upload 2 files

4c1e086 verified about 1 month ago

raw

history blame contribute delete

5.18 kB

	import streamlit as st
	import torch
	from torch import nn
	from diffusers import DDPMScheduler, UNet2DModel
	import matplotlib.pyplot as plt
	from tqdm.auto import tqdm

	# Reuse your existing model code
	class ClassConditionedUnet(nn.Module):
	def __init__(self, num_classes=3, class_emb_size=12):
	super().__init__()
	self.class_emb = nn.Embedding(num_classes, class_emb_size)
	self.model = UNet2DModel(
	sample_size=64,
	in_channels=3 + class_emb_size,
	out_channels=3,
	layers_per_block=2,
	block_out_channels=(64, 128, 256, 512),
	down_block_types=(
	"DownBlock2D",
	"DownBlock2D",
	"AttnDownBlock2D",
	"AttnDownBlock2D",
	),
	up_block_types=(
	"AttnUpBlock2D",
	"AttnUpBlock2D",
	"UpBlock2D",
	"UpBlock2D",
	),
	)

	def forward(self, x, t, class_labels):
	bs, ch, w, h = x.shape
	class_cond = self.class_emb(class_labels)
	class_cond = class_cond.view(bs, class_cond.shape[1], 1, 1).expand(bs, class_cond.shape[1], w, h)
	net_input = torch.cat((x, class_cond), 1)
	return self.model(net_input, t).sample

	@st.cache_resource
	def load_model(model_path):
	"""Load the model with caching to avoid reloading"""
	device = 'cpu' # For deployment, we'll use CPU
	net = ClassConditionedUnet().to(device)
	noise_scheduler = DDPMScheduler(num_train_timesteps=1000, beta_schedule='squaredcos_cap_v2')
	checkpoint = torch.load(model_path, map_location='cpu')
	net.load_state_dict(checkpoint['model_state_dict'])
	return net, noise_scheduler

	def generate_mixed_faces(net, noise_scheduler, mix_weights, num_images=1):
	"""Generate faces with mixed ethnic features"""
	device = next(net.parameters()).device
	net.eval()
	with torch.no_grad():
	x = torch.randn(num_images, 3, 64, 64).to(device)

	# Get embeddings for all classes
	emb_asian = net.class_emb(torch.zeros(num_images).long().to(device))
	emb_indian = net.class_emb(torch.ones(num_images).long().to(device))
	emb_european = net.class_emb(torch.full((num_images,), 2).to(device))

	progress_bar = st.progress(0)
	for idx, t in enumerate(noise_scheduler.timesteps):
	# Update progress bar
	progress_bar.progress(idx / len(noise_scheduler.timesteps))

	# Mix embeddings according to weights
	mixed_emb = (
	mix_weights[0] * emb_asian +
	mix_weights[1] * emb_indian +
	mix_weights[2] * emb_european
	)

	# Override embedding layer temporarily
	original_forward = net.class_emb.forward
	net.class_emb.forward = lambda _: mixed_emb

	residual = net(x, t, torch.zeros(num_images).long().to(device))
	x = noise_scheduler.step(residual, t, x).prev_sample

	# Restore original embedding layer
	net.class_emb.forward = original_forward

	progress_bar.progress(1.0)

	x = (x.clamp(-1, 1) + 1) / 2
	return x

	def main():
	st.title("AI Face Generator with Ethnic Features Mixing")

	# Load model
	try:
	net, noise_scheduler = load_model('final_model/final_diffusion_model.pt')
	except Exception as e:
	st.error(f"Error loading model: {str(e)}")
	return

	# Create sliders for ethnicity percentages
	st.subheader("Adjust Ethnicity Mix")
	col1, col2, col3 = st.columns(3)

	with col1:
	asian_pct = st.slider("Asian Features %", 0, 100, 33, 1)
	with col2:
	indian_pct = st.slider("Indian Features %", 0, 100, 33, 1)
	with col3:
	european_pct = st.slider("European Features %", 0, 100, 34, 1)

	# Calculate total and normalize if needed
	total = asian_pct + indian_pct + european_pct
	if total == 0:
	st.warning("Total percentage cannot be 0%. Please adjust the sliders.")
	return

	# Normalize weights to sum to 1
	weights = [asian_pct/total, indian_pct/total, european_pct/total]

	# Display current mix
	st.write("Current mix (normalized):")
	st.write(f"Asian: {weights[0]:.2%}, Indian: {weights[1]:.2%}, European: {weights[2]:.2%}")

	# Generate button
	if st.button("Generate Face"):
	try:
	with st.spinner("Generating face..."):
	# Generate the image
	generated_images = generate_mixed_faces(net, noise_scheduler, weights)

	# Convert to numpy and display
	img = generated_images[0].permute(1, 2, 0).cpu().numpy()
	st.image(img, caption="Generated Face", use_column_width=True)

	except Exception as e:
	st.error(f"Error generating image: {str(e)}")

	if __name__ == "__main__":
	main()