Spaces:

nigeljw
/

ViewDiffusion

Paused

App Files Community

nigeljw committed on May 16, 2023

Commit

671a051

1 Parent(s): 27ee5cf

Modified prompts

Browse files

Files changed (1) hide show

app.py +13 -11

app.py CHANGED Viewed

@@ -81,7 +81,7 @@ def Diffuse(latentWalk, generatorSeed, inputImage, mask, prompt, negativePrompt,
     if lastSeed != generatorSeed:
         generator = torch.Generator(device).manual_seed(generatorSeed)
         lastSeed = generatorSeed
     newImage = outpaintPipeline(prompt=prompt,
                     negative_prompt=negativePrompt,
                     image=inputImage,
@@ -118,10 +118,10 @@ latentWalkDesc = "This allows you to walk short spans across the latent space wi
 examplePrompt1 = "A person in a room" #A person in a room with colored hair"
 examplePrompt2 = "A person with colored hair" #"People in a room with colored hair"
 examplePrompt3 = "A person on a beach with long hair" #"A man on a beach with long hair"
-examplePrompt4 = "A person in a field under a night sky" #"A woman on a beach with long hair"
-examplePrompt5 = "A panda eating bamboo" #"A panda eating bamboo"
 examplePrompt6 = "A bird flying in the sky" #"A family together in a room"
-examplePrompt7 = "A Koala bear" #"A family together outside with colored hair"
 with gradio.Blocks(live=True) as ux:
     gradio.Markdown("This generative machine learning demonstration streams stable diffusion outpainting inference live from your camera on your computer or phone to expand your local reality and create an alternate world. High quality frame to frame determinism is a hard problem to solve for latent diffusion models as the generation is inherently relative to input noise distributions for the latents, and many factors such as the inherent Bayer noise from the camera images as well as anything that is altered between camera images (such as focus, white balance, etc) causes non-determinism between frames. Some methods apply spationtemporal attention, but this demonstration focuses on the control over the input latents to navigate the latent space. **Increase the lighting of your physical scene from your camera's perspective, and avoid self shadows of scene content, to improve the quality and consistency of the scene generation.**")
@@ -129,12 +129,14 @@ with gradio.Blocks(live=True) as ux:
         with gradio.Column():
             #staticLatents = gradio.Checkbox(label="Static Latents", info=staticLatentsDesc, value=True, interactive=True)
             inputImage = gradio.Image(label="Input Feed", source="webcam", shape=[512,512], streaming=True)
             mask = gradio.Image(label="Mask", type="pil", value=defaultMask)
             prompt = gradio.Textbox(label="Prompt", info=promptDesc, placeholder=examplePrompt1, value=examplePrompt1, lines=3)
             negativePrompt = gradio.Textbox(label="Negative Prompt", info=negPromptDesc, placeholder="Facial hair", value="Text, words", lines=3)
             guidanceScale = gradio.Slider(label="Guidance Scale", info="A higher value causes the generation to be more relative to the text prompt conditioning.", maximum=100, minimum=1, value=7.5, step= 0.1)
             numInferenceSteps = gradio.Slider(label="Number of Inference Steps", info=numInfStepsDesc, maximum=100, minimum=1, value=20, step=1)
             generatorSeed = gradio.Slider(label="Generator Seed", info=generatorSeedDesc, maximum=10000, minimum=1, value=lastSeed, step=1)
             #modelIndex = gradio.Dropdown(modelNames, label="Model", value="runwayml/stable-diffusion-inpainting")
             #inputImage.style(full_width=True)
@@ -149,13 +151,13 @@ with gradio.Blocks(live=True) as ux:
     generateLatents.click(GenerateNewLatentsForInference, outputs=latentWalk)
     inputImage.change(fn=Diffuse, inputs=inferenceInputs, outputs=outputImage, show_progress=False)
-    examples = [[1.0, 1234, "assets/input/man.png", "assets/masks/diamond.png", examplePrompt1, "", 7.5, 20],
-                [0.5, 2048, "assets/input/people.jpg", "assets/masks/star.png", examplePrompt2, "", 7.5, 15],
-                [0.3, 8192, "assets/input/man.png", "assets/masks/sphere.png", examplePrompt3, "", 7.5, 25],
-                [0.7, 1024, "assets/input/woman.jpg", "assets/masks/spiral.png", examplePrompt4, "", 7.5, 15],
-                [1.0, 512, "assets/input/man.png", "assets/masks/square.png", examplePrompt5, "", 7.5, 10],
-                [0.1, 256, "assets/input/family.jpg", "assets/masks/wave.png", examplePrompt6, "", 11.5, 30],
-                [0.9, 9999, "assets/input/family.jpg", "assets/masks/maze.png", examplePrompt7, "", 17.5, 35],]
     inputExamples = gradio.Examples(examples, inputs=inferenceInputs, outputs=outputImage, fn=Diffuse)

     if lastSeed != generatorSeed:
         generator = torch.Generator(device).manual_seed(generatorSeed)
         lastSeed = generatorSeed
     newImage = outpaintPipeline(prompt=prompt,
                     negative_prompt=negativePrompt,
                     image=inputImage,
 examplePrompt1 = "A person in a room" #A person in a room with colored hair"
 examplePrompt2 = "A person with colored hair" #"People in a room with colored hair"
 examplePrompt3 = "A person on a beach with long hair" #"A man on a beach with long hair"
+examplePrompt4 = "A person outside in a field under a starry night sky" #"A woman on a beach with long hair"
+examplePrompt5 = "A person in a forest" #"A panda eating bamboo" #"A panda eating bamboo"
 examplePrompt6 = "A bird flying in the sky" #"A family together in a room"
+examplePrompt7 = "A person in a room" #"A family together outside with colored hair"
 with gradio.Blocks(live=True) as ux:
     gradio.Markdown("This generative machine learning demonstration streams stable diffusion outpainting inference live from your camera on your computer or phone to expand your local reality and create an alternate world. High quality frame to frame determinism is a hard problem to solve for latent diffusion models as the generation is inherently relative to input noise distributions for the latents, and many factors such as the inherent Bayer noise from the camera images as well as anything that is altered between camera images (such as focus, white balance, etc) causes non-determinism between frames. Some methods apply spationtemporal attention, but this demonstration focuses on the control over the input latents to navigate the latent space. **Increase the lighting of your physical scene from your camera's perspective, and avoid self shadows of scene content, to improve the quality and consistency of the scene generation.**")
         with gradio.Column():
             #staticLatents = gradio.Checkbox(label="Static Latents", info=staticLatentsDesc, value=True, interactive=True)
             inputImage = gradio.Image(label="Input Feed", source="webcam", shape=[512,512], streaming=True)
+            #inputImage2 = gradio.Image(label="Input Feed 2", source="webcam", shape=[512,512], streaming=True)
             mask = gradio.Image(label="Mask", type="pil", value=defaultMask)
             prompt = gradio.Textbox(label="Prompt", info=promptDesc, placeholder=examplePrompt1, value=examplePrompt1, lines=3)
             negativePrompt = gradio.Textbox(label="Negative Prompt", info=negPromptDesc, placeholder="Facial hair", value="Text, words", lines=3)
             guidanceScale = gradio.Slider(label="Guidance Scale", info="A higher value causes the generation to be more relative to the text prompt conditioning.", maximum=100, minimum=1, value=7.5, step= 0.1)
             numInferenceSteps = gradio.Slider(label="Number of Inference Steps", info=numInfStepsDesc, maximum=100, minimum=1, value=20, step=1)
             generatorSeed = gradio.Slider(label="Generator Seed", info=generatorSeedDesc, maximum=10000, minimum=1, value=lastSeed, step=1)
+            #numViews = gradio.Slider(label="Number of Views", info="The number of discrete view perspectives to merge together in the view expansion.", maximum=100, minimum=1, value=1, step=1)
             #modelIndex = gradio.Dropdown(modelNames, label="Model", value="runwayml/stable-diffusion-inpainting")
             #inputImage.style(full_width=True)
     generateLatents.click(GenerateNewLatentsForInference, outputs=latentWalk)
     inputImage.change(fn=Diffuse, inputs=inferenceInputs, outputs=outputImage, show_progress=False)
+    examples = [[1.0, 1234, "assets/input/man.png","assets/masks/diamond.png", examplePrompt1, "", 7.5, 20, 1],
+                [0.5, 2048, "assets/input/woman.jpg", "assets/masks/star.png", examplePrompt2, "", 7.5, 15, 1],
+                [0.3, 8192, "assets/input/man.png", "assets/masks/sphere.png", examplePrompt3, "", 7.5, 25, 1],
+                [0.7, 1024, "assets/input/woman.jpg", "assets/masks/spiral.png", examplePrompt4, "", 7.5, 15, 1],
+                [1.0, 512, "assets/input/man.png", "assets/masks/square.png", examplePrompt5, "", 7.5, 10, 1],
+                [0.1, 256, "assets/input/woman.jpg", "assets/masks/wave.png", examplePrompt6, "", 11.5, 30, 1],
+                [0.9, 9999, "assets/input/man.png", "assets/masks/maze.png", examplePrompt7, "", 17.5, 35, 1],]
     inputExamples = gradio.Examples(examples, inputs=inferenceInputs, outputs=outputImage, fn=Diffuse)