video-upscaling-server-1

Running on A10G

App Files Files

jbilcke-hf HF staff commited on Aug 10, 2023

Commit

8024618

•

1 Parent(s): 12e4a4d

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -98

app.py CHANGED Viewed

@@ -3,11 +3,13 @@ import numpy as np
 from PIL import Image
 import cv2
 from moviepy.editor import VideoFileClip
-from share_btn import community_icon_html, loading_icon_html, share_js
 import torch
 from diffusers import DiffusionPipeline, DPMSolverMultistepScheduler
 from diffusers.utils import export_to_video
 pipe_xl = DiffusionPipeline.from_pretrained("cerspense/zeroscope_v2_XL", torch_dtype=torch.float16, revision="refs/pr/17")
 pipe_xl.vae.enable_slicing()
 pipe_xl.scheduler = DPMSolverMultistepScheduler.from_config(pipe_xl.scheduler.config)
@@ -52,119 +54,40 @@ def convert_mp4_to_frames(video_path, duration=3):
     return frames
-def infer(prompt, video_in, denoise_strength):
-    negative_prompt = "text, watermark, copyright, blurry, nsfw"
     # we cannot go beyond 3 seconds on the large A10G
-    video = convert_mp4_to_frames(video_in, duration=3)
     video_resized = [Image.fromarray(frame).resize((1024, 576)) for frame in video]
     video_frames = pipe_xl(prompt, negative_prompt=negative_prompt, video=video_resized, strength=denoise_strength).frames
     video_path = export_to_video(video_frames, output_video_path="xl_result.mp4")
     return "xl_result.mp4", gr.Group.update(visible=True)
-css = """
-#col-container {max-width: 510px; margin-left: auto; margin-right: auto;}
-a {text-decoration-line: underline; font-weight: 600;}
-.animate-spin {
-  animation: spin 1s linear infinite;
-}
-@keyframes spin {
-  from {
-      transform: rotate(0deg);
-  }
-  to {
-      transform: rotate(360deg);
-  }
-}
-#share-btn-container {
-  display: flex;
-  padding-left: 0.5rem !important;
-  padding-right: 0.5rem !important;
-  background-color: #000000;
-  justify-content: center;
-  align-items: center;
-  border-radius: 9999px !important;
-  max-width: 13rem;
-}
-#share-btn-container:hover {
-  background-color: #060606;
-}
-#share-btn {
-  all: initial;
-  color: #ffffff;
-  font-weight: 600;
-  cursor:pointer;
-  font-family: 'IBM Plex Sans', sans-serif;
-  margin-left: 0.5rem !important;
-  padding-top: 0.5rem !important;
-  padding-bottom: 0.5rem !important;
-  right:0;
-}
-#share-btn * {
-  all: unset;
-}
-#share-btn-container div:nth-child(-n+2){
-  width: auto !important;
-  min-height: 0px !important;
-}
-#share-btn-container .wrap {
-  display: none !important;
-}
-#share-btn-container.hidden {
-  display: none!important;
-}
-img[src*='#center'] {
-    display: block;
-    margin: auto;
-}
-"""
-with gr.Blocks(css=css) as demo:
-    with gr.Column(elem_id="col-container"):
-        gr.Markdown(
-            """
-            <h1 style="text-align: center;">Zeroscope XL</h1>
-            <p style="text-align: center;">
-            This space is specifically designed for upscaling content made from <br />
-            <a href="https://huggingface.co/spaces/fffiloni/zeroscope">the zeroscope_v2_576w space</a> using vid2vid. <br />
-            Remember to use the same prompt that was used to generate the original clip.<br />
-            For demo purpose, video length is limited to 3 seconds.
-            </p>
-            [![Duplicate this Space](https://huggingface.co/datasets/huggingface/badges/raw/main/duplicate-this-space-sm.svg#center)](https://huggingface.co/spaces/fffiloni/zeroscope-XL?duplicate=true)
-            """
-        )
         video_in = gr.Video(type="numpy", source="upload")
-        prompt_in = gr.Textbox(label="Prompt", placeholder="This must be the same prompt you used for the original clip :)", elem_id="prompt-in")
         denoise_strength = gr.Slider(label="Denoise strength", minimum=0.6, maximum=0.9, step=0.01, value=0.66)
-        #inference_steps = gr.Slider(label="Inference Steps", minimum=10, maximum=100, step=1, value=40, interactive=False)
         submit_btn = gr.Button("Submit")
         video_result = gr.Video(label="Video Output", elem_id="video-output")
-        with gr.Group(elem_id="share-btn-container", visible=False) as share_group:
-            community_icon = gr.HTML(community_icon_html)
-            loading_icon = gr.HTML(loading_icon_html)
-            share_button = gr.Button("Share to community", elem_id="share-btn")
     submit_btn.click(fn=infer,
-                    inputs=[prompt_in, video_in, denoise_strength],
-                    outputs=[video_result, share_group],
                     api_name="zero_xl"
                     )
-    share_button.click(None, [], [], _js=share_js)
-demo.queue(max_size=12).launch()

 from PIL import Image
 import cv2
 from moviepy.editor import VideoFileClip
 import torch
 from diffusers import DiffusionPipeline, DPMSolverMultistepScheduler
 from diffusers.utils import export_to_video
+SECRET_TOKEN = os.getenv('SECRET_TOKEN', 'default_secret')
+DESCRIPTION = 'This space is an API service meant to be used by VideoChain and VideoQuest.\nWant to use this space for yourself? Please use the original code: [https://huggingface.co/spaces/fffiloni/zeroscope-XL](https://huggingface.co/spaces/fffiloni/zeroscope-XL)'
 pipe_xl = DiffusionPipeline.from_pretrained("cerspense/zeroscope_v2_XL", torch_dtype=torch.float16, revision="refs/pr/17")
 pipe_xl.vae.enable_slicing()
 pipe_xl.scheduler = DPMSolverMultistepScheduler.from_config(pipe_xl.scheduler.config)
     return frames
+def infer(prompt, video_in, denoise_strength, duration, secret_token: str = '') -> str:
+    if secret_token != SECRET_TOKEN:
+        raise gr.Error(
+            f'Invalid secret token. Please fork the original space if you want to use it for yourself.')
+    negative_prompt = "text, watermark, copyright, blurry, cropped, noisy, pixelated, nsfw"
     # we cannot go beyond 3 seconds on the large A10G
+    video = convert_mp4_to_frames(video_in, min(duration, 3))
     video_resized = [Image.fromarray(frame).resize((1024, 576)) for frame in video]
     video_frames = pipe_xl(prompt, negative_prompt=negative_prompt, video=video_resized, strength=denoise_strength).frames
     video_path = export_to_video(video_frames, output_video_path="xl_result.mp4")
     return "xl_result.mp4", gr.Group.update(visible=True)
+with gr.Blocks() as demo:
+    gr.Markdown(DESCRIPTION)
+    with gr.Column():
+        secret_token = gr.Text(label='Secret Token', max_lines=1)
         video_in = gr.Video(type="numpy", source="upload")
+        prompt_in = gr.Textbox(label="Prompt", elem_id="prompt-in")
         denoise_strength = gr.Slider(label="Denoise strength", minimum=0.6, maximum=0.9, step=0.01, value=0.66)
+        duration = gr.Slider(label="Duration", minimum=0.5, maximum=3, step=0.5, value=3)
+        #inference_steps = gr.Slider(label="Inference Steps", minimum=7, maximum=100, step=1, value=40, interactive=False)
         submit_btn = gr.Button("Submit")
         video_result = gr.Video(label="Video Output", elem_id="video-output")
     submit_btn.click(fn=infer,
+                    inputs=[prompt_in, video_in, denoise_strength, secret_token],
+                    outputs=[video_result],
                     api_name="zero_xl"
                     )
+demo.queue(max_size=6).launch()