ftshijt committed
Commit be31546 · 1 Parent(s): e0b2439

Initial update for versa demo

Files changed (6)
  1. .gitignore +55 -0
  2. README.md +47 -6
  3. app.py +52 -150
  4. packages.txt +4 -0
  5. requirements.txt +11 -6
  6. test_versa.py +56 -0
.gitignore ADDED
@@ -0,0 +1,55 @@
+ # Python cache files
+ __pycache__/
+ *.py[cod]
+ *$py.class
+ *.so
+ .Python
+ env/
+ build/
+ develop-eggs/
+ dist/
+ downloads/
+ eggs/
+ .eggs/
+ lib/
+ lib64/
+ parts/
+ sdist/
+ var/
+ wheels/
+ *.egg-info/
+ .installed.cfg
+ *.egg
+
+ # Virtual environment
+ venv/
+ ENV/
+
+ # Local development settings
+ .env
+ .venv
+ .idea/
+ .vscode/
+ *.swp
+ *.swo
+
+ # Data directories
+ data/
+ uploads/
+ results/
+
+ # Logs
+ logs/
+ *.log
+
+ # VERSA installation (will be cloned at runtime)
+ versa/
+
+ # OS generated files
+ .DS_Store
+ .DS_Store?
+ ._*
+ .Spotlight-V100
+ .Trashes
+ ehthumbs.db
+ Thumbs.db
README.md CHANGED
@@ -1,13 +1,54 @@
  ---
- title: Versa
- emoji: 🖼
- colorFrom: purple
- colorTo: red
+ title: VERSA Speech & Audio Evaluation Demo
+ emoji: 🎙️
+ colorFrom: blue
+ colorTo: indigo
  sdk: gradio
- sdk_version: 5.0.1
+ sdk_version: 4.7.1
  app_file: app.py
  pinned: false
  license: apache-2.0
  ---

- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+ # VERSA Speech & Audio Evaluation Demo
+
+ This demo allows you to evaluate speech and audio files using the VERSA (Versatile Evaluation of Speech and Audio) toolkit.
+
+ ## How to Use
+
+ 1. Upload a ground truth audio file (the reference audio)
+ 2. Upload a prediction audio file (the audio to be evaluated)
+ 3. Select an evaluation metric from the dropdown menu
+ 4. Click the "Evaluate" button
+ 5. View the results in the table and raw JSON format
+
+ ## About VERSA
+
+ VERSA is a toolkit dedicated to collecting evaluation metrics in speech and audio quality. It provides a comprehensive connection to cutting-edge evaluation techniques and is tightly integrated with ESPnet.
+
+ With full installation, VERSA offers over 80 metrics with 700+ metric variations based on different configurations. These metrics encompass evaluations utilizing diverse external resources, including matching and non-matching reference audio, text transcriptions, and text captions.
+
+ Learn more at the [VERSA GitHub Repository](https://github.com/wavlab-speech/versa).
+
+ ## Features
+
+ - Easy-to-use interface for audio evaluation
+ - Support for various evaluation metrics
+ - Detailed results displayed in table format
+ - Raw JSON output for further analysis
+
+ ## Citation
+
+ If you use VERSA in your research, please cite:
+
+ ```
+ @misc{shi2024versaversatileevaluationtoolkit,
+   title={VERSA: A Versatile Evaluation Toolkit for Speech, Audio, and Music},
+   author={Jiatong Shi and Hye-jin Shim and Jinchuan Tian and Siddhant Arora and Haibin Wu and Darius Petermann and Jia Qi Yip and You Zhang and Yuxun Tang and Wangyou Zhang and Dareen Safar Alharthi and Yichen Huang and Koichi Saito and Jionghao Han and Yiwen Zhao and Chris Donahue and Shinji Watanabe},
+   year={2024},
+   eprint={2412.17667},
+   archivePrefix={arXiv},
+   primaryClass={cs.SD},
+   url={https://arxiv.org/abs/2412.17667},
+ }
+ ```
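Editor's note: the "How to Use" steps in the new README (upload ground truth, upload prediction, pick a metric, evaluate) ultimately have to hand the two audio files and a metric configuration to VERSA's scorer script, whose expected location both app.py and test_versa.py compute as versa/versa/bin/scorer.py. A minimal sketch of such a call is below; the --score_config, --gt, --pred, and --output_file flag names are assumptions about the scorer's CLI rather than something this commit shows.

```python
import os
import subprocess
import tempfile

# Path layout mirrors test_versa.py: the VERSA repo is expected under ./versa
VERSA_ROOT = os.path.join(os.path.dirname(os.path.abspath(__file__)), "versa")
SCORER = os.path.join(VERSA_ROOT, "versa", "bin", "scorer.py")


def run_versa(gt_path: str, pred_path: str, metric_config: str) -> str:
    """Score one ground-truth/prediction pair with a YAML config from versa/egs/."""
    with tempfile.NamedTemporaryFile(suffix=".json", delete=False) as tmp:
        output_file = tmp.name

    subprocess.run(
        [
            "python", SCORER,
            "--score_config", metric_config,  # assumed flag name
            "--gt", gt_path,                  # assumed flag name
            "--pred", pred_path,              # assumed flag name
            "--output_file", output_file,     # assumed flag name
        ],
        check=True,
    )

    with open(output_file) as f:
        return f.read()  # raw scorer output, shown as "raw JSON" in the UI
```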
app.py CHANGED
@@ -1,154 +1,56 @@
- import gradio as gr
- import numpy as np
- import random
-
- # import spaces #[uncomment to use ZeroGPU]
- from diffusers import DiffusionPipeline
- import torch
-
- device = "cuda" if torch.cuda.is_available() else "cpu"
- model_repo_id = "stabilityai/sdxl-turbo"  # Replace to the model you would like to use
-
- if torch.cuda.is_available():
-     torch_dtype = torch.float16
- else:
-     torch_dtype = torch.float32
-
- pipe = DiffusionPipeline.from_pretrained(model_repo_id, torch_dtype=torch_dtype)
- pipe = pipe.to(device)
-
- MAX_SEED = np.iinfo(np.int32).max
- MAX_IMAGE_SIZE = 1024
-
-
- # @spaces.GPU #[uncomment to use ZeroGPU]
- def infer(
-     prompt,
-     negative_prompt,
-     seed,
-     randomize_seed,
-     width,
-     height,
-     guidance_scale,
-     num_inference_steps,
-     progress=gr.Progress(track_tqdm=True),
- ):
-     if randomize_seed:
-         seed = random.randint(0, MAX_SEED)
-
-     generator = torch.Generator().manual_seed(seed)
-
-     image = pipe(
-         prompt=prompt,
-         negative_prompt=negative_prompt,
-         guidance_scale=guidance_scale,
-         num_inference_steps=num_inference_steps,
-         width=width,
-         height=height,
-         generator=generator,
-     ).images[0]
-
-     return image, seed
-
-
- examples = [
-     "Astronaut in a jungle, cold color palette, muted colors, detailed, 8k",
-     "An astronaut riding a green horse",
-     "A delicious ceviche cheesecake slice",
- ]
-
- css = """
- #col-container {
-     margin: 0 auto;
-     max-width: 640px;
- }
+ #!/usr/bin/env python3
+ """
+ Test script to verify that VERSA is installed correctly.
  """

- with gr.Blocks(css=css) as demo:
-     with gr.Column(elem_id="col-container"):
-         gr.Markdown(" # Text-to-Image Gradio Template")
-
-         with gr.Row():
-             prompt = gr.Text(
-                 label="Prompt",
-                 show_label=False,
-                 max_lines=1,
-                 placeholder="Enter your prompt",
-                 container=False,
-             )
-
-             run_button = gr.Button("Run", scale=0, variant="primary")
-
-         result = gr.Image(label="Result", show_label=False)
-
-         with gr.Accordion("Advanced Settings", open=False):
-             negative_prompt = gr.Text(
-                 label="Negative prompt",
-                 max_lines=1,
-                 placeholder="Enter a negative prompt",
-                 visible=False,
-             )
-
-             seed = gr.Slider(
-                 label="Seed",
-                 minimum=0,
-                 maximum=MAX_SEED,
-                 step=1,
-                 value=0,
-             )
-
-             randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
-
-             with gr.Row():
-                 width = gr.Slider(
-                     label="Width",
-                     minimum=256,
-                     maximum=MAX_IMAGE_SIZE,
-                     step=32,
-                     value=1024,  # Replace with defaults that work for your model
-                 )
-
-                 height = gr.Slider(
-                     label="Height",
-                     minimum=256,
-                     maximum=MAX_IMAGE_SIZE,
-                     step=32,
-                     value=1024,  # Replace with defaults that work for your model
-                 )
-
-             with gr.Row():
-                 guidance_scale = gr.Slider(
-                     label="Guidance scale",
-                     minimum=0.0,
-                     maximum=10.0,
-                     step=0.1,
-                     value=0.0,  # Replace with defaults that work for your model
-                 )
-
-                 num_inference_steps = gr.Slider(
-                     label="Number of inference steps",
-                     minimum=1,
-                     maximum=50,
-                     step=1,
-                     value=2,  # Replace with defaults that work for your model
-                 )
-
-     gr.Examples(examples=examples, inputs=[prompt])
-     gr.on(
-         triggers=[run_button.click, prompt.submit],
-         fn=infer,
-         inputs=[
-             prompt,
-             negative_prompt,
-             seed,
-             randomize_seed,
-             width,
-             height,
-             guidance_scale,
-             num_inference_steps,
-         ],
-         outputs=[result, seed],
-     )
+ import os
+ import sys
+ import subprocess
+ from pathlib import Path
+
+ # Check if VERSA is installed
+ VERSA_ROOT = os.path.join(os.path.dirname(os.path.abspath(__file__)), "versa")
+
+ def check_versa():
+     """Check if VERSA is installed and working"""
+     print("Testing VERSA installation...")
+
+     if not os.path.exists(VERSA_ROOT):
+         print("VERSA not found.")
+         return False
+
+     # Check if the scorer.py exists
+     scorer_path = os.path.join(VERSA_ROOT, "versa", "bin", "scorer.py")
+     if not os.path.exists(scorer_path):
+         print(f"VERSA scorer not found at {scorer_path}")
+         return False
+
+     # Check if the config directory exists
+     config_dir = os.path.join(VERSA_ROOT, "egs")
+     if not os.path.exists(config_dir):
+         print(f"VERSA config directory not found at {config_dir}")
+         return False
+
+     # Check for available metrics
+     metrics = []
+     for root, _, files in os.walk(config_dir):
+         for file in files:
+             if file.endswith('.yaml'):
+                 metrics.append(os.path.join(root, file))
+
+     if not metrics:
+         print("No metric configurations found in VERSA.")
+         return False
+
+     print(f"Found {len(metrics)} metric configurations.")
+     for metric in metrics[:5]:  # Print first 5 metrics
+         print(f"- {os.path.relpath(metric, config_dir)}")
+
+     if len(metrics) > 5:
+         print(f"... and {len(metrics) - 5} more.")
+
+     print("VERSA installation looks good!")
+     return True

  if __name__ == "__main__":
-     demo.launch()
+     check_versa()
packages.txt ADDED
@@ -0,0 +1,4 @@
+ git
+ build-essential
+ libsndfile1
+ ffmpeg
requirements.txt CHANGED
@@ -1,6 +1,11 @@
- accelerate
- diffusers
- invisible_watermark
- torch
- transformers
- xformers
+ gradio>=4.0.0
+ pyyaml>=6.0
+ pandas>=1.5.0
+ numpy>=1.20.0
+ matplotlib>=3.5.0
+ soundfile>=0.12.1
+ scipy>=1.7.0
+ torch>=1.10.0
+ torchaudio>=0.10.0
+ librosa>=0.9.2
+ GitPython>=3.1.30
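Editor's note: requirements.txt now pulls in GitPython, which lines up with the .gitignore comment that versa/ "will be cloned at runtime" rather than committed. A hedged sketch of that startup step, assuming the Space clones the repository named in the README and then pip-installs it in editable mode (the install step is an assumption, not shown in this commit).

```python
import os
import subprocess

from git import Repo  # GitPython, listed in requirements.txt

VERSA_ROOT = os.path.join(os.path.dirname(os.path.abspath(__file__)), "versa")


def ensure_versa() -> None:
    """Clone VERSA on first launch so the toolkit does not live in this repo."""
    if not os.path.exists(VERSA_ROOT):
        Repo.clone_from("https://github.com/wavlab-speech/versa.git", VERSA_ROOT)
        # Assumed follow-up: install the cloned package so scorer.py imports work.
        subprocess.run(["pip", "install", "-e", VERSA_ROOT], check=True)
```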
test_versa.py ADDED
@@ -0,0 +1,56 @@
+ #!/usr/bin/env python3
+ """
+ Test script to verify that VERSA is installed correctly.
+ """
+
+ import os
+ import sys
+ import subprocess
+ from pathlib import Path
+
+ # Check if VERSA is installed
+ VERSA_ROOT = os.path.join(os.path.dirname(os.path.abspath(__file__)), "versa")
+
+ def check_versa():
+     """Check if VERSA is installed and working"""
+     print("Testing VERSA installation...")
+
+     if not os.path.exists(VERSA_ROOT):
+         print("VERSA not found.")
+         return False
+
+     # Check if the scorer.py exists
+     scorer_path = os.path.join(VERSA_ROOT, "versa", "bin", "scorer.py")
+     if not os.path.exists(scorer_path):
+         print(f"VERSA scorer not found at {scorer_path}")
+         return False
+
+     # Check if the config directory exists
+     config_dir = os.path.join(VERSA_ROOT, "egs")
+     if not os.path.exists(config_dir):
+         print(f"VERSA config directory not found at {config_dir}")
+         return False
+
+     # Check for available metrics
+     metrics = []
+     for root, _, files in os.walk(config_dir):
+         for file in files:
+             if file.endswith('.yaml'):
+                 metrics.append(os.path.join(root, file))
+
+     if not metrics:
+         print("No metric configurations found in VERSA.")
+         return False
+
+     print(f"Found {len(metrics)} metric configurations.")
+     for metric in metrics[:5]:  # Print first 5 metrics
+         print(f"- {os.path.relpath(metric, config_dir)}")
+
+     if len(metrics) > 5:
+         print(f"... and {len(metrics) - 5} more.")
+
+     print("VERSA installation looks good!")
+     return True
+
+ if __name__ == "__main__":
+     check_versa()
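Editor's note: the README promises results "in the table and raw JSON format", and requirements.txt adds pandas, presumably for the table view. A small sketch of that conversion, assuming (not shown in this commit) that the scorer writes one JSON object per scored utterance to its output file.

```python
import json

import pandas as pd


def results_to_table(output_file: str) -> pd.DataFrame:
    """Parse a scorer output file (assumed JSON-lines) into a metrics table."""
    records = []
    with open(output_file) as f:
        for line in f:
            line = line.strip()
            if line:
                records.append(json.loads(line))
    # One row per utterance, one column per reported metric value.
    return pd.DataFrame(records)
```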