pablorodriper committed on
Commit 9b2dc59
1 Parent(s): 33f824c

Upload 2 files

Files changed (2):
  1. app.py +39 -16
  2. predict.py +54 -0
app.py CHANGED
@@ -1,25 +1,48 @@
+import glob
+
 import gradio as gr
 import tensorflow as tf
 from huggingface_hub import from_pretrained_keras
 
-description = "Keras implementation for Video Vision Transformer trained with OrganMNIST3D (CT videos)"
-article = "Classes: liver, kidney-right, kidney-left, femur-right, femur-left, bladder, heart, lung-right, lung-left, spleen, pancreas.\n\nAuthor:<a href=\"https://huggingface.co/pablorodriper/\"> Pablo Rodríguez</a>; Based on the keras example by <a href=\"https://keras.io/examples/vision/vivit/\">Aritra Roy Gosthipaty and Ayush Thakur</a>"
-title = "Video Vision Transformer on OrganMNIST3D"
-
-def infer(x):
-    return model.predict(tf.expand_dims(x, axis=0))[0]
-
-model = from_pretrained_keras("keras-io/video-vision-transformer")
-
-labels = ['liver', 'kidney-right', 'kidney-left', 'femur-right', 'femur-left', 'bladder', 'heart', 'lung-right', 'lung-left', 'spleen', 'pancreas']
-
-iface = gr.Interface(
-    fn = infer,
-    inputs = "video",
-    outputs = "number",
-    description = description,
-    title = title,
-    article = article
-)
-
-iface.launch()
+from predict import predict_label
+
+# Create the list of examples to be loaded
+example_list = glob.glob("examples/*")
+example_list = list(map(lambda el: [el], example_list))
+
+demo = gr.Blocks()
+
+with demo:
+    gr.Markdown("# **<p align='center'>Video Vision Transformer on medmnist</p>**")
+
+    with gr.Tabs():
+        with gr.TabItem("Upload & Predict"):
+            with gr.Box():
+                with gr.Row():
+                    input_video = gr.Video(label="Input Video", show_label=True)
+                    output_label = gr.Label(label="Model Output", show_label=True)
+
+            gr.Markdown("**Predict**")
+
+            with gr.Box():
+                with gr.Row():
+                    submit_button = gr.Button("Submit")
+
+    gr.Markdown("Examples")
+    gr.Markdown("The model is trained to classify videos belonging to the following classes: liver, kidney-right, kidney-left, femur-right, femur-left, bladder, heart, lung-right, lung-left, spleen, pancreas.")
+
+    with gr.Column():
+        gr.Examples(example_list, [input_video], [output_label], predict_label, cache_examples=True)
+
+    submit_button.click(predict_label, inputs=input_video, outputs=output_label)
+
+    gr.Markdown('\n Demo created by: <a href="https://huggingface.co/pablorodriper"> Pablo Rodríguez</a>. Based on the Keras example by <a href="https://keras.io/examples/vision/vivit/">Aritra Roy Gosthipaty and Ayush Thakur</a>')
+
+demo.launch()
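Note: the new app.py globs an examples/ directory, but no example files are included in this commit, and gr.Examples with cache_examples=True will run predict_label on each example at startup. For local testing, a clip can be synthesized with OpenCV. A minimal sketch, assuming the model consumes short grayscale clips (OrganMNIST3D volumes are 28×28×28, so 28 frames of 28×28 is a plausible shape); the file name, codec, and frame rate below are placeholders, not part of the commit:

```python
import os

import cv2
import numpy as np

# Hypothetical helper (not part of the commit): write a random 28-frame
# grayscale clip so gr.Examples has a file to load and cache locally.
def write_example_clip(path="examples/sample.mp4", n_frames=28, size=28):
    os.makedirs(os.path.dirname(path), exist_ok=True)
    fourcc = cv2.VideoWriter_fourcc(*"mp4v")
    writer = cv2.VideoWriter(path, fourcc, 10.0, (size, size), isColor=False)
    for _ in range(n_frames):
        # isColor=False expects single-channel 8-bit frames
        frame = np.random.randint(0, 256, (size, size), dtype=np.uint8)
        writer.write(frame)
    writer.release()

write_example_clip()
```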
predict.py ADDED
@@ -0,0 +1,54 @@
+import cv2
+# import imageio
+import numpy as np
+import tensorflow as tf
+from huggingface_hub import from_pretrained_keras
+from tensorflow.keras.optimizers import Adam
+
+from constants import LEARNING_RATE
+
+
+def predict_label(path):
+    frames = load_video(path)
+    model = get_model()
+    prediction = model.predict(tf.expand_dims(frames, axis=0))[0]
+    label = np.argmax(prediction, axis=0)
+
+    return label
+
+
+def load_video(path):
+    """
+    Load a video from path and return an array of frames.
+    The video is converted to grayscale because that is the format expected by the model.
+    """
+    cap = cv2.VideoCapture(path)
+    frames = []
+    try:
+        while True:
+            ret, frame = cap.read()
+            if not ret:
+                break
+            frame = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
+            frames.append(frame)
+    finally:
+        cap.release()
+    return np.array(frames)
+
+
+def get_model():
+    """
+    Download the model from the Hugging Face Hub and compile it.
+    """
+    model = from_pretrained_keras("pablorodriper/video-vision-transformer")
+
+    model.compile(
+        optimizer=Adam(learning_rate=LEARNING_RATE),
+        loss="sparse_categorical_crossentropy",
+        # metrics=[
+        #     keras.metrics.SparseCategoricalAccuracy(name="accuracy"),
+        #     keras.metrics.SparseTopKCategoricalAccuracy(5, name="top-5-accuracy"),
+        # ],
+    )
+
+    return model
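predict.py imports LEARNING_RATE from a constants module that is not part of this commit. A minimal placeholder, with the value assumed from the upstream Keras ViViT example rather than taken from this repository:

```python
# constants.py — hypothetical stand-in; the value is an assumption borrowed
# from the Keras ViViT example, not confirmed by this commit.
LEARNING_RATE = 1e-4
```

Also, predict_label returns a bare class index, while the class names only appear in the app's markdown. If readable labels are wanted, the index could be mapped back with the list from the previous app.py; the ordering is assumed to match the model's output head:

```python
from predict import predict_label

# Label list copied from the old app.py; order assumed to match the model.
LABELS = ['liver', 'kidney-right', 'kidney-left', 'femur-right', 'femur-left',
          'bladder', 'heart', 'lung-right', 'lung-left', 'spleen', 'pancreas']

idx = predict_label("examples/sample.mp4")  # hypothetical example file
print(LABELS[int(idx)])
```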