schroneko's picture
Update app.py
29e0785 verified
raw
history blame
159 Bytes
import gradio as gr
import spaces
@spaces.GPU
def inference():
    """Build the Gradio demo for the Llama Guard 3 (8B, INT8) model.

    Returns:
        The object produced by ``gr.load`` for the ``models/``-prefixed
        repository id below.
    """
    # NOTE(review): ``gr.load`` is only a loader call; the reason this
    # function is wrapped in ``@spaces.GPU`` is not visible here --
    # presumably the Space needs a GPU-decorated function. Confirm before
    # removing the decorator.
    model_id = "models/meta-llama/Llama-Guard-3-8B-INT8"
    return gr.load(model_id)
# Build the interface at import time and keep it bound to the module-level
# name ``demo`` so anything that imports this module can still reach it.
demo = inference()

# Start the web server only when this file is executed as a script;
# a plain import must not launch a server as a side effect.
if __name__ == "__main__":
    demo.launch()