"""Gradio entry point that builds and launches a demo for Llama-Guard-3-8B-INT8."""

import gradio as gr
import spaces


# NOTE(review): `spaces.GPU` wraps the function that *builds* the demo, not a
# per-request compute function. Presumably this is here so the hosting
# environment sees a GPU-decorated function at startup -- confirm it is intended.
@spaces.GPU
def inference():
    """Build and return the demo object for the hosted model.

    Returns:
        Whatever ``gr.load`` produces for the ``models/``-prefixed repo id
        below; the caller launches it via its ``launch()`` method.
    """
    return gr.load("models/meta-llama/Llama-Guard-3-8B-INT8")


# Kept at module level under the name `demo`, exactly as in the original
# script: building and launching on import/run is the script's whole purpose.
demo = inference()
demo.launch()