"""Gradio launcher script.

Loads the model identified by ``MODEL_ID`` through Gradio's loader and
starts the resulting interface with ``launch()``.
"""
import gradio as gr

# Identifier passed verbatim to the Gradio loader.
MODEL_ID = "models/concise/LLaMa_V2-13B-Chat-Unquantized-HF"

# NOTE(review): newer Gradio releases expose the loader as top-level
# `gr.load`, and `gr.Interface.load` is believed to be deprecated/removed
# there -- confirm against the pinned Gradio version. Falling back keeps the
# script working on older installs that only provide `gr.Interface.load`.
_load = getattr(gr, "load", None) or gr.Interface.load

_load(MODEL_ID).launch()