"""Launch a Gradio demo backed by a model hosted on the Hugging Face Hub."""

import gradio as gr

# Hub identifier handed to Gradio's loader; the "models/" prefix selects a
# hosted model (as opposed to a Space).
MODEL_ID = "models/manojkumarvohra/llama2-7B-Chat-hf-8bit-guanaco-pico-finetuned"

# Newer Gradio releases expose the loader as the top-level ``gr.load``, while
# older releases only provide ``gr.Interface.load``. Prefer the former and fall
# back to the latter so the script runs on either.
_load_demo = getattr(gr, "load", None) or gr.Interface.load

# Build the interface for the hosted model and start the web server.
demo = _load_demo(MODEL_ID)
demo.launch()