# Entry-point script: builds a Gradio demo for a hosted model and serves it.
#
# The original text had the import and the call fused on one physical line,
# which Python rejects with a SyntaxError; they are separate statements here.
import gradio as gr

# Identifier passed to gr.load; the "models/" prefix selects the model
# source (presumably the Hugging Face Hub -- confirm against Gradio docs).
MODEL_NAME = "models/01-ai/Yi-6B-Chat-8bits"

# Build the demo object from the model identifier.
demo = gr.load(MODEL_NAME)

# Start serving the demo; runs at module level, as in the original script.
demo.launch()