"""Gradio app that serves the Alibaba-NLP/gte-Qwen2-1.5B-instruct model.

The interface is built by ``gr.load`` from the model identifier and launched
as soon as this script runs.
"""

import gradio as gr

# Build the demo from the hosted model rather than defining a UI by hand.
# NOTE(review): ``provider="hf-inference"`` presumably selects the Hugging Face
# inference backend -- confirm against the installed Gradio version.
demo = gr.load(
    "models/Alibaba-NLP/gte-Qwen2-1.5B-instruct",
    provider="hf-inference",
)

# Launch at module level (no __main__ guard) to keep the original behavior.
demo.launch()