from ctransformers import AutoModelForCausalLM

# Load the Vigostral 7B chat model once at module import time and expose it
# as the module-level name `model`.
#
# - The first argument is the model path or repo id handed to ctransformers
#   (here it looks like a Hugging Face Hub repo id -- confirm if a local
#   path is intended instead).
# - `model_file` picks one specific GGUF file out of that location; the
#   "Q4_K_M" part of the name presumably denotes the quantization variant.
# - `model_type="mistral"` tells ctransformers which architecture to use
#   when reading the file.
# - `threads=3` is forwarded as a config option; per the ctransformers
#   documentation it sets the number of threads used for evaluation.
#   NOTE(review): tune this to the CPU cores available on the target host.
model = AutoModelForCausalLM.from_pretrained(
    "TheBloke/Vigostral-7B-Chat-GGUF",
    model_file="vigostral-7b-chat.Q4_K_M.gguf",
    model_type="mistral",
    threads=3,
)