gorkemgoknar commited on
Commit
a51d57b
1 Parent(s): e41429f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -158,7 +158,7 @@ from llama_cpp import Llama
158
  # set GPU_LAYERS to 15 if you have an 8GB GPU so both models can fit in
159
  # else 35 full layers + XTTS works fine on T4 16GB
160
  # 5gb per llm, 4gb XTTS -> full layers should fit T4 16GB , 2LLM + XTTS
161
- GPU_LAYERS=int(os.environ.get("GPU_LAYERS", 35))
162
 
163
  LLAMA_VERBOSE=False
164
  print("Running LLM Mistral")
 
158
  # set GPU_LAYERS to 15 if you have an 8GB GPU so both models can fit in
159
  # else 35 full layers + XTTS works fine on T4 16GB
160
  # 5gb per llm, 4gb XTTS -> full layers should fit T4 16GB , 2LLM + XTTS
161
+ GPU_LAYERS=int(os.environ.get("GPU_LAYERS", 30))
162
 
163
  LLAMA_VERBOSE=False
164
  print("Running LLM Mistral")