Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -11,7 +11,7 @@ llm = Llama(
|
|
| 11 |
filename=os.environ.get("MODEL_FILE", "Phi-3-mini-4k-instruct-q4.gguf"),
|
| 12 |
),
|
| 13 |
n_ctx=2048,
|
| 14 |
-
n_gpu_layers
|
| 15 |
)
|
| 16 |
|
| 17 |
|
|
|
|
| 11 |
filename=os.environ.get("MODEL_FILE", "Phi-3-mini-4k-instruct-q4.gguf"),
|
| 12 |
),
|
| 13 |
n_ctx=2048,
|
| 14 |
+
n_gpu_layers=-1, # change n_gpu_layers if you have more or less VRAM
|
| 15 |
)
|
| 16 |
|
| 17 |
|