Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -41,11 +41,15 @@ def load_model():
|
|
41 |
repo_id="Mykes/med_phi3-mini-4k-GGUF",
|
42 |
filename="*Q4_K_M.gguf",
|
43 |
verbose=False,
|
44 |
-
n_ctx=1024,
|
45 |
-
n_batch=512,
|
46 |
-
n_threads=8,
|
47 |
-
use_mlock=True,
|
48 |
use_mmap=True,
|
|
|
|
|
|
|
|
|
|
|
49 |
)
|
50 |
|
51 |
llm = load_model()
|
|
|
41 |
repo_id="Mykes/med_phi3-mini-4k-GGUF",
|
42 |
filename="*Q4_K_M.gguf",
|
43 |
verbose=False,
|
44 |
+
n_ctx=256, # Reduced context window
|
45 |
+
n_batch=8, # Smaller batch size
|
46 |
+
n_threads=2, # Adjust based on your CPU cores
|
|
|
47 |
use_mmap=True,
|
48 |
+
# n_ctx=1024,
|
49 |
+
# n_batch=512,
|
50 |
+
# n_threads=8,
|
51 |
+
# use_mlock=True,
|
52 |
+
# use_mmap=True,
|
53 |
)
|
54 |
|
55 |
llm = load_model()
|