Set "use_cache": true in config.json to significantly boost inference performance
#1
by
TheBloke
- opened
- config.json +1 -1
config.json
CHANGED
@@ -19,6 +19,6 @@
|
|
19 |
"tie_word_embeddings": false,
|
20 |
"torch_dtype": "bfloat16",
|
21 |
"transformers_version": "4.30.0.dev0",
|
22 |
-
"use_cache": false,
|
23 |
"vocab_size": 32000
|
24 |
}
|
|
|
19 |
"tie_word_embeddings": false,
|
20 |
"torch_dtype": "bfloat16",
|
21 |
"transformers_version": "4.30.0.dev0",
|
22 |
+
"use_cache": true,
|
23 |
"vocab_size": 32000
|
24 |
}
|