11104491
committed on
Commit
·
1999ad4
1
Parent(s):
637ee30
Update for vllm
Browse files
- config.json +6 -2
- configuration_bluelm.py +3 -3
config.json
CHANGED
@@ -20,12 +20,16 @@
|
|
20 |
"pad_token_id": 3,
|
21 |
"pretraining_tp": 1,
|
22 |
"rms_norm_eps": 1e-06,
|
23 |
-
"rope_scaling": null,
|
24 |
"rope_theta": 10000.0,
|
25 |
"tie_word_embeddings": false,
|
26 |
"torch_dtype": "bfloat16",
|
27 |
"transformers_version": "4.30.1",
|
28 |
"use_cache": true,
|
29 |
"use_stable_embedding": true,
|
30 |
-
"vocab_size": 100096
|
|
|
|
|
|
|
|
|
|
|
31 |
}
|
|
|
20 |
"pad_token_id": 3,
|
21 |
"pretraining_tp": 1,
|
22 |
"rms_norm_eps": 1e-06,
|
|
|
23 |
"rope_theta": 10000.0,
|
24 |
"tie_word_embeddings": false,
|
25 |
"torch_dtype": "bfloat16",
|
26 |
"transformers_version": "4.30.1",
|
27 |
"use_cache": true,
|
28 |
"use_stable_embedding": true,
|
29 |
+
"vocab_size": 100096,
|
30 |
+
"rope_scaling": {
|
31 |
+
"type": "ntkmixed",
|
32 |
+
"factor": 16.0,
|
33 |
+
"power": 0.3
|
34 |
+
}
|
35 |
}
|
configuration_bluelm.py
CHANGED
@@ -149,14 +149,14 @@ class BlueLMConfig(PretrainedConfig):
|
|
149 |
if self.rope_scaling is None:
|
150 |
return
|
151 |
|
152 |
-
if not isinstance(self.rope_scaling, dict) or len(self.rope_scaling) !=
|
153 |
raise ValueError(
|
154 |
-
"`rope_scaling` must be a dictionary with with
|
155 |
f"got {self.rope_scaling}"
|
156 |
)
|
157 |
rope_scaling_type = self.rope_scaling.get("type", None)
|
158 |
rope_scaling_factor = self.rope_scaling.get("factor", None)
|
159 |
-
if rope_scaling_type is None or rope_scaling_type not in ["linear", "dynamic"]:
|
160 |
raise ValueError(
|
161 |
f"`rope_scaling`'s type field must be one of ['linear', 'dynamic'], got {rope_scaling_type}"
|
162 |
)
|
|
|
149 |
if self.rope_scaling is None:
|
150 |
return
|
151 |
|
152 |
+
if not isinstance(self.rope_scaling, dict) or len(self.rope_scaling) != 3:
|
153 |
raise ValueError(
|
154 |
+
"`rope_scaling` must be a dictionary with with three fields, `type` , `factor` , `power`, "
|
155 |
f"got {self.rope_scaling}"
|
156 |
)
|
157 |
rope_scaling_type = self.rope_scaling.get("type", None)
|
158 |
rope_scaling_factor = self.rope_scaling.get("factor", None)
|
159 |
+
if rope_scaling_type is None or rope_scaling_type not in ["linear", "dynamic","ntkmixed"]:
|
160 |
raise ValueError(
|
161 |
f"`rope_scaling`'s type field must be one of ['linear', 'dynamic'], got {rope_scaling_type}"
|
162 |
)
|