Qubitium committed on
Commit
2e840f6
·
verified ·
1 Parent(s): be8d061

compat changes for transformers 4.51.0-dev

Browse files

Transformers added native DeepSeek V3 support in a special branch, but it requires the `rope_scaling` config values (`beta_fast`, `beta_slow`, `factor`) to be floats rather than integers.

pip install git+https://github.com/huggingface/transformers@v4.50.3-DeepSeek-3

Files changed (1) hide show
  1. config.json +3 -3
config.json CHANGED
@@ -36,9 +36,9 @@
36
  "qk_rope_head_dim": 64,
37
  "rms_norm_eps": 1e-06,
38
  "rope_scaling": {
39
- "beta_fast": 32,
40
- "beta_slow": 1,
41
- "factor": 40,
42
  "mscale": 1.0,
43
  "mscale_all_dim": 1.0,
44
  "original_max_position_embeddings": 4096,
 
36
  "qk_rope_head_dim": 64,
37
  "rms_norm_eps": 1e-06,
38
  "rope_scaling": {
39
+ "beta_fast": 32.0,
40
+ "beta_slow": 1.0,
41
+ "factor": 40.0,
42
  "mscale": 1.0,
43
  "mscale_all_dim": 1.0,
44
  "original_max_position_embeddings": 4096,