aspctu committed on
Commit
cafb432
·
verified ·
1 Parent(s): 941310e

Upload folder using huggingface_hub

Browse files
config.json ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "producer": {
3
+ "name": "modelopt",
4
+ "version": "0.13.1"
5
+ },
6
+ "architecture": "LlamaForCausalLM",
7
+ "dtype": "bfloat16",
8
+ "logits_dtype": "float16",
9
+ "num_hidden_layers": 80,
10
+ "num_attention_heads": 64,
11
+ "num_key_value_heads": 8,
12
+ "hidden_size": 8192,
13
+ "norm_epsilon": 1e-05,
14
+ "vocab_size": 128256,
15
+ "max_position_embeddings": 131072,
16
+ "hidden_act": "silu",
17
+ "use_parallel_embedding": true,
18
+ "embedding_sharding_dim": 0,
19
+ "quantization": {
20
+ "quant_algo": "FP8",
21
+ "kv_cache_quant_algo": "FP8"
22
+ },
23
+ "mapping": {
24
+ "world_size": 4,
25
+ "tp_size": 4,
26
+ "pp_size": 1
27
+ },
28
+ "head_size": 128,
29
+ "intermediate_size": 28672,
30
+ "position_embedding_type": "rope_gpt_neox",
31
+ "share_embedding_table": false,
32
+ "residual_mlp": false,
33
+ "bias": false,
34
+ "rotary_pct": 1.0,
35
+ "rank": 0,
36
+ "decoder": "llama",
37
+ "rmsnorm": true,
38
+ "lm_head_bias": false,
39
+ "rotary_base": 500000.0,
40
+ "rotary_scaling": {
41
+ "factor": 8.0,
42
+ "low_freq_factor": 1.0,
43
+ "high_freq_factor": 4.0,
44
+ "original_max_position_embeddings": 8192,
45
+ "rope_type": "llama3"
46
+ }
47
+ }
rank0.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf752fdda3bad306e9810cd81d56b474bea00e2a4c8dfac730c82e89581efa87
3
+ size 18166240288
rank1.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a3ebe57dfe93f624def6db92fa2fc6f3d748e9d29710cf258509ad68a3248de
3
+ size 18166240288
rank2.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68a0c0c4bfa846baa2a13e8a1f03540669660dce290ccd63263ba4845b6c142f
3
+ size 18166240288
rank3.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6a735a910c5b10bb2dfa23ea9e2f9365aaba51a37ba6c3d5badec95f085619f
3
+ size 18166240288