Commit
•
9bba2ff
1
Parent(s):
a0193c5
Upload folder using huggingface_hub
Browse files- .gitattributes +10 -0
- compiled/01886c79d2e2290329b5.neff +3 -0
- compiled/21bb7c0a42cf90e50397.neff +3 -0
- compiled/33e9e252ca991248848b.neff +3 -0
- compiled/724a5268523c1ff2528d.neff +3 -0
- compiled/7ff46eafba85ffbf903d.neff +3 -0
- compiled/8edd16aaf266fbcc8a14.neff +3 -0
- compiled/b7c1a7e934ab433f3bab.neff +3 -0
- compiled/e6807852b74c21fd73ba.neff +3 -0
- compiled/e7af477de1c621a495aa.neff +3 -0
- compiled/ff1d537043c19a18f1c8.neff +3 -0
- config.json +38 -0
- generation_config.json +6 -0
.gitattributes
CHANGED
@@ -33,3 +33,13 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
compiled/01886c79d2e2290329b5.neff filter=lfs diff=lfs merge=lfs -text
|
37 |
+
compiled/21bb7c0a42cf90e50397.neff filter=lfs diff=lfs merge=lfs -text
|
38 |
+
compiled/33e9e252ca991248848b.neff filter=lfs diff=lfs merge=lfs -text
|
39 |
+
compiled/724a5268523c1ff2528d.neff filter=lfs diff=lfs merge=lfs -text
|
40 |
+
compiled/7ff46eafba85ffbf903d.neff filter=lfs diff=lfs merge=lfs -text
|
41 |
+
compiled/8edd16aaf266fbcc8a14.neff filter=lfs diff=lfs merge=lfs -text
|
42 |
+
compiled/b7c1a7e934ab433f3bab.neff filter=lfs diff=lfs merge=lfs -text
|
43 |
+
compiled/e6807852b74c21fd73ba.neff filter=lfs diff=lfs merge=lfs -text
|
44 |
+
compiled/e7af477de1c621a495aa.neff filter=lfs diff=lfs merge=lfs -text
|
45 |
+
compiled/ff1d537043c19a18f1c8.neff filter=lfs diff=lfs merge=lfs -text
|
compiled/01886c79d2e2290329b5.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e1161e72e32d000d13a311712ed5e6a1acaa3f1f33c2a169719ee01e7721cd9
|
3 |
+
size 9237504
|
compiled/21bb7c0a42cf90e50397.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b565b85bd636bcc6f25adc9516de8cd2f908ade6a4390982a35e880db43c0bac
|
3 |
+
size 71998464
|
compiled/33e9e252ca991248848b.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b893444c9c6bcbadf0f9f735af5430f44f020e4755dee2f75da7ae1ace227131
|
3 |
+
size 9903104
|
compiled/724a5268523c1ff2528d.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:166c5edcf6825ecf9d62fd320c81ad74d81faf278ef1a31c0bf4d0440c99aeba
|
3 |
+
size 8172544
|
compiled/7ff46eafba85ffbf903d.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ed1077c5393410350790fad46e7441d9e16ad036fc573205603d5b439c52631
|
3 |
+
size 8500224
|
compiled/8edd16aaf266fbcc8a14.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d5d8b8e63a1c3352528066cb64ccebb26f4f170560fde14f8467ebea83dd585
|
3 |
+
size 26717184
|
compiled/b7c1a7e934ab433f3bab.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47d5064834a547b04013c19c02ff67587715a1b01e6575e6989779f6ac80d5b6
|
3 |
+
size 7926784
|
compiled/e6807852b74c21fd73ba.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a42ce4889517041806c8f65ec9b6da4f6fe2ee44d496e4cf57933f65f225b383
|
3 |
+
size 12534784
|
compiled/e7af477de1c621a495aa.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8edc3a716dfb771167ca6f21ad7b576b8dfd94eb228aa92f0a6dcccb85d59771
|
3 |
+
size 8039424
|
compiled/ff1d537043c19a18f1c8.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b43b46c132c1302d11b56348026c1ebfa931a7f11fc90133e0c2380accaed9d5
|
3 |
+
size 153693184
|
config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "HuggingFaceH4/zephyr-7b-beta",
|
3 |
+
"architectures": [
|
4 |
+
"MistralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 1,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 4096,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 14336,
|
13 |
+
"max_position_embeddings": 32768,
|
14 |
+
"model_type": "mistral",
|
15 |
+
"neuron": {
|
16 |
+
"auto_cast_type": "bf16",
|
17 |
+
"batch_size": 4,
|
18 |
+
"checkpoint_id": "HuggingFaceH4/zephyr-7b-beta",
|
19 |
+
"checkpoint_revision": "dc24cabd13eacd3ae3a5fe574bd645483a335a4a",
|
20 |
+
"compiler_type": "neuronx-cc",
|
21 |
+
"compiler_version": "2.12.54.0+f631c2365",
|
22 |
+
"num_cores": 2,
|
23 |
+
"sequence_length": 2048,
|
24 |
+
"task": "text-generation"
|
25 |
+
},
|
26 |
+
"num_attention_heads": 32,
|
27 |
+
"num_hidden_layers": 32,
|
28 |
+
"num_key_value_heads": 8,
|
29 |
+
"pad_token_id": 2,
|
30 |
+
"rms_norm_eps": 1e-05,
|
31 |
+
"rope_theta": 10000.0,
|
32 |
+
"sliding_window": 4096,
|
33 |
+
"tie_word_embeddings": false,
|
34 |
+
"torch_dtype": "bfloat16",
|
35 |
+
"transformers_version": "4.36.2",
|
36 |
+
"use_cache": true,
|
37 |
+
"vocab_size": 32000
|
38 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"transformers_version": "4.36.2"
|
6 |
+
}
|