Ubuntu
committed on
Commit
·
f5967fa
1
Parent(s):
9d5d9c2
Mixtral - branch gptq-4bit-32g-actorder_True
Browse files
- config.json +55 -0
- generation_config.json +6 -0
- model-00001-of-00036.safetensors +3 -0
- model-00002-of-00036.safetensors +3 -0
- model-00003-of-00036.safetensors +3 -0
- model-00004-of-00036.safetensors +3 -0
- model-00005-of-00036.safetensors +3 -0
- model-00006-of-00036.safetensors +3 -0
- model-00007-of-00036.safetensors +3 -0
- model-00008-of-00036.safetensors +3 -0
- model-00009-of-00036.safetensors +3 -0
- model-00010-of-00036.safetensors +3 -0
- model-00011-of-00036.safetensors +3 -0
- model-00012-of-00036.safetensors +3 -0
- model-00013-of-00036.safetensors +3 -0
- model-00014-of-00036.safetensors +3 -0
- model-00015-of-00036.safetensors +3 -0
- model-00016-of-00036.safetensors +3 -0
- model-00017-of-00036.safetensors +3 -0
- model-00018-of-00036.safetensors +3 -0
- model-00019-of-00036.safetensors +3 -0
- model-00020-of-00036.safetensors +3 -0
- model-00021-of-00036.safetensors +3 -0
- model-00022-of-00036.safetensors +3 -0
- model-00023-of-00036.safetensors +3 -0
- model-00024-of-00036.safetensors +3 -0
- model-00025-of-00036.safetensors +3 -0
- model-00026-of-00036.safetensors +3 -0
- model-00027-of-00036.safetensors +3 -0
- model-00028-of-00036.safetensors +3 -0
- model-00029-of-00036.safetensors +3 -0
- model-00030-of-00036.safetensors +3 -0
- model-00031-of-00036.safetensors +3 -0
- model-00032-of-00036.safetensors +3 -0
- model-00033-of-00036.safetensors +3 -0
- model-00034-of-00036.safetensors +3 -0
- model-00035-of-00036.safetensors +3 -0
- model-00036-of-00036.safetensors +3 -0
- model.safetensors.index.json +0 -0
- special_tokens_map.json +23 -0
- tokenizer.json +0 -0
- tokenizer.model +3 -0
- tokenizer_config.json +43 -0
config.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "TheBloke/Mixtral-8x7B-Instruct-v0.1-GPTQ",
|
3 |
+
"architectures": [
|
4 |
+
"MixtralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 1,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 4096,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 14336,
|
13 |
+
"max_position_embeddings": 32768,
|
14 |
+
"model_type": "mixtral",
|
15 |
+
"num_attention_heads": 32,
|
16 |
+
"num_experts_per_tok": 2,
|
17 |
+
"num_hidden_layers": 32,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"num_local_experts": 8,
|
20 |
+
"output_router_logits": false,
|
21 |
+
"pad_token_id": 0,
|
22 |
+
"pretraining_tp": 1,
|
23 |
+
"quantization_config": {
|
24 |
+
"batch_size": 1,
|
25 |
+
"bits": 4,
|
26 |
+
"block_name_to_quantize": null,
|
27 |
+
"cache_block_outputs": true,
|
28 |
+
"damp_percent": 0.1,
|
29 |
+
"dataset": null,
|
30 |
+
"desc_act": true,
|
31 |
+
"exllama_config": {
|
32 |
+
"version": 1
|
33 |
+
},
|
34 |
+
"group_size": 32,
|
35 |
+
"max_input_length": null,
|
36 |
+
"model_seqlen": null,
|
37 |
+
"module_name_preceding_first_block": null,
|
38 |
+
"pad_token_id": null,
|
39 |
+
"quant_method": "gptq",
|
40 |
+
"sym": true,
|
41 |
+
"tokenizer": null,
|
42 |
+
"true_sequential": true,
|
43 |
+
"use_cuda_fp16": false,
|
44 |
+
"use_exllama": true
|
45 |
+
},
|
46 |
+
"rms_norm_eps": 1e-05,
|
47 |
+
"rope_theta": 1000000.0,
|
48 |
+
"router_aux_loss_coef": 0.02,
|
49 |
+
"sliding_window": 4096,
|
50 |
+
"tie_word_embeddings": false,
|
51 |
+
"torch_dtype": "float16",
|
52 |
+
"transformers_version": "4.36.2",
|
53 |
+
"use_cache": true,
|
54 |
+
"vocab_size": 32000
|
55 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"transformers_version": "4.36.2"
|
6 |
+
}
|
model-00001-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74c41bdc04cd199fbf435b91d3c4a2bc704645a17e23c138aa68c015ff39dd7f
|
3 |
+
size 796482960
|
model-00002-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b0679092928de50266c21540283e46106ec0d2b7eb973b2b1a6ca5b6f028706
|
3 |
+
size 772385112
|
model-00003-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f6e4f5604b11c154b54aa812a07a0c9ce1e49691a4918066443d45ec0d43416
|
3 |
+
size 772405472
|
model-00004-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31dbc81c32f81e637cc97bbce70e73bd63ca637bd102e93228e508d72c8edda4
|
3 |
+
size 772384992
|
model-00005-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6eb43fd7bfafd8767fa3bb2f312ac32202b78778e84fcf8df190f79e5a04397
|
3 |
+
size 772384992
|
model-00006-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8cf895d407c7b79d57cd259449694b6c527e66c4999dd8bf38ff1f782af915c2
|
3 |
+
size 772405472
|
model-00007-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b97511661a1b8510418ce55e263f0c919e3782d07356b2994ba34893359382b0
|
3 |
+
size 772384992
|
model-00008-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dde535592fb511435172e6644fdbb3c7c4699e7017c4a03af817cbfed72a9d57
|
3 |
+
size 772384992
|
model-00009-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46ffab1278b42c047208459b0fdf6c2aefe7c551ccf2e9728fca435bbdd9c953
|
3 |
+
size 794230528
|
model-00010-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1f4520e191551d6e8a79f83eee982dfc955e04074fd433a0204b8af6cdc42ef
|
3 |
+
size 794178632
|
model-00011-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd93c715ab02b6429726354f6e840933cd8cb576e6344a3fb088a1a1ad819403
|
3 |
+
size 772384992
|
model-00012-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89362b5e06a50690332eefe471177cf3e542f471dfef50afc9a312254004dc37
|
3 |
+
size 772385112
|
model-00013-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2cd538781db218dea37c567c0a725a28eac8bbaef7a1c096d4d09ec06a088bf3
|
3 |
+
size 772405608
|
model-00014-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a9dbb4ad1a1082da436a98e79d6f5fad763132c23ad3d76e9f52eaf221d0153
|
3 |
+
size 772385128
|
model-00015-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04fa52c37f9680803c6a83b8961cd3958d01ccded8766d2b9413cfba2bf846a0
|
3 |
+
size 772385128
|
model-00016-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a48c0c54d73b16b61f98eeafc59095e1710bc277d5378d6475cf916063bb2231
|
3 |
+
size 772405608
|
model-00017-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a6642a61c6bb5e4c8dfac1908ffa771336307437d25063de277a0a25a5b30bd
|
3 |
+
size 772385128
|
model-00018-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38e04ab6bdf2706963db5cc150e15cd4924526b217dfc9242d00697ac02c0c2e
|
3 |
+
size 772385128
|
model-00019-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f2fe12652acb2a89e1497ce8c1e0f14e7c43a1301eebe170b8809a99a9a1ba7
|
3 |
+
size 772405608
|
model-00020-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f402e8e381fb28624d75278736137bd3c7baf761c76c06a796edb0d884b7ee3
|
3 |
+
size 772385128
|
model-00021-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4803ddbab527d83a7e814de42825d8aa474907c81bebabb43fe997ec9ce1ead0
|
3 |
+
size 772385128
|
model-00022-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:246b765a3fc2017b305347dcd011d0a28a60a66353ed6613aaf95f66a8be3e5b
|
3 |
+
size 794230656
|
model-00023-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5cfcbe8afd1dd9b734def6313f26782934cc2f5f3f770c377c20b57e8e8d29f
|
3 |
+
size 794178752
|
model-00024-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec92d73e337223a42970798d3c70dc529256c964d8b75173342421f77734a061
|
3 |
+
size 772385128
|
model-00025-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a62e0851f46134626d379595d531a1938279bf56cd641f28566f26dfce4450e4
|
3 |
+
size 772385128
|
model-00026-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9796b576490c20144cd0d6029a57da1b54d377ae34f113eeccc4fb0ea5f57cd
|
3 |
+
size 772405608
|
model-00027-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23ba69560fb6a76631846cfd402c55afbef1b934eedbcc7cc853a21878934e5f
|
3 |
+
size 772385128
|
model-00028-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e19d3784e340c111fee7dd7aa24101da753c7f069718973e150d49c9effff5a7
|
3 |
+
size 772385128
|
model-00029-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7fb225896bfccbe9687724435f7bc7f544f2cb396c4d62146ec0f3d3a335d83d
|
3 |
+
size 772405608
|
model-00030-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad5d5209ce5d6bfee4dff7ef9f59cbdcfe067ad362449312c8f651e0e50f16f1
|
3 |
+
size 772385128
|
model-00031-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62f52ee97b5bfceacdf16a23a7570f15dd4d179ec947603b40bd1618c9882654
|
3 |
+
size 772385128
|
model-00032-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:563652ca12dff1933d8c3be31cffc9bd16511915457a9e206bde09e8231c771f
|
3 |
+
size 772405608
|
model-00033-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a35690e08ff2beb2b64ff3c5f0a5784202c4632e2e42086a34494783f549bfed
|
3 |
+
size 772385128
|
model-00034-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e568341142afe7e9f69dd74ab596a7d13a81fe1e3d828809764269a2910b16a
|
3 |
+
size 772385128
|
model-00035-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11162a62cb1dfa562dd64cd90d4c3321ae74ac1860d19458b749d286cd213672
|
3 |
+
size 782070648
|
model-00036-of-00036.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7d0c42f0bc6af0aa7f77bccf3b1c818c97e6a898386bddea1eea2ffdb70c8b6
|
3 |
+
size 262144128
|
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
special_tokens_map.json
ADDED
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "</s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": false,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"unk_token": {
|
17 |
+
"content": "<unk>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": false,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
}
|
23 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dadfd56d766715c61d2ef780a525ab43b8e6da4de6865bda3d95fdef5e134055
|
3 |
+
size 493443
|
tokenizer_config.json
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_bos_token": true,
|
3 |
+
"add_eos_token": false,
|
4 |
+
"added_tokens_decoder": {
|
5 |
+
"0": {
|
6 |
+
"content": "<unk>",
|
7 |
+
"lstrip": false,
|
8 |
+
"normalized": false,
|
9 |
+
"rstrip": false,
|
10 |
+
"single_word": false,
|
11 |
+
"special": true
|
12 |
+
},
|
13 |
+
"1": {
|
14 |
+
"content": "<s>",
|
15 |
+
"lstrip": false,
|
16 |
+
"normalized": false,
|
17 |
+
"rstrip": false,
|
18 |
+
"single_word": false,
|
19 |
+
"special": true
|
20 |
+
},
|
21 |
+
"2": {
|
22 |
+
"content": "</s>",
|
23 |
+
"lstrip": false,
|
24 |
+
"normalized": false,
|
25 |
+
"rstrip": false,
|
26 |
+
"single_word": false,
|
27 |
+
"special": true
|
28 |
+
}
|
29 |
+
},
|
30 |
+
"additional_special_tokens": [],
|
31 |
+
"bos_token": "<s>",
|
32 |
+
"chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ '[INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}",
|
33 |
+
"clean_up_tokenization_spaces": false,
|
34 |
+
"eos_token": "</s>",
|
35 |
+
"legacy": true,
|
36 |
+
"model_max_length": 1000000000000000019884624838656,
|
37 |
+
"pad_token": null,
|
38 |
+
"sp_model_kwargs": {},
|
39 |
+
"spaces_between_special_tokens": false,
|
40 |
+
"tokenizer_class": "LlamaTokenizer",
|
41 |
+
"unk_token": "<unk>",
|
42 |
+
"use_default_system_prompt": false
|
43 |
+
}
|