Text Generation
Transformers
Safetensors
mixtral
Not-For-All-Audiences
nsfw
text-generation-inference
Inference Endpoints
Upload folder using huggingface_hub
Browse files- config.json +34 -0
- model-00001-of-00023.safetensors +3 -0
- model-00002-of-00023.safetensors +3 -0
- model-00003-of-00023.safetensors +3 -0
- model-00004-of-00023.safetensors +3 -0
- model-00005-of-00023.safetensors +3 -0
- model-00006-of-00023.safetensors +3 -0
- model-00007-of-00023.safetensors +3 -0
- model-00008-of-00023.safetensors +3 -0
- model-00009-of-00023.safetensors +3 -0
- model-00010-of-00023.safetensors +3 -0
- model-00011-of-00023.safetensors +3 -0
- model-00012-of-00023.safetensors +3 -0
- model-00013-of-00023.safetensors +3 -0
- model-00014-of-00023.safetensors +3 -0
- model-00015-of-00023.safetensors +3 -0
- model-00016-of-00023.safetensors +3 -0
- model-00017-of-00023.safetensors +3 -0
- model-00018-of-00023.safetensors +3 -0
- model-00019-of-00023.safetensors +3 -0
- model-00020-of-00023.safetensors +3 -0
- model-00021-of-00023.safetensors +3 -0
- model-00022-of-00023.safetensors +3 -0
- model-00023-of-00023.safetensors +3 -0
- model.safetensors.index.json +0 -0
- special_tokens_map.json +24 -0
- tokenizer.json +0 -0
- tokenizer.model +3 -0
- tokenizer_config.json +42 -0
config.json
ADDED
@@ -0,0 +1,34 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "Undi95/Emerhyst-20B",
|
3 |
+
"architectures": [
|
4 |
+
"MixtralForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 5120,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 13824,
|
14 |
+
"max_position_embeddings": 32768,
|
15 |
+
"model_type": "mixtral",
|
16 |
+
"num_attention_heads": 40,
|
17 |
+
"num_experts_per_tok": 2,
|
18 |
+
"num_hidden_layers": 62,
|
19 |
+
"num_key_value_heads": 40,
|
20 |
+
"num_local_experts": 8,
|
21 |
+
"output_router_logits": false,
|
22 |
+
"pad_token_id": 0,
|
23 |
+
"pretraining_tp": 1,
|
24 |
+
"rms_norm_eps": 1e-05,
|
25 |
+
"rope_scaling": null,
|
26 |
+
"rope_theta": 10000.0,
|
27 |
+
"router_aux_loss_coef": 0.001,
|
28 |
+
"sliding_window": 4096,
|
29 |
+
"tie_word_embeddings": false,
|
30 |
+
"torch_dtype": "float16",
|
31 |
+
"transformers_version": "4.37.0.dev0",
|
32 |
+
"use_cache": false,
|
33 |
+
"vocab_size": 32000
|
34 |
+
}
|
model-00001-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:784f087ae632ff49c9fcced0856534c8954cb08a20ce113cda1f5f1bb8fa0df2
|
3 |
+
size 9998833048
|
model-00002-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6727c6b56909527763016c40d7a94d66c8680b1e41cce68c18c996edc8afd2b
|
3 |
+
size 9909052384
|
model-00003-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfca775a97a4fbd1201a5b56068b7ecf2c399e2a3760a99b890b5f76e645dd88
|
3 |
+
size 9909052392
|
model-00004-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a20e15b8f4db619631c2bcd315c5a32820f5840b2f17ba7aa8a7b1ce2f29de4
|
3 |
+
size 9909052400
|
model-00005-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46eb0d8f314c8bcbb82e8bf52ebfb5a64acdb8ae8aef811792cf31405d555ac1
|
3 |
+
size 9909052400
|
model-00006-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aed98cff47ae8a6ed2d707569b177170bdf720e7ffd85edaf2d95c5020a58ca9
|
3 |
+
size 9909052392
|
model-00007-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f58f1a5a7ff04b11cd58941fb7f615aae0c24ecca749209d5fa051c7ebf1683
|
3 |
+
size 9909052392
|
model-00008-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:754a5a2ee5d39e691cf52346e8b218ef5ba80ff94f007187ed3c49a29badc347
|
3 |
+
size 9909052336
|
model-00009-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a726384b3aac57662e94dc13ce5777cdc4f23b972fa61b0d8b75de8c266f54b
|
3 |
+
size 9909052376
|
model-00010-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8de3823ba6a205a989aab7a65e43c7b942b6245a825095bf3141c702032a6b2
|
3 |
+
size 9909052392
|
model-00011-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:734b72ec68f27923b50a49c15c2e305ba492590d8914a43fd992fd0056b7c0f7
|
3 |
+
size 9909052400
|
model-00012-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc0076638ce27eb03fae72591b2f736f9ceb68570c22fa0bca1307bd2506c73c
|
3 |
+
size 9909052400
|
model-00013-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6731fbf94a2966ce859b46707e4b0a8cf85b6a4c88854dd8fad660eb825298b4
|
3 |
+
size 9909052392
|
model-00014-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0128d96eb753f3c3a642b534b27c9ad30826a9dbc1c12e4ae9fafcdb0828109
|
3 |
+
size 9909052392
|
model-00015-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a0d9fcbfe4deb52ceade669f7adb81c99b415850fad94378b445198e356234a
|
3 |
+
size 9909052344
|
model-00016-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b158f331ae2a3894ed6f6236614c999d3409f589cfa5f0ca96ecdcc1013c517
|
3 |
+
size 9909052376
|
model-00017-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a58b077e9ba6624cf54c8615c1141210a9260a16ab4b5f65b54c69c0af0ddc7
|
3 |
+
size 9909052392
|
model-00018-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85b9189908f583babfa3c4cc472f4025874ffc49dcc0b2c12b8384bf7f27bd12
|
3 |
+
size 9909052392
|
model-00019-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3458b9cc506d0d01557d179a5a0100057b8c533640f0db3fd97f37b3b13570a8
|
3 |
+
size 9909052400
|
model-00020-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df944c39e1332fa3960751156f090331145237dafb1737bb584fe3972cf80f86
|
3 |
+
size 9909052392
|
model-00021-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7e837120934c5eb5c4786495a9eaab7b1cc907c90f1380b7b265d269dbfe72f
|
3 |
+
size 9909052392
|
model-00022-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65ab2913dc1048139f009ee5e7f30c58ce01ca4ff8c077f5752f56cb151d6897
|
3 |
+
size 9983103984
|
model-00023-of-00023.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:978f3305c1330c933bc613b4b29ca363675e318c1035715f050a88075eaa7098
|
3 |
+
size 6139269344
|
model.safetensors.index.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
special_tokens_map.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": false,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"eos_token": {
|
10 |
+
"content": "</s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": false,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"pad_token": "<s>",
|
17 |
+
"unk_token": {
|
18 |
+
"content": "<unk>",
|
19 |
+
"lstrip": false,
|
20 |
+
"normalized": false,
|
21 |
+
"rstrip": false,
|
22 |
+
"single_word": false
|
23 |
+
}
|
24 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer.model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
|
3 |
+
size 499723
|
tokenizer_config.json
ADDED
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_bos_token": true,
|
3 |
+
"add_eos_token": false,
|
4 |
+
"added_tokens_decoder": {
|
5 |
+
"0": {
|
6 |
+
"content": "<unk>",
|
7 |
+
"lstrip": false,
|
8 |
+
"normalized": false,
|
9 |
+
"rstrip": false,
|
10 |
+
"single_word": false,
|
11 |
+
"special": true
|
12 |
+
},
|
13 |
+
"1": {
|
14 |
+
"content": "<s>",
|
15 |
+
"lstrip": false,
|
16 |
+
"normalized": false,
|
17 |
+
"rstrip": false,
|
18 |
+
"single_word": false,
|
19 |
+
"special": true
|
20 |
+
},
|
21 |
+
"2": {
|
22 |
+
"content": "</s>",
|
23 |
+
"lstrip": false,
|
24 |
+
"normalized": false,
|
25 |
+
"rstrip": false,
|
26 |
+
"single_word": false,
|
27 |
+
"special": true
|
28 |
+
}
|
29 |
+
},
|
30 |
+
"bos_token": "<s>",
|
31 |
+
"clean_up_tokenization_spaces": false,
|
32 |
+
"eos_token": "</s>",
|
33 |
+
"legacy": false,
|
34 |
+
"model_max_length": 4096,
|
35 |
+
"pad_token": "<s>",
|
36 |
+
"padding_side": "left",
|
37 |
+
"sp_model_kwargs": {},
|
38 |
+
"spaces_between_special_tokens": false,
|
39 |
+
"tokenizer_class": "LlamaTokenizer",
|
40 |
+
"unk_token": "<unk>",
|
41 |
+
"use_default_system_prompt": true
|
42 |
+
}
|