Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- config.json +38 -0
- generation_config.json +6 -0
- model-00001-of-00189.safetensors +3 -0
- model-00002-of-00189.safetensors +3 -0
- model-00003-of-00189.safetensors +3 -0
- model-00004-of-00189.safetensors +3 -0
- model-00005-of-00189.safetensors +3 -0
- model-00006-of-00189.safetensors +3 -0
- model-00007-of-00189.safetensors +3 -0
- model-00008-of-00189.safetensors +3 -0
- model-00009-of-00189.safetensors +3 -0
- model-00010-of-00189.safetensors +3 -0
- model-00011-of-00189.safetensors +3 -0
- model-00012-of-00189.safetensors +3 -0
- model-00013-of-00189.safetensors +3 -0
- model-00014-of-00189.safetensors +3 -0
- model-00015-of-00189.safetensors +3 -0
- model-00016-of-00189.safetensors +3 -0
- model-00017-of-00189.safetensors +3 -0
- model-00018-of-00189.safetensors +3 -0
- model-00019-of-00189.safetensors +3 -0
- model-00020-of-00189.safetensors +3 -0
- model-00021-of-00189.safetensors +3 -0
- model-00022-of-00189.safetensors +3 -0
- model-00023-of-00189.safetensors +3 -0
- model-00024-of-00189.safetensors +3 -0
- model-00025-of-00189.safetensors +3 -0
- model-00026-of-00189.safetensors +3 -0
- model-00027-of-00189.safetensors +3 -0
- model-00028-of-00189.safetensors +3 -0
- model-00029-of-00189.safetensors +3 -0
- model-00030-of-00189.safetensors +3 -0
- model-00031-of-00189.safetensors +3 -0
- model-00032-of-00189.safetensors +3 -0
- model-00033-of-00189.safetensors +3 -0
- model-00034-of-00189.safetensors +3 -0
- model-00035-of-00189.safetensors +3 -0
- model-00036-of-00189.safetensors +3 -0
- model-00037-of-00189.safetensors +3 -0
- model-00038-of-00189.safetensors +3 -0
- model-00039-of-00189.safetensors +3 -0
- model-00040-of-00189.safetensors +3 -0
- model-00041-of-00189.safetensors +3 -0
- model-00042-of-00189.safetensors +3 -0
- model-00043-of-00189.safetensors +3 -0
- model-00044-of-00189.safetensors +3 -0
- model-00045-of-00189.safetensors +3 -0
- model-00046-of-00189.safetensors +3 -0
- model-00047-of-00189.safetensors +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "Nemotron-4-340B-Base-hf",
|
3 |
+
"architectures": [
|
4 |
+
"NemotronForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 2,
|
9 |
+
"eos_token_id": 3,
|
10 |
+
"head_dim": 192,
|
11 |
+
"hidden_act": "relu2",
|
12 |
+
"hidden_size": 18432,
|
13 |
+
"initializer_range": 0.0063,
|
14 |
+
"intermediate_size": 73728,
|
15 |
+
"max_position_embeddings": 4096,
|
16 |
+
"mlp_bias": false,
|
17 |
+
"model_type": "nemotron",
|
18 |
+
"norm_eps": 1e-05,
|
19 |
+
"num_attention_heads": 96,
|
20 |
+
"num_hidden_layers": 96,
|
21 |
+
"num_key_value_heads": 8,
|
22 |
+
"quantization_config": {
|
23 |
+
"activation_scheme": "dynamic",
|
24 |
+
"ignored_layers": [
|
25 |
+
"lm_head"
|
26 |
+
],
|
27 |
+
"quant_method": "fp8"
|
28 |
+
},
|
29 |
+
"rope_percent": 0.5,
|
30 |
+
"rope_percentage": 0.5,
|
31 |
+
"rope_scaling": null,
|
32 |
+
"rope_theta": 10000,
|
33 |
+
"tie_word_embeddings": false,
|
34 |
+
"torch_dtype": "bfloat16",
|
35 |
+
"transformers_version": "4.43.0.dev0",
|
36 |
+
"use_cache": true,
|
37 |
+
"vocab_size": 256000
|
38 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 2,
|
4 |
+
"eos_token_id": 3,
|
5 |
+
"transformers_version": "4.43.0.dev0"
|
6 |
+
}
|
model-00001-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:492e67d00b85927fd5106a5fcc61933a93a4da2ba3dab19ad84df45908d22f2c
|
3 |
+
size 9437184112
|
model-00002-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:206eb1589c0ec52919a0bd5fb6bba6454cc0a5b62c987675b1b5c2e0a9551cf0
|
3 |
+
size 2095055948
|
model-00003-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e22dc1406f95a7cc26fb7ccb637142678fe94c45d818ee9d7c23e95b885d4a54
|
3 |
+
size 2095203836
|
model-00004-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0cb7e046722c5d7b8453d84df84c9d2b37a6963c55d470d77ed6c193a470e494
|
3 |
+
size 1358954708
|
model-00005-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a6fc66b6dc8d3bc39fbd88ffd670ede2b54d32151f7a344908de89223b14a12
|
3 |
+
size 2095203836
|
model-00006-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa95ca271a1119e2e6ff98c86a50672a110a29ccb14bb5ed01c637813a63b20a
|
3 |
+
size 1358954708
|
model-00007-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3a0f5447817fda87bac0566c5a0061cd445acb79529d6f781da05c8863f2297
|
3 |
+
size 2095203836
|
model-00008-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f5da863a3e6ad19422f9f75d9e6f9a4b279053185201298974b9ec6ac0dcbb5
|
3 |
+
size 1358954708
|
model-00009-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8d53665f8e452a4cc6b670304c9f9acb2ab3fc96912768b8267d9182c08c01f
|
3 |
+
size 2095203836
|
model-00010-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4c94783835bfe7e3b999687b98925c05cd0d38febc74ce8129820813731fddf
|
3 |
+
size 1358954708
|
model-00011-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:941968406fabb8602f1145d9e0e728780f83be55c85bdb9420319b943d83a749
|
3 |
+
size 2095203836
|
model-00012-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b45a29bc8265bd68003ec4c6cd9d967456a61d36b22087fc290368ccb7b4ab1c
|
3 |
+
size 1358954708
|
model-00013-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5f3c588f6c289165d22def9abdde4af230b78cd5697ce962593d3ffb38486c4
|
3 |
+
size 2095203836
|
model-00014-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:197befcef18e6f1ee2634db13ae3f114aff3fd6d32979cd15f7db3ce1361cd9e
|
3 |
+
size 1358954708
|
model-00015-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96540f02c449ad300d9764a9bc98698fef35d8b374e6b35d2709ed7fa04a0364
|
3 |
+
size 2095203836
|
model-00016-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6b33f3c82e2462a3852fc80459c27b5eda495cbf7efdb5fd384dd6ffec8aa7c
|
3 |
+
size 1358954708
|
model-00017-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcee331e8c683d4d5bcec6568d96360221496d3588cd5d255e4401e847938bb5
|
3 |
+
size 2095203836
|
model-00018-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2dedde9514dcd9b03a33f1b6f4bf54c14e16ee6d14a6a01bcfdb7b4864b239b5
|
3 |
+
size 1358954708
|
model-00019-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:132daf633959e27797a12924f82c5079f76018a1ecf1f26a10a0f0eabf8d3442
|
3 |
+
size 2095203836
|
model-00020-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78fbe48f9aadff8af34d7d9761ddb5d84ea00d640b788dfa9f82af36cbd45ba0
|
3 |
+
size 1358954708
|
model-00021-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5af142a24bedec15cbfaf0ace484cbdf9ff01a2b4b99f72a85c98e5dddea145
|
3 |
+
size 2095203836
|
model-00022-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:679060a348a979ff966fbf89fccceec278b0176b58199395b659ef6001324a0d
|
3 |
+
size 1358954716
|
model-00023-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c02f136ad71ba9947022ffee91b71a7bdf60d1a72111a0fe681e6a6ad9364ec7
|
3 |
+
size 2095203852
|
model-00024-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac2e54c71d5a7fb7e214c1121c7737fd495ee1cdd7cbbfe22a1013b3ad3fbfdd
|
3 |
+
size 1358954716
|
model-00025-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cc4137de93bf43bd726f822d5ecc0fb3462cf887ba0de4d327c075aa31703c0
|
3 |
+
size 2095203852
|
model-00026-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2990fdbcd669429ae8cb740013755ffb02b6be9600e2eff431621bd005a9164
|
3 |
+
size 1358954716
|
model-00027-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94c7e42d62da64c135874372113cdcfc67398867222883b8a22c5ae72dc83606
|
3 |
+
size 2095203852
|
model-00028-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b5eee630e2f6f7a16a610d6811cb640c1ff61442a1ccbfc0fd48644ccdf3c5e
|
3 |
+
size 1358954716
|
model-00029-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d93081ad2411540e79148032d85f521c5fa1c22b63b19d36ba373811fd549ad1
|
3 |
+
size 2095203852
|
model-00030-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:749ac01f582ca0c981e8b3afa20c5fae32b3022e426054d179ff002a97928a6c
|
3 |
+
size 1358954716
|
model-00031-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5f96672bb43116626c47df7d139dbc5fb9cfe7a56bfaf5d90c9ae7a60c845b1b
|
3 |
+
size 2095203852
|
model-00032-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c5cfaa532708b5befa6145eeb37a0ad761cb8d103fd316ccc5b7404731b77ef
|
3 |
+
size 1358954716
|
model-00033-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b742f787298466e033701ab75be0616836ba85fad05a341482cd801297416593
|
3 |
+
size 2095203852
|
model-00034-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75f57a0c96f25c1f6c58a1a7739226bdf12ef6a17a713900a7e6dfa81aa748fd
|
3 |
+
size 1358954716
|
model-00035-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8cbd533f9e874956f922a85535b37303009dd6254f6c014f376f4c7470ab17c4
|
3 |
+
size 2095203852
|
model-00036-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4be0f31cac813940a69778066be18a8565b094734c73a5fc54749634ab3e1468
|
3 |
+
size 1358954716
|
model-00037-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57e5a9c28a897b2ac80321a1053c02cf610f0d1895ba72ffba47fa4643f9e556
|
3 |
+
size 2095203852
|
model-00038-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce7b84d7e0ede36de80d854d4140cfb8c0f66b5af4977322ec8ade864ae6b964
|
3 |
+
size 1358954716
|
model-00039-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f85733ece4a869c5e4b50647000e04c83ab5867cc0f152165504c1d15b321555
|
3 |
+
size 2095203852
|
model-00040-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d71be466b49c450f5bb49cef853bc0d70e9713c4b88178297d3847bae631808
|
3 |
+
size 1358954716
|
model-00041-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c2efd9d258014378e422ead20ce17e50c3204822092bc9bbc0673fb521057d9
|
3 |
+
size 2095203852
|
model-00042-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0176156bd2ec62eab16e4568e1b2bdb4ecd8e29c6ae09975b254fd439f86e4cc
|
3 |
+
size 1358954716
|
model-00043-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47e072411cf28b82cbc9805fb81a8ee9e4e6480c585f2d4bd25d0268dfd831f1
|
3 |
+
size 2095203852
|
model-00044-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aef2efdcda387a1c9e1b2e16b5d34258fbe1970fc17ede4adec7e2d43e640676
|
3 |
+
size 1358954716
|
model-00045-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64f42af2ad24db779bc5866943455c9c53310db8817ec2244edcb04cb84f562f
|
3 |
+
size 2095203852
|
model-00046-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea9be991f8da98514148b6eca5fe6a66c35775ca2204dc8723c0e9b29c7be89f
|
3 |
+
size 1358954716
|
model-00047-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86c9fa06f9b0bd1d3b092361d662208be9c11b157a13f7c600ddb84f97b925dc
|
3 |
+
size 2095203852
|