ininini committed on
Commit
548d8df
·
verified ·
1 Parent(s): 1275a84

(Trained with Unsloth)

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -7,6 +7,7 @@
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 128000,
9
  "eos_token_id": 128001,
 
10
  "hidden_act": "silu",
11
  "hidden_size": 4096,
12
  "initializer_range": 0.02,
@@ -24,8 +25,8 @@
24
  "rope_theta": 500000.0,
25
  "tie_word_embeddings": false,
26
  "torch_dtype": "bfloat16",
27
- "transformers_version": "4.44.2",
28
- "unsloth_version": "2024.10.7",
29
  "use_cache": true,
30
  "vocab_size": 128256
31
  }
 
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 128000,
9
  "eos_token_id": 128001,
10
+ "head_dim": 128,
11
  "hidden_act": "silu",
12
  "hidden_size": 4096,
13
  "initializer_range": 0.02,
 
25
  "rope_theta": 500000.0,
26
  "tie_word_embeddings": false,
27
  "torch_dtype": "bfloat16",
28
+ "transformers_version": "4.46.2",
29
+ "unsloth_version": "2024.12.1",
30
  "use_cache": true,
31
  "vocab_size": 128256
32
  }
generation_config.json CHANGED
@@ -7,5 +7,5 @@
7
  ],
8
  "max_length": 8192,
9
  "pad_token_id": 128255,
10
- "transformers_version": "4.44.2"
11
  }
 
7
  ],
8
  "max_length": 8192,
9
  "pad_token_id": 128255,
10
+ "transformers_version": "4.46.2"
11
  }
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82caa8d960fcb2b142e0827452d4224e36a8fc8d2058a2d0db8a33575915c3f9
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49b52bc593846d2725257c3d0c3afb13fc1b13826ac28a99a173378dcdf2ff9d
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53c2735889efa0ddfbba5d9e96d6ccb87c776bc83fe4995358fff15785ee1de5
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2cac6a19d314302ed7a5826ed35496d69a4a5224d6379d5de62672659bedfb1
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d4eff0292aa3c0c4a5d4624d5d7ff0b2d8e390fe2aa32b0f566bb679fb4ebda3
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45f34e189d8cf21a17ace5061e45b87c7fb5666e17632bb0c8a9124e6573777a
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d9956845114b093cd05f8087ed588850db49f38c3978ddd65ff1b9dc62a5d26
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:228d85ffcc041c9130a60cc91b596849838823dce00fbb95b24f7eb4d17caca0
3
  size 1168138808
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff