jssky committed on
Commit
1b3fdc3
·
verified ·
1 Parent(s): 2f5cc74

End of training

Browse files
README.md CHANGED
@@ -116,7 +116,7 @@ xformers_attention: null
116
 
117
  This model is a fine-tuned version of [Maykeye/TinyLLama-v0](https://huggingface.co/Maykeye/TinyLLama-v0) on the None dataset.
118
  It achieves the following results on the evaluation set:
119
- - Loss: 10.4767
120
 
121
  ## Model description
122
 
@@ -153,8 +153,8 @@ The following hyperparameters were used during training:
153
  |:-------------:|:------:|:----:|:---------------:|
154
  | 10.7803 | 0.0055 | 1 | 10.8762 |
155
  | 10.5919 | 0.0166 | 3 | 10.8762 |
156
- | 10.8178 | 0.0332 | 6 | 10.7948 |
157
- | 10.8378 | 0.0499 | 9 | 10.4767 |
158
 
159
 
160
  ### Framework versions
 
116
 
117
  This model is a fine-tuned version of [Maykeye/TinyLLama-v0](https://huggingface.co/Maykeye/TinyLLama-v0) on the None dataset.
118
  It achieves the following results on the evaluation set:
119
+ - Loss: 10.4596
120
 
121
  ## Model description
122
 
 
153
  |:-------------:|:------:|:----:|:---------------:|
154
  | 10.7803 | 0.0055 | 1 | 10.8762 |
155
  | 10.5919 | 0.0166 | 3 | 10.8762 |
156
+ | 10.8141 | 0.0332 | 6 | 10.7893 |
157
+ | 10.8235 | 0.0499 | 9 | 10.4596 |
158
 
159
 
160
  ### Framework versions
adapter_config.json CHANGED
@@ -21,12 +21,12 @@
21
  "revision": null,
22
  "target_modules": [
23
  "gate_proj",
24
- "o_proj",
25
- "v_proj",
26
- "down_proj",
27
  "q_proj",
28
  "k_proj",
29
- "up_proj"
 
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
21
  "revision": null,
22
  "target_modules": [
23
  "gate_proj",
24
+ "up_proj",
 
 
25
  "q_proj",
26
  "k_proj",
27
+ "o_proj",
28
+ "v_proj",
29
+ "down_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2aa8d36ef7ab6f0957f5faf3d1211df0a949fdac7e7e3b25d461b60f7a130a4
3
  size 793738
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77b841362d11686478355cf0ceeee738206902e0d668fb9873c2fa58b3f06178
3
  size 793738
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1178168b28c25756aa4281636b07615bd568deb155c023af2357b810c89b6bd8
3
  size 767856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:063267c323f826559daebddfb148a7f94fe2794e06e76b00be9adba90041236a
3
  size 767856
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbdcc855d0f57473d8bd7ab766a229753c5c71be0fbef544d11bf2fb79cc11ff
3
  size 6712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9bb8d12ab7d3707b6887bbd0a3831cfac8994e15c07c849a86e5da758026626
3
  size 6712