jssky committed on
Commit
aa8d15e
1 Parent(s): b1c7fdb

End of training

Browse files
README.md CHANGED
@@ -113,7 +113,7 @@ xformers_attention: null
113
 
114
  This model is a fine-tuned version of [unsloth/gemma-1.1-2b-it](https://huggingface.co/unsloth/gemma-1.1-2b-it) on the None dataset.
115
  It achieves the following results on the evaluation set:
116
- - Loss: 6.3890
117
 
118
  ## Model description
119
 
@@ -149,9 +149,9 @@ The following hyperparameters were used during training:
149
  | Training Loss | Epoch | Step | Validation Loss |
150
  |:-------------:|:------:|:----:|:---------------:|
151
  | 15.4792 | 0.0007 | 1 | 12.3048 |
152
- | 11.3833 | 0.0022 | 3 | 12.0512 |
153
- | 7.3908 | 0.0044 | 6 | 9.4415 |
154
- | 6.6914 | 0.0066 | 9 | 6.3890 |
155
 
156
 
157
  ### Framework versions
 
113
 
114
  This model is a fine-tuned version of [unsloth/gemma-1.1-2b-it](https://huggingface.co/unsloth/gemma-1.1-2b-it) on the None dataset.
115
  It achieves the following results on the evaluation set:
116
+ - Loss: 6.4829
117
 
118
  ## Model description
119
 
 
149
  | Training Loss | Epoch | Step | Validation Loss |
150
  |:-------------:|:------:|:----:|:---------------:|
151
  | 15.4792 | 0.0007 | 1 | 12.3048 |
152
+ | 11.3833 | 0.0022 | 3 | 12.0766 |
153
+ | 7.5335 | 0.0044 | 6 | 9.5947 |
154
+ | 6.7949 | 0.0066 | 9 | 6.4829 |
155
 
156
 
157
  ### Framework versions
adapter_config.json CHANGED
@@ -20,12 +20,12 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "up_proj",
24
- "q_proj",
25
- "v_proj",
26
  "k_proj",
27
- "gate_proj",
28
  "down_proj",
 
 
 
 
29
  "o_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
 
 
23
  "k_proj",
 
24
  "down_proj",
25
+ "v_proj",
26
+ "up_proj",
27
+ "gate_proj",
28
+ "q_proj",
29
  "o_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9051410511f5979d2db9aaa71ea6696cb1036804d0c3cd055fe5c247b2cd4625
3
  size 78537274
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1edb1e504a7e30d638ee6c79285139309fa3794a760675d18582a75e39388a0c
3
  size 78537274
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb1c264f6196955ec5d50aceba9f69ebb491f5f59d3179389aba510cf2502268
3
  size 78480072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8301b0a7c2edb3ef49e63e955b94c5f7aa54ca23938bacd9ad6f48921e865cf
3
  size 78480072
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:722f3b82bb852127c4404471dd8bb057b70f4e0cb5a02b713538b276ca5a19c9
3
  size 6712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72b5ec9cd53bed712805221792024653bec1693ae9132893c54190849f7ca423
3
  size 6712