christineyu committed on
Commit
4c7a4cf
·
verified ·
1 Parent(s): ee34266

End of training

Browse files
Files changed (3) hide show
  1. README.md +5 -3
  2. all_results.json +5 -0
  3. eval_results.json +4 -4
README.md CHANGED
@@ -1,17 +1,19 @@
1
  ---
2
  base_model: mistralai/Mistral-7B-Instruct-v0.2
 
3
  library_name: transformers
4
- model_name: prometheus-7b-v1.5-beta-1-0109-sum-pref-overfit-v3-flash
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
  - sft
9
  licence: license
10
  ---
11
 
12
- # Model Card for prometheus-7b-v1.5-beta-1-0109-sum-pref-overfit-v3-flash
13
 
14
- This model is a fine-tuned version of [mistralai/Mistral-7B-Instruct-v0.2](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
 
1
  ---
2
  base_model: mistralai/Mistral-7B-Instruct-v0.2
3
+ datasets: sum-pref-overfit
4
  library_name: transformers
5
+ model_name: sum-pref-overfit-v1-modelcard
6
  tags:
7
  - generated_from_trainer
8
+ - alignment-handbook
9
  - trl
10
  - sft
11
  licence: license
12
  ---
13
 
14
+ # Model Card for sum-pref-overfit-v1-modelcard
15
 
16
+ This model is a fine-tuned version of [mistralai/Mistral-7B-Instruct-v0.2](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2) on the [sum-pref-overfit](https://huggingface.co/datasets/sum-pref-overfit) dataset.
17
  It has been trained using [TRL](https://github.com/huggingface/trl).
18
 
19
  ## Quick start
all_results.json CHANGED
@@ -1,5 +1,10 @@
1
  {
2
  "epoch": 1.0,
 
 
 
 
 
3
  "total_flos": 2.542777053216768e+16,
4
  "train_loss": 0.06061042585337521,
5
  "train_runtime": 596.3446,
 
1
  {
2
  "epoch": 1.0,
3
+ "eval_loss": 0.010453196242451668,
4
+ "eval_runtime": 1.279,
5
+ "eval_samples": 10,
6
+ "eval_samples_per_second": 0.782,
7
+ "eval_steps_per_second": 0.782,
8
  "total_flos": 2.542777053216768e+16,
9
  "train_loss": 0.06061042585337521,
10
  "train_runtime": 596.3446,
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 1.0,
3
- "eval_loss": 0.01081210095435381,
4
- "eval_runtime": 1.2807,
5
  "eval_samples": 10,
6
- "eval_samples_per_second": 0.781,
7
- "eval_steps_per_second": 0.781
8
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "eval_loss": 0.010453196242451668,
4
+ "eval_runtime": 1.279,
5
  "eval_samples": 10,
6
+ "eval_samples_per_second": 0.782,
7
+ "eval_steps_per_second": 0.782
8
  }