polejowska committed on
Commit
e2ae579
1 Parent(s): e33c50d

End of training

Browse files
runs/Feb28_15-54-30_7c779bfb7013/events.out.tfevents.1677599675.7c779bfb7013.343.2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0a5fd7531b48f08d8e583a95477cbf4bd0b6aeeceb04582d97ac594bbb5cf31
3
- size 6243
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7020ef59b9f12b4d0db2ab12de3bf9ea99237937cb8f3ba2f219e4ca3f9bde9c
3
+ size 6597
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.0,
5
- "global_step": 282,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -50,18 +50,74 @@
50
  "step": 282
51
  },
52
  {
53
- "epoch": 3.0,
54
- "step": 282,
55
- "total_flos": 1.07525797056e+18,
56
- "train_loss": 3.0334743202155363,
57
- "train_runtime": 718.9206,
58
- "train_samples_per_second": 3.13,
59
- "train_steps_per_second": 0.392
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
60
  }
61
  ],
62
- "max_steps": 282,
63
- "num_train_epochs": 3,
64
- "total_flos": 1.07525797056e+18,
65
  "trial_name": null,
66
  "trial_params": null
67
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 7.0,
5
+ "global_step": 658,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
50
  "step": 282
51
  },
52
  {
53
+ "epoch": 4.0,
54
+ "learning_rate": 4.2857142857142856e-05,
55
+ "loss": 2.7515,
56
+ "step": 376
57
+ },
58
+ {
59
+ "epoch": 4.0,
60
+ "eval_loss": 1.964645504951477,
61
+ "eval_runtime": 35.4193,
62
+ "eval_samples_per_second": 5.647,
63
+ "eval_steps_per_second": 0.706,
64
+ "step": 376
65
+ },
66
+ {
67
+ "epoch": 5.0,
68
+ "learning_rate": 2.857142857142857e-05,
69
+ "loss": 2.724,
70
+ "step": 470
71
+ },
72
+ {
73
+ "epoch": 5.0,
74
+ "eval_loss": 2.1284220218658447,
75
+ "eval_runtime": 34.8555,
76
+ "eval_samples_per_second": 5.738,
77
+ "eval_steps_per_second": 0.717,
78
+ "step": 470
79
+ },
80
+ {
81
+ "epoch": 6.0,
82
+ "learning_rate": 1.4285714285714285e-05,
83
+ "loss": 2.6193,
84
+ "step": 564
85
+ },
86
+ {
87
+ "epoch": 6.0,
88
+ "eval_loss": 1.9379758834838867,
89
+ "eval_runtime": 36.3088,
90
+ "eval_samples_per_second": 5.508,
91
+ "eval_steps_per_second": 0.689,
92
+ "step": 564
93
+ },
94
+ {
95
+ "epoch": 7.0,
96
+ "learning_rate": 0.0,
97
+ "loss": 2.5032,
98
+ "step": 658
99
+ },
100
+ {
101
+ "epoch": 7.0,
102
+ "eval_loss": 1.9285995960235596,
103
+ "eval_runtime": 35.9858,
104
+ "eval_samples_per_second": 5.558,
105
+ "eval_steps_per_second": 0.695,
106
+ "step": 658
107
+ },
108
+ {
109
+ "epoch": 7.0,
110
+ "step": 658,
111
+ "total_flos": 2.50893526464e+18,
112
+ "train_loss": 1.5139910805189138,
113
+ "train_runtime": 964.856,
114
+ "train_samples_per_second": 5.441,
115
+ "train_steps_per_second": 0.682
116
  }
117
  ],
118
+ "max_steps": 658,
119
+ "num_train_epochs": 7,
120
+ "total_flos": 2.50893526464e+18,
121
  "trial_name": null,
122
  "trial_params": null
123
  }