Training in progress, step 3800
Browse files- adapter_model.safetensors +1 -1
- metrics.json +1 -0
- state.json +18 -3
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 35668592
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4126a86cedcc673291758a54cbca8d13b3b7d163ea1261dae62eb96e248768df
|
3 |
size 35668592
|
metrics.json
CHANGED
@@ -73,3 +73,4 @@
|
|
73 |
{"Step":3650,"eval_loss":1.74048388,"eval_runtime":29.3962,"eval_samples_per_second":3.402,"eval_steps_per_second":0.442,"epoch":2.8672427337}
|
74 |
{"Step":3700,"eval_loss":1.7404457331,"eval_runtime":29.4897,"eval_samples_per_second":3.391,"eval_steps_per_second":0.441,"epoch":2.9065200314}
|
75 |
{"Step":3750,"eval_loss":1.7380776405,"eval_runtime":29.4462,"eval_samples_per_second":3.396,"eval_steps_per_second":0.441,"epoch":2.9457973291}
|
|
|
|
73 |
{"Step":3650,"eval_loss":1.74048388,"eval_runtime":29.3962,"eval_samples_per_second":3.402,"eval_steps_per_second":0.442,"epoch":2.8672427337}
|
74 |
{"Step":3700,"eval_loss":1.7404457331,"eval_runtime":29.4897,"eval_samples_per_second":3.391,"eval_steps_per_second":0.441,"epoch":2.9065200314}
|
75 |
{"Step":3750,"eval_loss":1.7380776405,"eval_runtime":29.4462,"eval_samples_per_second":3.396,"eval_steps_per_second":0.441,"epoch":2.9457973291}
|
76 |
+
{"Step":3800,"eval_loss":1.7374665737,"eval_runtime":29.4954,"eval_samples_per_second":3.39,"eval_steps_per_second":0.441,"epoch":2.9850746269}
|
state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.
|
5 |
"eval_steps": 50,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -1117,6 +1117,21 @@
|
|
1117 |
"eval_samples_per_second": 3.391,
|
1118 |
"eval_steps_per_second": 0.441,
|
1119 |
"step": 3700
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1120 |
}
|
1121 |
],
|
1122 |
"logging_steps": 50,
|
@@ -1136,7 +1151,7 @@
|
|
1136 |
"attributes": {}
|
1137 |
}
|
1138 |
},
|
1139 |
-
"total_flos": 4.
|
1140 |
"train_batch_size": 8,
|
1141 |
"trial_name": null,
|
1142 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.9850746268656714,
|
5 |
"eval_steps": 50,
|
6 |
+
"global_step": 3800,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
1117 |
"eval_samples_per_second": 3.391,
|
1118 |
"eval_steps_per_second": 0.441,
|
1119 |
"step": 3700
|
1120 |
+
},
|
1121 |
+
{
|
1122 |
+
"epoch": 2.9457973291437547,
|
1123 |
+
"grad_norm": 0.2325269728899002,
|
1124 |
+
"learning_rate": 1.0037823683444865e-05,
|
1125 |
+
"loss": 1.7788,
|
1126 |
+
"step": 3750
|
1127 |
+
},
|
1128 |
+
{
|
1129 |
+
"epoch": 2.9457973291437547,
|
1130 |
+
"eval_loss": 1.7380776405334473,
|
1131 |
+
"eval_runtime": 29.4462,
|
1132 |
+
"eval_samples_per_second": 3.396,
|
1133 |
+
"eval_steps_per_second": 0.441,
|
1134 |
+
"step": 3750
|
1135 |
}
|
1136 |
],
|
1137 |
"logging_steps": 50,
|
|
|
1151 |
"attributes": {}
|
1152 |
}
|
1153 |
},
|
1154 |
+
"total_flos": 4.720338670196736e+16,
|
1155 |
"train_batch_size": 8,
|
1156 |
"trial_name": null,
|
1157 |
"trial_params": null
|