stuser2023
committed on
Training in progress, epoch 1
Browse files
- model.safetensors +1 -1
- run-2/checkpoint-2138/config.json +1 -1
- run-2/checkpoint-2138/model.safetensors +1 -1
- run-2/checkpoint-2138/optimizer.pt +1 -1
- run-2/checkpoint-2138/rng_state.pth +2 -2
- run-2/checkpoint-2138/scheduler.pt +1 -1
- run-2/checkpoint-2138/trainer_state.json +33 -36
- run-2/checkpoint-2138/training_args.bin +2 -2
- runs/Mar16_01-46-29_6e5f088ca464/events.out.tfevents.1710554238.6e5f088ca464.226.4 +3 -0
- training_args.bin +1 -1
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267832560
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26cd8608c74765cf0d7e63a3bd73516440951ea66a7798b1db8fabaf293cd73d
|
3 |
size 267832560
|
run-2/checkpoint-2138/config.json
CHANGED
@@ -20,6 +20,6 @@
|
|
20 |
"sinusoidal_pos_embds": false,
|
21 |
"tie_weights_": true,
|
22 |
"torch_dtype": "float32",
|
23 |
-
"transformers_version": "4.
|
24 |
"vocab_size": 30522
|
25 |
}
|
|
|
20 |
"sinusoidal_pos_embds": false,
|
21 |
"tie_weights_": true,
|
22 |
"torch_dtype": "float32",
|
23 |
+
"transformers_version": "4.38.2",
|
24 |
"vocab_size": 30522
|
25 |
}
|
run-2/checkpoint-2138/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267832560
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26cd8608c74765cf0d7e63a3bd73516440951ea66a7798b1db8fabaf293cd73d
|
3 |
size 267832560
|
run-2/checkpoint-2138/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 535727290
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27036bd6d5c147ed5ca1ab4795ea0dd675b03aeeab4bc7c35494d8353c84cd75
|
3 |
size 535727290
|
run-2/checkpoint-2138/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69e0a553a49d736b29e905a2d4bf1244efc8e9ef91880c8ee0b1a1f54b22212d
|
3 |
+
size 14244
|
run-2/checkpoint-2138/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ed3f34b5f9517f54c77536f0ba18982652f4f4de915e227c452430419d32086
|
3 |
size 1064
|
run-2/checkpoint-2138/trainer_state.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
"best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-2138",
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 2138,
|
7 |
"is_hyper_param_search": true,
|
@@ -9,58 +9,55 @@
|
|
9 |
"is_world_process_zero": true,
|
10 |
"log_history": [
|
11 |
{
|
12 |
-
"epoch": 0.
|
13 |
-
"
|
14 |
-
"
|
|
|
15 |
"step": 500
|
16 |
},
|
17 |
{
|
18 |
-
"epoch": 0.
|
19 |
-
"
|
20 |
-
"
|
|
|
21 |
"step": 1000
|
22 |
},
|
23 |
{
|
24 |
-
"epoch":
|
25 |
-
"
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"eval_samples_per_second": 1295.012,
|
29 |
-
"eval_steps_per_second": 81.947,
|
30 |
-
"step": 1069
|
31 |
-
},
|
32 |
-
{
|
33 |
-
"epoch": 1.4,
|
34 |
-
"learning_rate": 4.370333149644712e-06,
|
35 |
-
"loss": 0.4286,
|
36 |
"step": 1500
|
37 |
},
|
38 |
{
|
39 |
-
"epoch":
|
40 |
-
"
|
41 |
-
"
|
|
|
42 |
"step": 2000
|
43 |
},
|
44 |
{
|
45 |
-
"epoch":
|
46 |
-
"eval_loss": 0.
|
47 |
-
"eval_matthews_correlation": 0.
|
48 |
-
"eval_runtime": 0.
|
49 |
-
"eval_samples_per_second":
|
50 |
-
"eval_steps_per_second":
|
51 |
"step": 2138
|
52 |
}
|
53 |
],
|
54 |
"logging_steps": 500,
|
55 |
-
"max_steps":
|
56 |
-
"
|
|
|
57 |
"save_steps": 500,
|
58 |
-
"total_flos":
|
|
|
59 |
"trial_name": null,
|
60 |
"trial_params": {
|
61 |
-
"learning_rate":
|
62 |
-
"num_train_epochs":
|
63 |
-
"per_device_train_batch_size":
|
64 |
-
"seed":
|
65 |
}
|
66 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.3853198145814999,
|
3 |
"best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-2138",
|
4 |
+
"epoch": 1.0,
|
5 |
"eval_steps": 500,
|
6 |
"global_step": 2138,
|
7 |
"is_hyper_param_search": true,
|
|
|
9 |
"is_world_process_zero": true,
|
10 |
"log_history": [
|
11 |
{
|
12 |
+
"epoch": 0.23,
|
13 |
+
"grad_norm": 4.28505277633667,
|
14 |
+
"learning_rate": 3.0702893894484785e-06,
|
15 |
+
"loss": 0.6069,
|
16 |
"step": 500
|
17 |
},
|
18 |
{
|
19 |
+
"epoch": 0.47,
|
20 |
+
"grad_norm": 9.482794761657715,
|
21 |
+
"learning_rate": 2.9196373094951675e-06,
|
22 |
+
"loss": 0.5628,
|
23 |
"step": 1000
|
24 |
},
|
25 |
{
|
26 |
+
"epoch": 0.7,
|
27 |
+
"grad_norm": 22.521339416503906,
|
28 |
+
"learning_rate": 2.7689852295418565e-06,
|
29 |
+
"loss": 0.5565,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
30 |
"step": 1500
|
31 |
},
|
32 |
{
|
33 |
+
"epoch": 0.94,
|
34 |
+
"grad_norm": 26.7753849029541,
|
35 |
+
"learning_rate": 2.6183331495885454e-06,
|
36 |
+
"loss": 0.5184,
|
37 |
"step": 2000
|
38 |
},
|
39 |
{
|
40 |
+
"epoch": 1.0,
|
41 |
+
"eval_loss": 0.5730993747711182,
|
42 |
+
"eval_matthews_correlation": 0.3853198145814999,
|
43 |
+
"eval_runtime": 0.7612,
|
44 |
+
"eval_samples_per_second": 1370.225,
|
45 |
+
"eval_steps_per_second": 86.706,
|
46 |
"step": 2138
|
47 |
}
|
48 |
],
|
49 |
"logging_steps": 500,
|
50 |
+
"max_steps": 10690,
|
51 |
+
"num_input_tokens_seen": 0,
|
52 |
+
"num_train_epochs": 5,
|
53 |
"save_steps": 500,
|
54 |
+
"total_flos": 32530060484016.0,
|
55 |
+
"train_batch_size": 4,
|
56 |
"trial_name": null,
|
57 |
"trial_params": {
|
58 |
+
"learning_rate": 3.2209414694017896e-06,
|
59 |
+
"num_train_epochs": 5,
|
60 |
+
"per_device_train_batch_size": 4,
|
61 |
+
"seed": 16
|
62 |
}
|
63 |
}
|
run-2/checkpoint-2138/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88d2c3d6804ca2d9d22cb74f328c5ae8ec320f8d12a0ef15ea5ae2037f02bd85
|
3 |
+
size 4984
|
runs/Mar16_01-46-29_6e5f088ca464/events.out.tfevents.1710554238.6e5f088ca464.226.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2728a30252b8c7698d4b1cbbee9e9398c0d44f7fa3ab038a041c0d6da1827ad
|
3 |
+
size 5979
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4984
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88d2c3d6804ca2d9d22cb74f328c5ae8ec320f8d12a0ef15ea5ae2037f02bd85
|
3 |
size 4984
|