stuser2023 committed on
Commit
804b71d
·
verified ·
1 Parent(s): c3f3955

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a9992887f6907f8916987f3e3d5b5cd5f9a668b44cebeae398a79e142aced221
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26cd8608c74765cf0d7e63a3bd73516440951ea66a7798b1db8fabaf293cd73d
3
  size 267832560
run-2/checkpoint-2138/config.json CHANGED
@@ -20,6 +20,6 @@
20
  "sinusoidal_pos_embds": false,
21
  "tie_weights_": true,
22
  "torch_dtype": "float32",
23
- "transformers_version": "4.35.2",
24
  "vocab_size": 30522
25
  }
 
20
  "sinusoidal_pos_embds": false,
21
  "tie_weights_": true,
22
  "torch_dtype": "float32",
23
+ "transformers_version": "4.38.2",
24
  "vocab_size": 30522
25
  }
run-2/checkpoint-2138/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b23a968971b19293287438eef60ae5c1918ec542ff71380aae31cd91c873538f
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26cd8608c74765cf0d7e63a3bd73516440951ea66a7798b1db8fabaf293cd73d
3
  size 267832560
run-2/checkpoint-2138/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4de823e79a240af7a023f39e071d2ee53375f471e37d82ffc8ad524d0210c963
3
  size 535727290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27036bd6d5c147ed5ca1ab4795ea0dd675b03aeeab4bc7c35494d8353c84cd75
3
  size 535727290
run-2/checkpoint-2138/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11edc7ed6e233cf8ded4a33dfcfe8204ae40733acbe38c974b94308bacdc2d6d
3
- size 14308
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69e0a553a49d736b29e905a2d4bf1244efc8e9ef91880c8ee0b1a1f54b22212d
3
+ size 14244
run-2/checkpoint-2138/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4faa4bda620d03b6edc8353e8edb3a8710818368d5ef4d63d2cae7608666363
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ed3f34b5f9517f54c77536f0ba18982652f4f4de915e227c452430419d32086
3
  size 1064
run-2/checkpoint-2138/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.48409375114357234,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-2138",
4
- "epoch": 2.0,
5
  "eval_steps": 500,
6
  "global_step": 2138,
7
  "is_hyper_param_search": true,
@@ -9,58 +9,55 @@
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.47,
13
- "learning_rate": 5.944660653119031e-06,
14
- "loss": 0.5558,
 
15
  "step": 500
16
  },
17
  {
18
- "epoch": 0.94,
19
- "learning_rate": 5.157496901381872e-06,
20
- "loss": 0.5053,
 
21
  "step": 1000
22
  },
23
  {
24
- "epoch": 1.0,
25
- "eval_loss": 0.4907635748386383,
26
- "eval_matthews_correlation": 0.42854888313294803,
27
- "eval_runtime": 0.8054,
28
- "eval_samples_per_second": 1295.012,
29
- "eval_steps_per_second": 81.947,
30
- "step": 1069
31
- },
32
- {
33
- "epoch": 1.4,
34
- "learning_rate": 4.370333149644712e-06,
35
- "loss": 0.4286,
36
  "step": 1500
37
  },
38
  {
39
- "epoch": 1.87,
40
- "learning_rate": 3.5831693979075514e-06,
41
- "loss": 0.3992,
 
42
  "step": 2000
43
  },
44
  {
45
- "epoch": 2.0,
46
- "eval_loss": 0.5015696883201599,
47
- "eval_matthews_correlation": 0.48409375114357234,
48
- "eval_runtime": 0.8234,
49
- "eval_samples_per_second": 1266.73,
50
- "eval_steps_per_second": 80.157,
51
  "step": 2138
52
  }
53
  ],
54
  "logging_steps": 500,
55
- "max_steps": 4276,
56
- "num_train_epochs": 4,
 
57
  "save_steps": 500,
58
- "total_flos": 75782994673692.0,
 
59
  "trial_name": null,
60
  "trial_params": {
61
- "learning_rate": 6.7318244048561916e-06,
62
- "num_train_epochs": 4,
63
- "per_device_train_batch_size": 8,
64
- "seed": 14
65
  }
66
  }
 
1
  {
2
+ "best_metric": 0.3853198145814999,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-2/checkpoint-2138",
4
+ "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 2138,
7
  "is_hyper_param_search": true,
 
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.23,
13
+ "grad_norm": 4.28505277633667,
14
+ "learning_rate": 3.0702893894484785e-06,
15
+ "loss": 0.6069,
16
  "step": 500
17
  },
18
  {
19
+ "epoch": 0.47,
20
+ "grad_norm": 9.482794761657715,
21
+ "learning_rate": 2.9196373094951675e-06,
22
+ "loss": 0.5628,
23
  "step": 1000
24
  },
25
  {
26
+ "epoch": 0.7,
27
+ "grad_norm": 22.521339416503906,
28
+ "learning_rate": 2.7689852295418565e-06,
29
+ "loss": 0.5565,
 
 
 
 
 
 
 
 
30
  "step": 1500
31
  },
32
  {
33
+ "epoch": 0.94,
34
+ "grad_norm": 26.7753849029541,
35
+ "learning_rate": 2.6183331495885454e-06,
36
+ "loss": 0.5184,
37
  "step": 2000
38
  },
39
  {
40
+ "epoch": 1.0,
41
+ "eval_loss": 0.5730993747711182,
42
+ "eval_matthews_correlation": 0.3853198145814999,
43
+ "eval_runtime": 0.7612,
44
+ "eval_samples_per_second": 1370.225,
45
+ "eval_steps_per_second": 86.706,
46
  "step": 2138
47
  }
48
  ],
49
  "logging_steps": 500,
50
+ "max_steps": 10690,
51
+ "num_input_tokens_seen": 0,
52
+ "num_train_epochs": 5,
53
  "save_steps": 500,
54
+ "total_flos": 32530060484016.0,
55
+ "train_batch_size": 4,
56
  "trial_name": null,
57
  "trial_params": {
58
+ "learning_rate": 3.2209414694017896e-06,
59
+ "num_train_epochs": 5,
60
+ "per_device_train_batch_size": 4,
61
+ "seed": 16
62
  }
63
  }
run-2/checkpoint-2138/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:618b6f744377ad587ba25f1af0a1c4f702e5743116ab1fe52e9ecc52d00dc59b
3
- size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88d2c3d6804ca2d9d22cb74f328c5ae8ec320f8d12a0ef15ea5ae2037f02bd85
3
+ size 4984
runs/Mar16_01-46-29_6e5f088ca464/events.out.tfevents.1710554238.6e5f088ca464.226.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2728a30252b8c7698d4b1cbbee9e9398c0d44f7fa3ab038a041c0d6da1827ad
3
+ size 5979
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29d6b485a188c4e5c57b6f3bb948e3315674066d3a6ec8f44d6d328263cd659b
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88d2c3d6804ca2d9d22cb74f328c5ae8ec320f8d12a0ef15ea5ae2037f02bd85
3
  size 4984