ChepkiruiTonui committed on
Commit
298cfe3
·
verified ·
1 Parent(s): f544dc5

Training in progress, step 25, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -22,8 +22,8 @@
22
  "rank_pattern": {},
23
  "revision": null,
24
  "target_modules": [
25
- "q_proj",
26
- "v_proj"
27
  ],
28
  "task_type": null,
29
  "use_dora": false,
 
22
  "rank_pattern": {},
23
  "revision": null,
24
  "target_modules": [
25
+ "v_proj",
26
+ "q_proj"
27
  ],
28
  "task_type": null,
29
  "use_dora": false,
last-checkpoint/adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e099098b47f29ededc98d12765b6f56996be704fdb5ae0e1eb30b2097f5133a4
3
  size 14208970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:245f29a897e7c49c00428e860ce4e07d6228260072c910e4328405c8fa1e8df0
3
  size 14208970
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f7f7bcd2757b29baab587e244e22bd4b461ca74b53ef01aa8743b5a78b17382
3
  size 4832762
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4255fb1905805371ee91d8a954ed9083758d20edd10e4c67fdd6131106c7e34e
3
  size 4832762
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6166d3c12a44bbcfc5050edc1e21540e217631ef414f110d2073dbd4209454c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be79dc9899c1eff57e53e0613a56d8f2678a4be11294551db60a4f06e44637e3
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7d135c69dc5cba3a48b39a10c49b5799e503e4202b7575790c01f57aca74aae
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c80ec05408312bf923dbbdaa282a4b00796cef23355bfe82c237478067ddd661
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,76 +1,28 @@
1
  {
2
- "best_metric": 118.39080459770115,
3
- "best_model_checkpoint": "../openai/whisper-small-finetuned/checkpoint-75",
4
- "epoch": 49.02,
5
  "eval_steps": 25,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 12.01,
13
- "grad_norm": 11.94140911102295,
14
- "learning_rate": 7.600000000000001e-06,
15
- "loss": 3.9758,
16
  "step": 25
17
  },
18
  {
19
- "epoch": 12.01,
20
- "eval_loss": 5.314132213592529,
21
- "eval_runtime": 11.7411,
22
- "eval_samples_per_second": 0.852,
23
- "eval_steps_per_second": 0.085,
24
- "eval_wer": 128.73563218390805,
25
  "step": 25
26
- },
27
- {
28
- "epoch": 24.02,
29
- "grad_norm": 3.9279041290283203,
30
- "learning_rate": 5.1e-06,
31
- "loss": 3.4485,
32
- "step": 50
33
- },
34
- {
35
- "epoch": 24.02,
36
- "eval_loss": 4.9484028816223145,
37
- "eval_runtime": 12.969,
38
- "eval_samples_per_second": 0.771,
39
- "eval_steps_per_second": 0.077,
40
- "eval_wer": 134.48275862068965,
41
- "step": 50
42
- },
43
- {
44
- "epoch": 37.01,
45
- "grad_norm": 3.5452747344970703,
46
- "learning_rate": 2.6e-06,
47
- "loss": 3.1895,
48
- "step": 75
49
- },
50
- {
51
- "epoch": 37.01,
52
- "eval_loss": 4.7514119148254395,
53
- "eval_runtime": 11.8715,
54
- "eval_samples_per_second": 0.842,
55
- "eval_steps_per_second": 0.084,
56
- "eval_wer": 118.39080459770115,
57
- "step": 75
58
- },
59
- {
60
- "epoch": 49.02,
61
- "grad_norm": 2.8297388553619385,
62
- "learning_rate": 1.0000000000000001e-07,
63
- "loss": 3.0765,
64
- "step": 100
65
- },
66
- {
67
- "epoch": 49.02,
68
- "eval_loss": 4.6838202476501465,
69
- "eval_runtime": 12.0411,
70
- "eval_samples_per_second": 0.83,
71
- "eval_steps_per_second": 0.083,
72
- "eval_wer": 118.39080459770115,
73
- "step": 100
74
  }
75
  ],
76
  "logging_steps": 25,
@@ -78,7 +30,7 @@
78
  "num_input_tokens_seen": 0,
79
  "num_train_epochs": 9223372036854775807,
80
  "save_steps": 25,
81
- "total_flos": 1.4684073984e+18,
82
  "train_batch_size": 96,
83
  "trial_name": null,
84
  "trial_params": null
 
1
  {
2
+ "best_metric": 125.62500000000001,
3
+ "best_model_checkpoint": "../openai/whisper-small-finetuned/checkpoint-25",
4
+ "epoch": 8.01,
5
  "eval_steps": 25,
6
+ "global_step": 25,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 8.01,
13
+ "grad_norm": 12.496959686279297,
14
+ "learning_rate": 7.7e-06,
15
+ "loss": 4.7293,
16
  "step": 25
17
  },
18
  {
19
+ "epoch": 8.01,
20
+ "eval_loss": 5.816229820251465,
21
+ "eval_runtime": 28.1944,
22
+ "eval_samples_per_second": 0.709,
23
+ "eval_steps_per_second": 0.035,
24
+ "eval_wer": 125.62500000000001,
25
  "step": 25
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  }
27
  ],
28
  "logging_steps": 25,
 
30
  "num_input_tokens_seen": 0,
31
  "num_train_epochs": 9223372036854775807,
32
  "save_steps": 25,
33
+ "total_flos": 4.9808378953728e+17,
34
  "train_batch_size": 96,
35
  "trial_name": null,
36
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3035a8bb40e92657c16115ccaf32e1f1aa6c07f6a6ee3edb6ffb5b6f88ce7156
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cf734b6963f8f73a8ed78acf74b0e5afa35b59bed85b09f6588300413559cfc
3
  size 5176