farmery commited on
Commit
d2b7c86
·
verified ·
1 Parent(s): 32cffb3

Training in progress, step 21, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db9d4c81f5c870d5091ce1248df2321c3627377437eb1fd3a02dd2b09cc6d84d
3
  size 645975704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dd856d4b5279e7d10774d470ff7bac9dfaf43ddd58c9a3d24478acedc82edd9
3
  size 645975704
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1f00519a1280a9ba1ae5ff258ebfbecfd3d048156dc03b5da31fc62e86da27a
3
  size 328468404
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dea331b78a0088850af38aae3caf2a969275f094f678e0bfc657194711ae15c
3
  size 328468404
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3bc6a98341976d14774c9db5fc9e42d35e0df44221b751477e2174edc7ac28df
3
  size 14960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ff79fe953d04826b99fecfe7e010fe07129025452d919884191f130eb42747c
3
  size 14960
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4575ea3777bfc5a1c4772e7aa158bf61093c0ee16bcbfb398eb4b1ad9f500f0e
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:045b85bc34af39145c81016bdd7a5ad641dcaf58ffb672ec2ccc21781da3fac6
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fafa18e0be672f8fc31e8d231a7a8babae560a95bb0e01aefaa36a7ac352fe61
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:915d76157a5cbef9e1abdf860e14d4497c54f8707e539c6d6a75cf5e840a42eb
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5307b323e04b0aa5281216bce5c3f1719f8a0b241a803e1b840f8fb7bac651ff
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ef3913b9b2ad955bc286b3dc480ecd0223a8025a0332846a26073b62d442cc9
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e879686ec70e90a34bf505630c03eb25089480b81e2ef9381471251f2ea6ef8
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e11730ab4a3a7ded716d3fd9997c2ef9af71a212e12a9490d14cbc3f60a6cced
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.5544554455445545,
5
  "eval_steps": 7,
6
- "global_step": 14,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -59,6 +59,35 @@
59
  "eval_samples_per_second": 66.133,
60
  "eval_steps_per_second": 4.668,
61
  "step": 14
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
62
  }
63
  ],
64
  "logging_steps": 3,
@@ -78,7 +107,7 @@
78
  "attributes": {}
79
  }
80
  },
81
- "total_flos": 3.981288225007206e+16,
82
  "train_batch_size": 4,
83
  "trial_name": null,
84
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.8316831683168316,
5
  "eval_steps": 7,
6
+ "global_step": 21,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
59
  "eval_samples_per_second": 66.133,
60
  "eval_steps_per_second": 4.668,
61
  "step": 14
62
+ },
63
+ {
64
+ "epoch": 0.594059405940594,
65
+ "grad_norm": 0.7464063763618469,
66
+ "learning_rate": 9.859057841617709e-05,
67
+ "loss": 1.8413,
68
+ "step": 15
69
+ },
70
+ {
71
+ "epoch": 0.7128712871287128,
72
+ "grad_norm": 0.7601683139801025,
73
+ "learning_rate": 9.641839665080363e-05,
74
+ "loss": 1.6764,
75
+ "step": 18
76
+ },
77
+ {
78
+ "epoch": 0.8316831683168316,
79
+ "grad_norm": 0.8399017453193665,
80
+ "learning_rate": 9.330127018922194e-05,
81
+ "loss": 1.6186,
82
+ "step": 21
83
+ },
84
+ {
85
+ "epoch": 0.8316831683168316,
86
+ "eval_loss": 1.5880630016326904,
87
+ "eval_runtime": 1.2879,
88
+ "eval_samples_per_second": 65.997,
89
+ "eval_steps_per_second": 4.659,
90
+ "step": 21
91
  }
92
  ],
93
  "logging_steps": 3,
 
107
  "attributes": {}
108
  }
109
  },
110
+ "total_flos": 5.97193233751081e+16,
111
  "train_batch_size": 4,
112
  "trial_name": null,
113
  "trial_params": null