EtashGuha commited on
Commit
c8279fc
·
verified ·
1 Parent(s): 4d6f45a

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a172e85b90a703233410bfb33c6facb3a7a548775695d20e470ab954f5dc5bd
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:135eff8528ad6c5d038fc9630137d1054b68be9e9de16a63cf181b814e5a11a3
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dc2d0c77dd1479b0a5b40aa407649ce8b7dfa1627e235937efbc8b516d4b5a79
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d69ed7a15b0168305cdd64ce9ddbf455a11e67df8d2f9854148d0901c8b2fcb
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3bf7f9daf575d0316513d6e6e5878cb836c80f007f9941b2c17a52c52f86fac
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53c39fb1a308761ff2f24aaeea65b8b4ec41c248e5b8ba9dd7eb129cc45887c2
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:09316e8749cc6b82c55cf1ada3c0a6e136896c20df51cb2d073523a87e857ac0
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:656cdfc8446799100fd9224bd5409685ad25140ce1d59195c4e175b2dd524a40
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -2,3 +2,8 @@
2
  {"current_steps": 20, "total_steps": 105, "loss": 1.087, "lr": 5e-06, "epoch": 0.5663716814159292, "percentage": 19.05, "elapsed_time": "0:53:44", "remaining_time": "3:48:24"}
3
  {"current_steps": 30, "total_steps": 105, "loss": 1.0474, "lr": 5e-06, "epoch": 0.8495575221238938, "percentage": 28.57, "elapsed_time": "1:20:33", "remaining_time": "3:21:23"}
4
  {"current_steps": 35, "total_steps": 105, "eval_loss": 1.021984577178955, "epoch": 0.9911504424778761, "percentage": 33.33, "elapsed_time": "1:36:48", "remaining_time": "3:13:36"}
 
 
 
 
 
 
2
  {"current_steps": 20, "total_steps": 105, "loss": 1.087, "lr": 5e-06, "epoch": 0.5663716814159292, "percentage": 19.05, "elapsed_time": "0:53:44", "remaining_time": "3:48:24"}
3
  {"current_steps": 30, "total_steps": 105, "loss": 1.0474, "lr": 5e-06, "epoch": 0.8495575221238938, "percentage": 28.57, "elapsed_time": "1:20:33", "remaining_time": "3:21:23"}
4
  {"current_steps": 35, "total_steps": 105, "eval_loss": 1.021984577178955, "epoch": 0.9911504424778761, "percentage": 33.33, "elapsed_time": "1:36:48", "remaining_time": "3:13:36"}
5
+ {"current_steps": 40, "total_steps": 105, "loss": 1.0097, "lr": 5e-06, "epoch": 1.1327433628318584, "percentage": 38.1, "elapsed_time": "1:50:31", "remaining_time": "2:59:36"}
6
+ {"current_steps": 50, "total_steps": 105, "loss": 0.9766, "lr": 5e-06, "epoch": 1.415929203539823, "percentage": 47.62, "elapsed_time": "2:16:27", "remaining_time": "2:30:06"}
7
+ {"current_steps": 60, "total_steps": 105, "loss": 0.9627, "lr": 5e-06, "epoch": 1.6991150442477876, "percentage": 57.14, "elapsed_time": "2:42:23", "remaining_time": "2:01:47"}
8
+ {"current_steps": 70, "total_steps": 105, "loss": 0.9547, "lr": 5e-06, "epoch": 1.9823008849557522, "percentage": 66.67, "elapsed_time": "3:08:20", "remaining_time": "1:34:10"}
9
+ {"current_steps": 70, "total_steps": 105, "eval_loss": 0.9805734157562256, "epoch": 1.9823008849557522, "percentage": 66.67, "elapsed_time": "3:11:46", "remaining_time": "1:35:53"}