ahmedheakl commited on
Commit
f5b9e8a
·
verified ·
1 Parent(s): 3ca3c09

Training in progress, step 118428

Browse files
Files changed (2) hide show
  1. model.safetensors +1 -1
  2. trainer_log.jsonl +34 -0
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a3030f20e2501c44a36c3c2eddd7336f9b47a7216a1ca0b531e2960fe31a7642
3
  size 1260367448
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:830f394ffc9b8c1291ba686783f5c242a28412679d78c0776c4b9849a3f82081
3
  size 1260367448
trainer_log.jsonl CHANGED
@@ -11808,3 +11808,37 @@
11808
  {"current_steps": 118070, "total_steps": 118428, "loss": 0.0054, "lr": 2.7836177588891347e-10, "epoch": 1.993954132468673, "percentage": 99.7, "elapsed_time": "19:33:00", "remaining_time": "0:03:33"}
11809
  {"current_steps": 118080, "total_steps": 118428, "loss": 0.0063, "lr": 2.630281649901312e-10, "epoch": 1.9941230114499948, "percentage": 99.71, "elapsed_time": "19:33:05", "remaining_time": "0:03:27"}
11810
  {"current_steps": 118090, "total_steps": 118428, "loss": 0.006, "lr": 2.481289189887326e-10, "epoch": 1.994291890431317, "percentage": 99.71, "elapsed_time": "19:33:09", "remaining_time": "0:03:21"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11808
  {"current_steps": 118070, "total_steps": 118428, "loss": 0.0054, "lr": 2.7836177588891347e-10, "epoch": 1.993954132468673, "percentage": 99.7, "elapsed_time": "19:33:00", "remaining_time": "0:03:33"}
11809
  {"current_steps": 118080, "total_steps": 118428, "loss": 0.0063, "lr": 2.630281649901312e-10, "epoch": 1.9941230114499948, "percentage": 99.71, "elapsed_time": "19:33:05", "remaining_time": "0:03:27"}
11810
  {"current_steps": 118090, "total_steps": 118428, "loss": 0.006, "lr": 2.481289189887326e-10, "epoch": 1.994291890431317, "percentage": 99.71, "elapsed_time": "19:33:09", "remaining_time": "0:03:21"}
11811
+ {"current_steps": 118100, "total_steps": 118428, "loss": 0.0049, "lr": 2.336640391781275e-10, "epoch": 1.994460769412639, "percentage": 99.72, "elapsed_time": "19:33:14", "remaining_time": "0:03:15"}
11812
+ {"current_steps": 118110, "total_steps": 118428, "loss": 0.0095, "lr": 2.1963352681619865e-10, "epoch": 1.994629648393961, "percentage": 99.73, "elapsed_time": "19:33:19", "remaining_time": "0:03:09"}
11813
+ {"current_steps": 118120, "total_steps": 118428, "loss": 0.0073, "lr": 2.0603738312086064e-10, "epoch": 1.9947985273752828, "percentage": 99.74, "elapsed_time": "19:33:24", "remaining_time": "0:03:03"}
11814
+ {"current_steps": 118130, "total_steps": 118428, "loss": 0.0092, "lr": 1.9287560927339077e-10, "epoch": 1.9949674063566047, "percentage": 99.75, "elapsed_time": "19:33:31", "remaining_time": "0:02:57"}
11815
+ {"current_steps": 118140, "total_steps": 118428, "loss": 0.0063, "lr": 1.801482064178739e-10, "epoch": 1.9951362853379269, "percentage": 99.76, "elapsed_time": "19:33:36", "remaining_time": "0:02:51"}
11816
+ {"current_steps": 118150, "total_steps": 118428, "loss": 0.0107, "lr": 1.678551756589819e-10, "epoch": 1.995305164319249, "percentage": 99.77, "elapsed_time": "19:33:43", "remaining_time": "0:02:45"}
11817
+ {"current_steps": 118160, "total_steps": 118428, "loss": 0.007, "lr": 1.5599651806585957e-10, "epoch": 1.9954740433005709, "percentage": 99.77, "elapsed_time": "19:33:48", "remaining_time": "0:02:39"}
11818
+ {"current_steps": 118170, "total_steps": 118428, "loss": 0.0072, "lr": 1.4457223466823877e-10, "epoch": 1.9956429222818928, "percentage": 99.78, "elapsed_time": "19:33:54", "remaining_time": "0:02:33"}
11819
+ {"current_steps": 118180, "total_steps": 118428, "loss": 0.0076, "lr": 1.3358232645865888e-10, "epoch": 1.9958118012632147, "percentage": 99.79, "elapsed_time": "19:33:59", "remaining_time": "0:02:27"}
11820
+ {"current_steps": 118190, "total_steps": 118428, "loss": 0.0063, "lr": 1.2302679439191167e-10, "epoch": 1.9959806802445368, "percentage": 99.8, "elapsed_time": "19:34:04", "remaining_time": "0:02:21"}
11821
+ {"current_steps": 118200, "total_steps": 118428, "loss": 0.0076, "lr": 1.1290563938504139e-10, "epoch": 1.996149559225859, "percentage": 99.81, "elapsed_time": "19:34:10", "remaining_time": "0:02:15"}
11822
+ {"current_steps": 118210, "total_steps": 118428, "loss": 0.0075, "lr": 1.0321886231734468e-10, "epoch": 1.9963184382071808, "percentage": 99.82, "elapsed_time": "19:34:17", "remaining_time": "0:02:09"}
11823
+ {"current_steps": 118220, "total_steps": 118428, "loss": 0.0067, "lr": 9.396646403037057e-11, "epoch": 1.9964873171885027, "percentage": 99.82, "elapsed_time": "19:34:23", "remaining_time": "0:02:03"}
11824
+ {"current_steps": 118230, "total_steps": 118428, "loss": 0.0045, "lr": 8.514844532792055e-11, "epoch": 1.9966561961698246, "percentage": 99.83, "elapsed_time": "19:34:28", "remaining_time": "0:01:58"}
11825
+ {"current_steps": 118240, "total_steps": 118428, "loss": 0.0069, "lr": 7.676480697604849e-11, "epoch": 1.9968250751511467, "percentage": 99.84, "elapsed_time": "19:34:33", "remaining_time": "0:01:52"}
11826
+ {"current_steps": 118250, "total_steps": 118428, "loss": 0.01, "lr": 6.88155497030607e-11, "epoch": 1.9969939541324688, "percentage": 99.85, "elapsed_time": "19:34:39", "remaining_time": "0:01:46"}
11827
+ {"current_steps": 118260, "total_steps": 118428, "loss": 0.0095, "lr": 6.130067420007101e-11, "epoch": 1.9971628331137907, "percentage": 99.86, "elapsed_time": "19:34:46", "remaining_time": "0:01:40"}
11828
+ {"current_steps": 118270, "total_steps": 118428, "loss": 0.0073, "lr": 5.422018111933547e-11, "epoch": 1.9973317120951126, "percentage": 99.87, "elapsed_time": "19:34:52", "remaining_time": "0:01:34"}
11829
+ {"current_steps": 118280, "total_steps": 118428, "loss": 0.008, "lr": 4.7574071075917604e-11, "epoch": 1.9975005910764345, "percentage": 99.88, "elapsed_time": "19:34:57", "remaining_time": "0:01:28"}
11830
+ {"current_steps": 118290, "total_steps": 118428, "loss": 0.0058, "lr": 4.136234464768851e-11, "epoch": 1.9976694700577566, "percentage": 99.88, "elapsed_time": "19:35:01", "remaining_time": "0:01:22"}
11831
+ {"current_steps": 118300, "total_steps": 118428, "loss": 0.0059, "lr": 3.558500237421658e-11, "epoch": 1.9978383490390788, "percentage": 99.89, "elapsed_time": "19:35:06", "remaining_time": "0:01:16"}
11832
+ {"current_steps": 118310, "total_steps": 118428, "loss": 0.0064, "lr": 3.024204475732262e-11, "epoch": 1.9980072280204006, "percentage": 99.9, "elapsed_time": "19:35:11", "remaining_time": "0:01:10"}
11833
+ {"current_steps": 118320, "total_steps": 118428, "loss": 0.0074, "lr": 2.533347226107985e-11, "epoch": 1.9981761070017225, "percentage": 99.91, "elapsed_time": "19:35:16", "remaining_time": "0:01:04"}
11834
+ {"current_steps": 118330, "total_steps": 118428, "loss": 0.0068, "lr": 2.0859285312369026e-11, "epoch": 1.9983449859830444, "percentage": 99.92, "elapsed_time": "19:35:20", "remaining_time": "0:00:58"}
11835
+ {"current_steps": 118340, "total_steps": 118428, "loss": 0.0049, "lr": 1.6819484299213095e-11, "epoch": 1.9985138649643666, "percentage": 99.93, "elapsed_time": "19:35:26", "remaining_time": "0:00:52"}
11836
+ {"current_steps": 118350, "total_steps": 118428, "loss": 0.0059, "lr": 1.3214069573552757e-11, "epoch": 1.9986827439456887, "percentage": 99.93, "elapsed_time": "19:35:32", "remaining_time": "0:00:46"}
11837
+ {"current_steps": 118360, "total_steps": 118428, "loss": 0.0042, "lr": 1.004304144736068e-11, "epoch": 1.9988516229270106, "percentage": 99.94, "elapsed_time": "19:35:37", "remaining_time": "0:00:40"}
11838
+ {"current_steps": 118370, "total_steps": 118428, "loss": 0.0071, "lr": 7.306400197082398e-12, "epoch": 1.9990205019083325, "percentage": 99.95, "elapsed_time": "19:35:42", "remaining_time": "0:00:34"}
11839
+ {"current_steps": 118380, "total_steps": 118428, "loss": 0.005, "lr": 5.004146059750525e-12, "epoch": 1.9991893808896544, "percentage": 99.96, "elapsed_time": "19:35:46", "remaining_time": "0:00:28"}
11840
+ {"current_steps": 118390, "total_steps": 118428, "loss": 0.0064, "lr": 3.1362792363154313e-12, "epoch": 1.9993582598709765, "percentage": 99.97, "elapsed_time": "19:35:52", "remaining_time": "0:00:22"}
11841
+ {"current_steps": 118400, "total_steps": 118428, "loss": 0.0081, "lr": 1.7027998883145658e-12, "epoch": 1.9995271388522986, "percentage": 99.98, "elapsed_time": "19:35:58", "remaining_time": "0:00:16"}
11842
+ {"current_steps": 118410, "total_steps": 118428, "loss": 0.0063, "lr": 7.037081406480184e-13, "epoch": 1.9996960178336205, "percentage": 99.98, "elapsed_time": "19:36:04", "remaining_time": "0:00:10"}
11843
+ {"current_steps": 118420, "total_steps": 118428, "loss": 0.0072, "lr": 1.3900407991318533e-13, "epoch": 1.9998648968149424, "percentage": 99.99, "elapsed_time": "19:36:10", "remaining_time": "0:00:04"}
11844
+ {"current_steps": 118428, "total_steps": 118428, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "19:36:36", "remaining_time": "0:00:00"}