Training in progress, epoch 12
Browse files
log.txt
CHANGED
@@ -143,3 +143,17 @@
|
|
143 |
{'loss': 0.1227, 'grad_norm': 5.548469543457031, 'learning_rate': 1.4123206160308016e-05, 'epoch': 10.76}
|
144 |
{'loss': 0.1164, 'grad_norm': 10.179027557373047, 'learning_rate': 1.3831524909578814e-05, 'epoch': 10.85}
|
145 |
{'loss': 0.1231, 'grad_norm': 1.8333979845046997, 'learning_rate': 1.353984365884961e-05, 'epoch': 10.94}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
143 |
{'loss': 0.1227, 'grad_norm': 5.548469543457031, 'learning_rate': 1.4123206160308016e-05, 'epoch': 10.76}
|
144 |
{'loss': 0.1164, 'grad_norm': 10.179027557373047, 'learning_rate': 1.3831524909578814e-05, 'epoch': 10.85}
|
145 |
{'loss': 0.1231, 'grad_norm': 1.8333979845046997, 'learning_rate': 1.353984365884961e-05, 'epoch': 10.94}
|
146 |
+
[1 2 2 ... 1 2 0] [0 0 2 ... 0 1 0]
|
147 |
+
{'eval_loss': 4.385825157165527, 'eval_accuracy': 0.41023189098732965, 'eval_runtime': 6.3967, 'eval_samples_per_second': 653.926, 'eval_steps_per_second': 20.479, 'epoch': 11.0}
|
148 |
+
{'loss': 0.1038, 'grad_norm': 17.937191009521484, 'learning_rate': 1.3248162408120407e-05, 'epoch': 11.03}
|
149 |
+
{'loss': 0.0987, 'grad_norm': 9.12984848022461, 'learning_rate': 1.2956481157391204e-05, 'epoch': 11.11}
|
150 |
+
{'loss': 0.1078, 'grad_norm': 6.416741847991943, 'learning_rate': 1.2664799906662e-05, 'epoch': 11.2}
|
151 |
+
{'loss': 0.0947, 'grad_norm': 27.995830535888672, 'learning_rate': 1.2373118655932796e-05, 'epoch': 11.29}
|
152 |
+
{'loss': 0.0984, 'grad_norm': 11.60288143157959, 'learning_rate': 1.2081437405203595e-05, 'epoch': 11.38}
|
153 |
+
{'loss': 0.104, 'grad_norm': 5.211322784423828, 'learning_rate': 1.1789756154474391e-05, 'epoch': 11.46}
|
154 |
+
{'loss': 0.1049, 'grad_norm': 19.860586166381836, 'learning_rate': 1.1498074903745188e-05, 'epoch': 11.55}
|
155 |
+
{'loss': 0.1045, 'grad_norm': 17.643003463745117, 'learning_rate': 1.1206393653015984e-05, 'epoch': 11.64}
|
156 |
+
{'loss': 0.1039, 'grad_norm': 23.73241424560547, 'learning_rate': 1.0914712402286782e-05, 'epoch': 11.73}
|
157 |
+
{'loss': 0.0976, 'grad_norm': 1.1808760166168213, 'learning_rate': 1.0623031151557579e-05, 'epoch': 11.81}
|
158 |
+
{'loss': 0.1075, 'grad_norm': 10.200865745544434, 'learning_rate': 1.0331349900828375e-05, 'epoch': 11.9}
|
159 |
+
{'loss': 0.1027, 'grad_norm': 7.143473148345947, 'learning_rate': 1.0039668650099172e-05, 'epoch': 11.99}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267829484
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd0193cb9599cdaa25476fa738b6ac2161dd0af4b659fb499a8e4030912898fd
|
3 |
size 267829484
|
runs/Mar14_16-58-52_cehsc-app-001.ad.unlv.edu/events.out.tfevents.1710460734.cehsc-app-001.ad.unlv.edu.4089564.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4ad6a9975ffc98147d173d0bd42479a262fb96dc2b2068fa1b4592d2ab71535
|
3 |
+
size 37830
|