Training in progress, epoch 9
Browse files
log.txt
CHANGED
@@ -103,3 +103,16 @@
|
|
103 |
{'loss': 0.2293, 'grad_norm': 17.969135284423828, 'learning_rate': 2.4040368685100922e-05, 'epoch': 7.79}
|
104 |
{'loss': 0.2305, 'grad_norm': 13.376370429992676, 'learning_rate': 2.374868743437172e-05, 'epoch': 7.88}
|
105 |
{'loss': 0.2403, 'grad_norm': 8.350042343139648, 'learning_rate': 2.3457006183642515e-05, 'epoch': 7.96}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
103 |
{'loss': 0.2293, 'grad_norm': 17.969135284423828, 'learning_rate': 2.4040368685100922e-05, 'epoch': 7.79}
|
104 |
{'loss': 0.2305, 'grad_norm': 13.376370429992676, 'learning_rate': 2.374868743437172e-05, 'epoch': 7.88}
|
105 |
{'loss': 0.2403, 'grad_norm': 8.350042343139648, 'learning_rate': 2.3457006183642515e-05, 'epoch': 7.96}
|
106 |
+
[0 2 2 ... 1 0 1] [0 0 2 ... 0 1 0]
|
107 |
+
{'eval_loss': 2.7002346515655518, 'eval_accuracy': 0.40855845087257947, 'eval_runtime': 6.9152, 'eval_samples_per_second': 604.896, 'eval_steps_per_second': 18.944, 'epoch': 8.0}
|
108 |
+
{'loss': 0.194, 'grad_norm': 5.118299961090088, 'learning_rate': 2.3165324932913312e-05, 'epoch': 8.05}
|
109 |
+
{'loss': 0.1641, 'grad_norm': 6.422851085662842, 'learning_rate': 2.2873643682184108e-05, 'epoch': 8.14}
|
110 |
+
{'loss': 0.1696, 'grad_norm': 0.9757495522499084, 'learning_rate': 2.2581962431454905e-05, 'epoch': 8.23}
|
111 |
+
{'loss': 0.1714, 'grad_norm': 8.895563125610352, 'learning_rate': 2.22902811807257e-05, 'epoch': 8.31}
|
112 |
+
{'loss': 0.1747, 'grad_norm': 11.234411239624023, 'learning_rate': 2.19985999299965e-05, 'epoch': 8.4}
|
113 |
+
{'loss': 0.1802, 'grad_norm': 17.129392623901367, 'learning_rate': 2.1706918679267298e-05, 'epoch': 8.49}
|
114 |
+
{'loss': 0.1773, 'grad_norm': 15.17518424987793, 'learning_rate': 2.1415237428538097e-05, 'epoch': 8.58}
|
115 |
+
{'loss': 0.1795, 'grad_norm': 20.55030632019043, 'learning_rate': 2.1123556177808894e-05, 'epoch': 8.66}
|
116 |
+
{'loss': 0.185, 'grad_norm': 16.464384078979492, 'learning_rate': 2.083187492707969e-05, 'epoch': 8.75}
|
117 |
+
{'loss': 0.1794, 'grad_norm': 20.86390495300293, 'learning_rate': 2.0540193676350487e-05, 'epoch': 8.84}
|
118 |
+
{'loss': 0.1843, 'grad_norm': 14.848393440246582, 'learning_rate': 2.0248512425621283e-05, 'epoch': 8.93}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267829484
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3dcee5d29c3c6cec18051dcfaf82426afc937dc4cdad0f9b2adfdc7fb21cf305
|
3 |
size 267829484
|
runs/Mar14_16-58-52_cehsc-app-001.ad.unlv.edu/events.out.tfevents.1710460734.cehsc-app-001.ad.unlv.edu.4089564.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:740aaa121039875d7f10e7b71a065104da5764aa826854864c3548628c554048
|
3 |
+
size 29318
|