fionazhang/mistral-experiment-3
Browse files- learning_curve.png +0 -0
- training_args.bin +1 -1
- training_logs.json +1 -1
learning_curve.png
CHANGED
![]() |
![]() |
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4728
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5fd135d1555136230c4d62def3a8f67add80b273cd0b5ce5a95f6173b0f5304
|
3 |
size 4728
|
training_logs.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
[{"loss": 13.1588, "learning_rate": 0.0002, "epoch": 0.22, "step": 25}, {"loss": 9.279, "learning_rate": 0.0002, "epoch": 0.43, "step": 50}, {"loss": 8.3847, "learning_rate": 0.0002, "epoch": 0.65, "step": 75}, {"loss": 8.0383, "learning_rate": 0.0002, "epoch": 0.86, "step": 100}, {"train_runtime":
|
|
|
1 |
+
[{"loss": 13.1588, "learning_rate": 0.0002, "epoch": 0.22, "step": 25}, {"loss": 9.279, "learning_rate": 0.0002, "epoch": 0.43, "step": 50}, {"loss": 8.3847, "learning_rate": 0.0002, "epoch": 0.65, "step": 75}, {"loss": 8.0383, "learning_rate": 0.0002, "epoch": 0.86, "step": 100}, {"train_runtime": 305.8967, "train_samples_per_second": 1.507, "train_steps_per_second": 0.379, "total_flos": 2373225471000576.0, "train_loss": 9.44900262766871, "epoch": 1.0, "step": 116}]
|