DuongTrongChi
commited on
Training in progress, step 391, checkpoint
Browse files
last-checkpoint/adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 100198584
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9efa6add42e5fefba9d56a1afcc7355eca82c2424267276f7b90c9528c7123ba
|
3 |
size 100198584
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 50675604
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1fe1f005838acb336ca4fe0ab46eb7f60f522df631c4bef7cf7e92b1a0d3032f
|
3 |
size 50675604
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5a8867b92ac804cb31a1e033b1e487ddd7366d0bc3c5cae4e0f95d48f50a374
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 0.
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -2709,6 +2709,41 @@
|
|
2709 |
"learning_rate": 1.2946979038224414e-05,
|
2710 |
"loss": 1.1242,
|
2711 |
"step": 386
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2712 |
}
|
2713 |
],
|
2714 |
"logging_steps": 1,
|
@@ -2728,7 +2763,7 @@
|
|
2728 |
"attributes": {}
|
2729 |
}
|
2730 |
},
|
2731 |
-
"total_flos": 4.
|
2732 |
"train_batch_size": 4,
|
2733 |
"trial_name": null,
|
2734 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 0.4290809327846365,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 391,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
2709 |
"learning_rate": 1.2946979038224414e-05,
|
2710 |
"loss": 1.1242,
|
2711 |
"step": 386
|
2712 |
+
},
|
2713 |
+
{
|
2714 |
+
"epoch": 0.4246913580246914,
|
2715 |
+
"grad_norm": 0.16041865944862366,
|
2716 |
+
"learning_rate": 1.2922318125770655e-05,
|
2717 |
+
"loss": 1.1821,
|
2718 |
+
"step": 387
|
2719 |
+
},
|
2720 |
+
{
|
2721 |
+
"epoch": 0.4257887517146776,
|
2722 |
+
"grad_norm": 0.13168294727802277,
|
2723 |
+
"learning_rate": 1.2897657213316894e-05,
|
2724 |
+
"loss": 1.1585,
|
2725 |
+
"step": 388
|
2726 |
+
},
|
2727 |
+
{
|
2728 |
+
"epoch": 0.4268861454046639,
|
2729 |
+
"grad_norm": 0.11569740623235703,
|
2730 |
+
"learning_rate": 1.2872996300863132e-05,
|
2731 |
+
"loss": 1.1275,
|
2732 |
+
"step": 389
|
2733 |
+
},
|
2734 |
+
{
|
2735 |
+
"epoch": 0.4279835390946502,
|
2736 |
+
"grad_norm": 0.14467458426952362,
|
2737 |
+
"learning_rate": 1.2848335388409371e-05,
|
2738 |
+
"loss": 1.1436,
|
2739 |
+
"step": 390
|
2740 |
+
},
|
2741 |
+
{
|
2742 |
+
"epoch": 0.4290809327846365,
|
2743 |
+
"grad_norm": 0.11647368967533112,
|
2744 |
+
"learning_rate": 1.2823674475955612e-05,
|
2745 |
+
"loss": 1.1061,
|
2746 |
+
"step": 391
|
2747 |
}
|
2748 |
],
|
2749 |
"logging_steps": 1,
|
|
|
2763 |
"attributes": {}
|
2764 |
}
|
2765 |
},
|
2766 |
+
"total_flos": 4.0602758438180045e+17,
|
2767 |
"train_batch_size": 4,
|
2768 |
"trial_name": null,
|
2769 |
"trial_params": null
|