DuongTrongChi commited on
Commit
8a4fc49
·
verified ·
1 Parent(s): 728f981

Training in progress, step 391, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d467248f80e50b7299be4a044d3c34650a4bb3d921ee97e1d2cbac5af5b7fc6
3
  size 100198584
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9efa6add42e5fefba9d56a1afcc7355eca82c2424267276f7b90c9528c7123ba
3
  size 100198584
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea91a98de0b3ad51bc037e37c58325d581d5d9a687104d1c0db3b0ba2b46168e
3
  size 50675604
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fe1f005838acb336ca4fe0ab46eb7f60f522df631c4bef7cf7e92b1a0d3032f
3
  size 50675604
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43819302638e139ec073cc0bd87e7c492c70c5966a60959bb8d025a1d3e72519
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5a8867b92ac804cb31a1e033b1e487ddd7366d0bc3c5cae4e0f95d48f50a374
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.4235939643347051,
5
  "eval_steps": 500,
6
- "global_step": 386,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -2709,6 +2709,41 @@
2709
  "learning_rate": 1.2946979038224414e-05,
2710
  "loss": 1.1242,
2711
  "step": 386
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2712
  }
2713
  ],
2714
  "logging_steps": 1,
@@ -2728,7 +2763,7 @@
2728
  "attributes": {}
2729
  }
2730
  },
2731
- "total_flos": 4.0076346624661094e+17,
2732
  "train_batch_size": 4,
2733
  "trial_name": null,
2734
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.4290809327846365,
5
  "eval_steps": 500,
6
+ "global_step": 391,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
2709
  "learning_rate": 1.2946979038224414e-05,
2710
  "loss": 1.1242,
2711
  "step": 386
2712
+ },
2713
+ {
2714
+ "epoch": 0.4246913580246914,
2715
+ "grad_norm": 0.16041865944862366,
2716
+ "learning_rate": 1.2922318125770655e-05,
2717
+ "loss": 1.1821,
2718
+ "step": 387
2719
+ },
2720
+ {
2721
+ "epoch": 0.4257887517146776,
2722
+ "grad_norm": 0.13168294727802277,
2723
+ "learning_rate": 1.2897657213316894e-05,
2724
+ "loss": 1.1585,
2725
+ "step": 388
2726
+ },
2727
+ {
2728
+ "epoch": 0.4268861454046639,
2729
+ "grad_norm": 0.11569740623235703,
2730
+ "learning_rate": 1.2872996300863132e-05,
2731
+ "loss": 1.1275,
2732
+ "step": 389
2733
+ },
2734
+ {
2735
+ "epoch": 0.4279835390946502,
2736
+ "grad_norm": 0.14467458426952362,
2737
+ "learning_rate": 1.2848335388409371e-05,
2738
+ "loss": 1.1436,
2739
+ "step": 390
2740
+ },
2741
+ {
2742
+ "epoch": 0.4290809327846365,
2743
+ "grad_norm": 0.11647368967533112,
2744
+ "learning_rate": 1.2823674475955612e-05,
2745
+ "loss": 1.1061,
2746
+ "step": 391
2747
  }
2748
  ],
2749
  "logging_steps": 1,
 
2763
  "attributes": {}
2764
  }
2765
  },
2766
+ "total_flos": 4.0602758438180045e+17,
2767
  "train_batch_size": 4,
2768
  "trial_name": null,
2769
  "trial_params": null