avsolatorio commited on
Commit
d244a3e
·
verified ·
1 Parent(s): 6ba2c47

Training in progress, step 2000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40e2abc797e770c0783bb4f4e58709545091c5c4243e7b0f1cc8900c4c179a7f
3
  size 567860028
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49908c6b3a97869b28d3107cd8ede521c11f0540d75bf57e64890e1b42a681d8
3
  size 567860028
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:abee8f95f340dfe01d344aaff64323a816c943331f6304c89b5c4f77e0a2c8fe
3
  size 1135783354
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f37bfd767a7944f522f8b0967bd0b7c7dfe12f1a9adfde5992bc86f6d2dfc4fe
3
  size 1135783354
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78c451f916508297d3207f2dab1c39b19208c892726d699392b564615e2b984b
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c677e9a5a7f527c7d59e3734e6ea532e988e424c79842c29a15f61acb3d85678
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ee802392f623a24841bae03e3b1a90568251d05c67f2dfba666ec36a6359794
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc53ec4ee360520441164c72c89b9d8c72fa6dd1be6626eb79abc2dc4e85148b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.21147018671035767,
3
- "best_model_checkpoint": "doc-topic-model_eval-01_train-00/checkpoint-1000",
4
- "epoch": 7.874015748031496,
5
  "eval_steps": 1000,
6
- "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -33,6 +33,32 @@
33
  "eval_samples_per_second": 684.36,
34
  "eval_steps_per_second": 2.7,
35
  "step": 1000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
36
  }
37
  ],
38
  "logging_steps": 500,
@@ -52,7 +78,7 @@
52
  "attributes": {}
53
  }
54
  },
55
- "total_flos": 449829603283536.0,
56
  "train_batch_size": 64,
57
  "trial_name": null,
58
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.10989262908697128,
3
+ "best_model_checkpoint": "doc-topic-model_eval-01_train-00/checkpoint-2000",
4
+ "epoch": 15.748031496062993,
5
  "eval_steps": 1000,
6
+ "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
33
  "eval_samples_per_second": 684.36,
34
  "eval_steps_per_second": 2.7,
35
  "step": 1000
36
+ },
37
+ {
38
+ "epoch": 11.811023622047244,
39
+ "grad_norm": 0.3979816138744354,
40
+ "learning_rate": 1.157726377952756e-06,
41
+ "loss": 0.1864,
42
+ "step": 1500
43
+ },
44
+ {
45
+ "epoch": 15.748031496062993,
46
+ "grad_norm": 0.2547377347946167,
47
+ "learning_rate": 1.126968503937008e-06,
48
+ "loss": 0.1321,
49
+ "step": 2000
50
+ },
51
+ {
52
+ "epoch": 15.748031496062993,
53
+ "eval_accuracy": 0.981383845685049,
54
+ "eval_f1": 0.0,
55
+ "eval_loss": 0.10989262908697128,
56
+ "eval_precision": 0.0,
57
+ "eval_recall": 0.0,
58
+ "eval_runtime": 11.8538,
59
+ "eval_samples_per_second": 684.169,
60
+ "eval_steps_per_second": 2.7,
61
+ "step": 2000
62
  }
63
  ],
64
  "logging_steps": 500,
 
78
  "attributes": {}
79
  }
80
  },
81
+ "total_flos": 898582275611208.0,
82
  "train_batch_size": 64,
83
  "trial_name": null,
84
  "trial_params": null