Training in progress, step 200
Browse files
README.md
CHANGED
@@ -48,9 +48,6 @@ The following hyperparameters were used during training:
|
|
48 |
- eval_batch_size: 8
|
49 |
- seed: 42
|
50 |
- distributed_type: multi-GPU
|
51 |
-
- num_devices: 2
|
52 |
-
- total_train_batch_size: 16
|
53 |
-
- total_eval_batch_size: 16
|
54 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
55 |
- lr_scheduler_type: linear
|
56 |
- training_steps: 2500
|
@@ -60,10 +57,10 @@ The following hyperparameters were used during training:
|
|
60 |
|
61 |
| Training Loss | Epoch | Step | Validation Loss | Answer | Header | Question | Overall Precision | Overall Recall | Overall F1 | Overall Accuracy |
|
62 |
|:-------------:|:------:|:----:|:---------------:|:---------------------------------------------------------:|:---------------------------------------------------------:|:---------------------------------------------------------:|:-----------------:|:--------------:|:----------:|:----------------:|
|
63 |
-
| 0.
|
64 |
| 0.0001 | 400.0 | 400 | 0.0000 | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 3} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 1} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 2} | 1.0 | 1.0 | 1.0 | 1.0 |
|
65 |
| 0.0001 | 600.0 | 600 | 0.0000 | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 3} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 1} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 2} | 1.0 | 1.0 | 1.0 | 1.0 |
|
66 |
-
| 0.
|
67 |
| 0.0 | 1000.0 | 1000 | 0.0000 | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 3} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 1} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 2} | 1.0 | 1.0 | 1.0 | 1.0 |
|
68 |
| 0.0 | 1200.0 | 1200 | 0.0000 | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 3} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 1} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 2} | 1.0 | 1.0 | 1.0 | 1.0 |
|
69 |
| 0.0 | 1400.0 | 1400 | 0.0000 | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 3} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 1} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 2} | 1.0 | 1.0 | 1.0 | 1.0 |
|
|
|
48 |
- eval_batch_size: 8
|
49 |
- seed: 42
|
50 |
- distributed_type: multi-GPU
|
|
|
|
|
|
|
51 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
52 |
- lr_scheduler_type: linear
|
53 |
- training_steps: 2500
|
|
|
57 |
|
58 |
| Training Loss | Epoch | Step | Validation Loss | Answer | Header | Question | Overall Precision | Overall Recall | Overall F1 | Overall Accuracy |
|
59 |
|:-------------:|:------:|:----:|:---------------:|:---------------------------------------------------------:|:---------------------------------------------------------:|:---------------------------------------------------------:|:-----------------:|:--------------:|:----------:|:----------------:|
|
60 |
+
| 0.07 | 200.0 | 200 | 0.0001 | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 3} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 1} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 2} | 1.0 | 1.0 | 1.0 | 1.0 |
|
61 |
| 0.0001 | 400.0 | 400 | 0.0000 | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 3} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 1} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 2} | 1.0 | 1.0 | 1.0 | 1.0 |
|
62 |
| 0.0001 | 600.0 | 600 | 0.0000 | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 3} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 1} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 2} | 1.0 | 1.0 | 1.0 | 1.0 |
|
63 |
+
| 0.0001 | 800.0 | 800 | 0.0000 | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 3} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 1} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 2} | 1.0 | 1.0 | 1.0 | 1.0 |
|
64 |
| 0.0 | 1000.0 | 1000 | 0.0000 | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 3} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 1} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 2} | 1.0 | 1.0 | 1.0 | 1.0 |
|
65 |
| 0.0 | 1200.0 | 1200 | 0.0000 | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 3} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 1} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 2} | 1.0 | 1.0 | 1.0 | 1.0 |
|
66 |
| 0.0 | 1400.0 | 1400 | 0.0000 | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 3} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 1} | {'precision': 1.0, 'recall': 1.0, 'f1': 1.0, 'number': 2} | 1.0 | 1.0 | 1.0 | 1.0 |
|
logs/events.out.tfevents.1719315843.Allianz-Editique.1648.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c898b7c5d0f65d95a263897616e68bc1ce5655c141d123bddc3a979bf86ce14f
|
3 |
+
size 14134
|
logs/events.out.tfevents.1719316217.Allianz-Editique.1756.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:820582fb7e86aa486096aa6c4a3b13fe78f772f5d0ffc5a415a56e470a424e76
|
3 |
+
size 5200
|
logs/events.out.tfevents.1719316973.Allianz-Editique.2806.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:084e011ed0df4e788894fed1150b430d01d64dbb044b266eae366bea2aa60513
|
3 |
+
size 5915
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 520727564
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d21ad6e388c713d39294b657f9fd53674d35cad03d405ee18b8fe954b96d8d6
|
3 |
size 520727564
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:446cdb81cf3a41fbc6e18bb92555ca8fb3363f8c2f49496534563d650608d915
|
3 |
size 5176
|