Update README.md
Browse files
README.md
CHANGED
@@ -65,11 +65,13 @@ inference:
|
|
65 |
parameters:
|
66 |
max_length: 96
|
67 |
num_beams: 4
|
|
|
68 |
datasets:
|
69 |
- pszemraj/fleece2instructions-inputs-alpaca-cleaned
|
70 |
language:
|
71 |
- en
|
72 |
pipeline_tag: text2text-generation
|
|
|
73 |
---
|
74 |
|
75 |
|
@@ -129,5 +131,4 @@ The following hyperparameters were used during training:
|
|
129 |
| Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Gen Len |
|
130 |
|:-------------:|:-----:|:----:|:---------------:|:-------:|:-------:|:-------:|:---------:|:-------:|
|
131 |
| 1.1147 | 1.0 | 680 | 0.9901 | 61.8451 | 38.8293 | 58.3372 | 59.8658 | 25.2401 |
|
132 |
-
| 0.9565 | 2.0 | 1360 | 0.9579 | 62.3604 | 39.5109 | 58.8843 | 60.4494 | 24.9917 |
|
133 |
-
|
|
|
65 |
parameters:
|
66 |
max_length: 96
|
67 |
num_beams: 4
|
68 |
+
early_stopping: true
|
69 |
datasets:
|
70 |
- pszemraj/fleece2instructions-inputs-alpaca-cleaned
|
71 |
language:
|
72 |
- en
|
73 |
pipeline_tag: text2text-generation
|
74 |
+
library_name: transformers
|
75 |
---
|
76 |
|
77 |
|
|
|
131 |
| Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Gen Len |
|
132 |
|:-------------:|:-----:|:----:|:---------------:|:-------:|:-------:|:-------:|:---------:|:-------:|
|
133 |
| 1.1147 | 1.0 | 680 | 0.9901 | 61.8451 | 38.8293 | 58.3372 | 59.8658 | 25.2401 |
|
134 |
+
| 0.9565 | 2.0 | 1360 | 0.9579 | 62.3604 | 39.5109 | 58.8843 | 60.4494 | 24.9917 |
|
|