stulcrad
/

CNEC_1_1_ext_slavicbert

@@ -24,16 +24,16 @@ model-index:
     metrics:
     - name: Precision
       type: precision
-      value: 0.8562564632885212
     - name: Recall
       type: recall
-      value: 0.8850881881346874
     - name: F1
       type: f1
-      value: 0.8704336399474377
     - name: Accuracy
       type: accuracy
-      value: 0.9598901383634761
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -43,11 +43,11 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [DeepPavlov/bert-base-bg-cs-pl-ru-cased](https://huggingface.co/DeepPavlov/bert-base-bg-cs-pl-ru-cased) on the cnec dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.2811
-- Precision: 0.8563
-- Recall: 0.8851
-- F1: 0.8704
-- Accuracy: 0.9599
 ## Model description
@@ -78,20 +78,20 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1     | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
-| 0.3365        | 1.72  | 500  | 0.1751          | 0.8068    | 0.8546 | 0.8300 | 0.9522   |
-| 0.1326        | 3.44  | 1000 | 0.1573          | 0.8427    | 0.8675 | 0.8549 | 0.9589   |
-| 0.0901        | 5.15  | 1500 | 0.1800          | 0.8401    | 0.8707 | 0.8551 | 0.9582   |
-| 0.0631        | 6.87  | 2000 | 0.1975          | 0.8490    | 0.8803 | 0.8643 | 0.9589   |
-| 0.0453        | 8.59  | 2500 | 0.2075          | 0.8447    | 0.8808 | 0.8624 | 0.9608   |
-| 0.034         | 10.31 | 3000 | 0.2156          | 0.8497    | 0.8824 | 0.8658 | 0.9605   |
-| 0.0268        | 12.03 | 3500 | 0.2378          | 0.8499    | 0.8808 | 0.8651 | 0.9596   |
-| 0.0205        | 13.75 | 4000 | 0.2446          | 0.8557    | 0.8878 | 0.8715 | 0.9611   |
-| 0.0176        | 15.46 | 4500 | 0.2494          | 0.8571    | 0.8883 | 0.8724 | 0.9611   |
-| 0.0141        | 17.18 | 5000 | 0.2607          | 0.8586    | 0.8824 | 0.8703 | 0.9597   |
-| 0.0105        | 18.9  | 5500 | 0.2793          | 0.8542    | 0.8830 | 0.8683 | 0.9599   |
-| 0.0091        | 20.62 | 6000 | 0.2738          | 0.8487    | 0.8846 | 0.8663 | 0.9586   |
-| 0.0076        | 22.34 | 6500 | 0.2773          | 0.8556    | 0.8867 | 0.8709 | 0.9604   |
-| 0.0075        | 24.05 | 7000 | 0.2811          | 0.8563    | 0.8851 | 0.8704 | 0.9599   |
 ### Framework versions

     metrics:
     - name: Precision
       type: precision
+      value: 0.8606811145510835
     - name: Recall
       type: recall
+      value: 0.8915018706574025
     - name: F1
       type: f1
+      value: 0.8758204253084799
     - name: Accuracy
       type: accuracy
+      value: 0.9626885008032336
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 This model is a fine-tuned version of [DeepPavlov/bert-base-bg-cs-pl-ru-cased](https://huggingface.co/DeepPavlov/bert-base-bg-cs-pl-ru-cased) on the cnec dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.2572
+- Precision: 0.8607
+- Recall: 0.8915
+- F1: 0.8758
+- Accuracy: 0.9627
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1     | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
+| 0.3946        | 1.72  | 500  | 0.1925          | 0.7835    | 0.8471 | 0.8141 | 0.9467   |
+| 0.1653        | 3.44  | 1000 | 0.1627          | 0.8340    | 0.8675 | 0.8504 | 0.9572   |
+| 0.1183        | 5.15  | 1500 | 0.1700          | 0.8378    | 0.8808 | 0.8588 | 0.9595   |
+| 0.0869        | 6.87  | 2000 | 0.1901          | 0.8554    | 0.8728 | 0.8640 | 0.9589   |
+| 0.0661        | 8.59  | 2500 | 0.2037          | 0.8482    | 0.8867 | 0.8670 | 0.9595   |
+| 0.053         | 10.31 | 3000 | 0.2011          | 0.8460    | 0.8867 | 0.8659 | 0.9609   |
+| 0.043         | 12.03 | 3500 | 0.2216          | 0.8555    | 0.8888 | 0.8718 | 0.9593   |
+| 0.0358        | 13.75 | 4000 | 0.2245          | 0.8492    | 0.8878 | 0.8680 | 0.9603   |
+| 0.0296        | 15.46 | 4500 | 0.2401          | 0.8513    | 0.8872 | 0.8689 | 0.9603   |
+| 0.0264        | 17.18 | 5000 | 0.2415          | 0.8564    | 0.8862 | 0.8710 | 0.9610   |
+| 0.0212        | 18.9  | 5500 | 0.2570          | 0.8557    | 0.8872 | 0.8712 | 0.9622   |
+| 0.0205        | 20.62 | 6000 | 0.2540          | 0.8567    | 0.8883 | 0.8722 | 0.9616   |
+| 0.0167        | 22.34 | 6500 | 0.2573          | 0.8568    | 0.8894 | 0.8728 | 0.9614   |
+| 0.0161        | 24.05 | 7000 | 0.2572          | 0.8607    | 0.8915 | 0.8758 | 0.9627   |
 ### Framework versions

config.json CHANGED Viewed

@@ -3,11 +3,11 @@
   "architectures": [
     "BertForTokenClassification"
   ],
-  "attention_probs_dropout_prob": 0.2,
   "classifier_dropout": null,
   "directionality": "bidi",
   "hidden_act": "gelu",
-  "hidden_dropout_prob": 0.2,
   "hidden_size": 768,
   "id2label": {
     "0": "O",

   "architectures": [
     "BertForTokenClassification"
   ],
+  "attention_probs_dropout_prob": 0.25,
   "classifier_dropout": null,
   "directionality": "bidi",
   "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.25,
   "hidden_size": 768,
   "id2label": {
     "0": "O",

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5f47ad202035e914421575684fb0e0d300e4e243c5995019a49a425ed2a6be53
 size 709120892

 version https://git-lfs.github.com/spec/v1
+oid sha256:a0e7ed7b2f0a383fb42f326aec99b4e9d86ad31f79108387e2d08226cac7b2c5
 size 709120892

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc69bb8a341bf9f8e86fccf8322066958128491e182e96f7e21b34713eb24b31
 size 4664

 version https://git-lfs.github.com/spec/v1
+oid sha256:3302de9de94fb5ee05ad0c98a1ea6b3a542d27d68cb9f15b444a5baf10c8e3e4
 size 4664