stulcrad
/

CNEC_1_1_ext_Czert-B-base-cased

@@ -24,16 +24,16 @@ model-index:
     metrics:
     - name: Precision
       type: precision
-      value: 0.8373035985808414
     - name: Recall
       type: recall
-      value: 0.882950293960449
     - name: F1
       type: f1
-      value: 0.8595213319458898
     - name: Accuracy
       type: accuracy
-      value: 0.9564921160210239
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -43,11 +43,11 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [UWB-AIR/Czert-B-base-cased](https://huggingface.co/UWB-AIR/Czert-B-base-cased) on the cnec dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.2425
-- Precision: 0.8373
-- Recall: 0.8830
-- F1: 0.8595
-- Accuracy: 0.9565
 ## Model description
@@ -67,8 +67,8 @@ More information needed
 The following hyperparameters were used during training:
 - learning_rate: 2e-05
-- train_batch_size: 64
-- eval_batch_size: 64
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
@@ -78,9 +78,13 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1     | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
-| 0.2228        | 6.85  | 500  | 0.1804          | 0.8316    | 0.8685 | 0.8497 | 0.9540   |
-| 0.0528        | 13.7  | 1000 | 0.2139          | 0.8366    | 0.8813 | 0.8584 | 0.9567   |
-| 0.0283        | 20.55 | 1500 | 0.2425          | 0.8373    | 0.8830 | 0.8595 | 0.9565   |
 ### Framework versions

     metrics:
     - name: Precision
       type: precision
+      value: 0.8383838383838383
     - name: Recall
       type: recall
+      value: 0.8872260823089257
     - name: F1
       type: f1
+      value: 0.8621137366917683
     - name: Accuracy
       type: accuracy
+      value: 0.9569787813899163
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [UWB-AIR/Czert-B-base-cased](https://huggingface.co/UWB-AIR/Czert-B-base-cased) on the cnec dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.2513
+- Precision: 0.8384
+- Recall: 0.8872
+- F1: 0.8621
+- Accuracy: 0.9570
 ## Model description
 The following hyperparameters were used during training:
 - learning_rate: 2e-05
+- train_batch_size: 32
+- eval_batch_size: 32
 - seed: 42
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1     | Accuracy |
 |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|:--------:|
+| 0.3012        | 3.42  | 500  | 0.1677          | 0.8115    | 0.8626 | 0.8363 | 0.9518   |
+| 0.1081        | 6.85  | 1000 | 0.1869          | 0.8218    | 0.8749 | 0.8475 | 0.9548   |
+| 0.0654        | 10.27 | 1500 | 0.2132          | 0.8311    | 0.8813 | 0.8555 | 0.9559   |
+| 0.0449        | 13.7  | 2000 | 0.2284          | 0.8296    | 0.8797 | 0.8540 | 0.9559   |
+| 0.0341        | 17.12 | 2500 | 0.2353          | 0.8348    | 0.8856 | 0.8594 | 0.9575   |
+| 0.0267        | 20.55 | 3000 | 0.2413          | 0.8397    | 0.8872 | 0.8628 | 0.9581   |
+| 0.0227        | 23.97 | 3500 | 0.2513          | 0.8384    | 0.8872 | 0.8621 | 0.9570   |
 ### Framework versions

config.json CHANGED Viewed

@@ -3,11 +3,11 @@
   "architectures": [
     "BertForTokenClassification"
   ],
-  "attention_probs_dropout_prob": 0.2,
   "classifier_dropout": null,
   "gradient_checkpointing": false,
   "hidden_act": "gelu",
-  "hidden_dropout_prob": 0.2,
   "hidden_size": 768,
   "id2label": {
     "0": "O",

   "architectures": [
     "BertForTokenClassification"
   ],
+  "attention_probs_dropout_prob": 0.25,
   "classifier_dropout": null,
   "gradient_checkpointing": false,
   "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.25,
   "hidden_size": 768,
   "id2label": {
     "0": "O",

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fb4e69a5cb9975765f849fb1ee5e60866b0eed1c001427da75b2d9d06ca7646c
 size 435636076

 version https://git-lfs.github.com/spec/v1
+oid sha256:865f2e9ef40a41f5eca3869e95c3069720ec0ac686f26468e2e7162ae6c6be30
 size 435636076

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a723514b6dabb4a26429b166ab4402f751a876b7d8b0de64e1e0209f59a6f689
 size 4728

 version https://git-lfs.github.com/spec/v1
+oid sha256:baac67bd063bdd12190f8f78097c4da13b3a661f5f2630e0c0e73b7455ceed94
 size 4728