thejosango
/

nuha-binary

@@ -24,13 +24,13 @@ model-index:
     metrics:
     - name: F1
       type: f1
-      value: 0.6868284228769497
     - name: Precision
       type: precision
-      value: 0.6468092051574996
     - name: Recall
       type: recall
-      value: 0.7321263624607427
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -40,10 +40,10 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [thejosango/nuha-mlm](https://huggingface.co/thejosango/nuha-mlm) on the nuha-dataset dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.5763
-- F1: 0.6868
-- Precision: 0.6468
-- Recall: 0.7321
 - Support: None
 ## Model description
@@ -76,15 +76,15 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss | F1     | Precision | Recall | Support |
 |:-------------:|:-----:|:----:|:---------------:|:------:|:---------:|:------:|:-------:|
-| 0.572         | 0.25  | 500  | 0.5492          | 0.6774 | 0.5836    | 0.8069 | None    |
-| 0.5571        | 0.5   | 1000 | 0.5384          | 0.6937 | 0.6053    | 0.8123 | None    |
-| 0.541         | 0.75  | 1500 | 0.5344          | 0.6967 | 0.6324    | 0.7755 | None    |
-| 0.5359        | 1.0   | 2000 | 0.5300          | 0.7032 | 0.6300    | 0.7957 | None    |
-| 0.4984        | 1.26  | 2500 | 0.5406          | 0.7023 | 0.6597    | 0.7508 | None    |
-| 0.4878        | 1.51  | 3000 | 0.5415          | 0.7012 | 0.6425    | 0.7718 | None    |
-| 0.4847        | 1.76  | 3500 | 0.5435          | 0.6980 | 0.6422    | 0.7645 | None    |
-| 0.4779        | 2.01  | 4000 | 0.5526          | 0.7034 | 0.6377    | 0.7842 | None    |
-| 0.4265        | 2.26  | 4500 | 0.5763          | 0.6868 | 0.6468    | 0.7321 | None    |
 ### Framework versions

     metrics:
     - name: F1
       type: f1
+      value: 0.6878727634194831
     - name: Precision
       type: precision
+      value: 0.646361273554256
     - name: Recall
       type: recall
+      value: 0.7350822094956586
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 This model is a fine-tuned version of [thejosango/nuha-mlm](https://huggingface.co/thejosango/nuha-mlm) on the nuha-dataset dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.5743
+- F1: 0.6879
+- Precision: 0.6464
+- Recall: 0.7351
 - Support: None
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss | F1     | Precision | Recall | Support |
 |:-------------:|:-----:|:----:|:---------------:|:------:|:---------:|:------:|:-------:|
+| 0.5741        | 0.25  | 500  | 0.5494          | 0.6764 | 0.5835    | 0.8045 | None    |
+| 0.5583        | 0.5   | 1000 | 0.5383          | 0.6912 | 0.6070    | 0.8025 | None    |
+| 0.5425        | 0.75  | 1500 | 0.5350          | 0.6938 | 0.6323    | 0.7687 | None    |
+| 0.5367        | 1.0   | 2000 | 0.5300          | 0.7020 | 0.6309    | 0.7912 | None    |
+| 0.4991        | 1.26  | 2500 | 0.5417          | 0.7015 | 0.6592    | 0.7497 | None    |
+| 0.4887        | 1.51  | 3000 | 0.5418          | 0.7009 | 0.6438    | 0.7691 | None    |
+| 0.4859        | 1.76  | 3500 | 0.5432          | 0.6983 | 0.6422    | 0.7650 | None    |
+| 0.4787        | 2.01  | 4000 | 0.5492          | 0.7041 | 0.6376    | 0.7861 | None    |
+| 0.4276        | 2.26  | 4500 | 0.5743          | 0.6879 | 0.6464    | 0.7351 | None    |
 ### Framework versions

config.json CHANGED Viewed

@@ -4,7 +4,7 @@
     "BertForSequenceClassification"
   ],
   "attention_probs_dropout_prob": 0.1,
-  "classifier_dropout": 0.25,
   "gradient_checkpointing": false,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,

     "BertForSequenceClassification"
   ],
   "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": 0.5,
   "gradient_checkpointing": false,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,

config.toml CHANGED Viewed

@@ -1,5 +1,5 @@
 [experiment]
-name = "binary-55"
 type = "binary"
@@ -14,7 +14,7 @@ undersampling_strategy = false
 pretrained_model_name_or_path = "thejosango/nuha-mlm"
 revision = "ce20f497544665775129f9ff5b3cd2a3e350dce8"
 num_hidden_layers = 4
-classifier_dropout = 0.25
 [training]
 num_train_epochs = 5

 [experiment]
+name = "binary-56"
 type = "binary"
 pretrained_model_name_or_path = "thejosango/nuha-mlm"
 revision = "ce20f497544665775129f9ff5b3cd2a3e350dce8"
 num_hidden_layers = 4
+classifier_dropout = 0.50
 [training]
 num_train_epochs = 5

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:28c3aa09ebd3a0c1b7b418bed98c4e2a3db1ba33304f8af556ae95907e3c2cae
 size 313992076

 version https://git-lfs.github.com/spec/v1
+oid sha256:53bc9d93dcdcd0e5cd9c277e391694643dd8356deda25ae33f7a8b50837d49a6
 size 313992076

tokenizer.json CHANGED Viewed

@@ -6,7 +6,14 @@
     "strategy": "LongestFirst",
     "stride": 0
   },
-  "padding": null,
   "added_tokens": [
     {
       "id": 0,

     "strategy": "LongestFirst",
     "stride": 0
   },
+  "padding": {
+    "strategy": "BatchLongest",
+    "direction": "Right",
+    "pad_to_multiple_of": null,
+    "pad_id": 0,
+    "pad_type_id": 0,
+    "pad_token": "[PAD]"
+  },
   "added_tokens": [
     {
       "id": 0,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8a03f95e740df4d0f787430d74d3e1a322dbd96f1199c899477c0651189f7b9e
 size 4091

 version https://git-lfs.github.com/spec/v1
+oid sha256:538dcd3d5266e8ce191235a9b808e1948c5c7bea875e61d84994880afc0a76d0
 size 4091