xEricCardozo committed on
Commit 21052c5 · 1 Parent(s): 3a297a0

End of training

README.md CHANGED
@@ -14,7 +14,7 @@ should probably proofread and complete it, then remove this comment. -->
  
  This model is a fine-tuned version of [dccuchile/bert-base-spanish-wwm-uncased](https://huggingface.co/dccuchile/bert-base-spanish-wwm-uncased) on an unknown dataset.
  It achieves the following results on the evaluation set:
- - Loss: 2.4346
+ - Loss: 2.1710
  
  ## Model description
  
@@ -40,21 +40,22 @@ The following hyperparameters were used during training:
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
  - lr_scheduler_type: linear
  - num_epochs: 5
+ - mixed_precision_training: Native AMP
  
  ### Training results
  
  | Training Loss | Epoch | Step | Validation Loss |
  |:-------------:|:-----:|:----:|:---------------:|
- | 4.1178        | 1.0   | 35   | 3.5855          |
- | 3.0127        | 2.0   | 70   | 2.7329          |
- | 2.6519        | 3.0   | 105  | 2.7326          |
- | 2.5643        | 4.0   | 140  | 2.5444          |
- | 2.2931        | 5.0   | 175  | 2.3511          |
+ | 3.9411        | 1.0   | 35   | 3.4726          |
+ | 2.9468        | 2.0   | 70   | 2.7930          |
+ | 2.631         | 3.0   | 105  | 2.4120          |
+ | 2.3962        | 4.0   | 140  | 2.4462          |
+ | 2.3435        | 5.0   | 175  | 2.5299          |
  
  
  ### Framework versions
  
- - Transformers 4.33.1
- - Pytorch 2.0.1+cu118
- - Datasets 2.14.5
- - Tokenizers 0.13.3
+ - Transformers 4.35.2
+ - Pytorch 2.1.0+cu118
+ - Datasets 2.15.0
+ - Tokenizers 0.15.0
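The added `mixed_precision_training: Native AMP` line corresponds to enabling fp16 in the `Trainer` setup. Below is a minimal sketch of the equivalent `TrainingArguments`, assuming the standard `Trainer` API was used; only the hyperparameters visible in this hunk are set (learning rate and batch sizes are not shown in the diff, so they are left at their defaults), and `output_dir` is hypothetical.

```python
from transformers import TrainingArguments

# Sketch reconstructed from the README hunk above, not the author's exact script.
training_args = TrainingArguments(
    output_dir="outputs",        # hypothetical
    num_train_epochs=5,          # num_epochs: 5
    lr_scheduler_type="linear",  # lr_scheduler_type: linear
    adam_beta1=0.9,              # optimizer: Adam with betas=(0.9,0.999)
    adam_beta2=0.999,
    adam_epsilon=1e-08,          # ... and epsilon=1e-08
    fp16=True,                   # mixed_precision_training: Native AMP
)
```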
config.json CHANGED
@@ -20,7 +20,7 @@
    "pad_token_id": 1,
    "position_embedding_type": "absolute",
    "torch_dtype": "float32",
-   "transformers_version": "4.33.1",
+   "transformers_version": "4.35.2",
    "type_vocab_size": 2,
    "use_cache": true,
    "vocab_size": 31002
generation_config.json CHANGED
@@ -1,5 +1,5 @@
  {
    "_from_model_config": true,
    "pad_token_id": 1,
-   "transformers_version": "4.33.1"
+   "transformers_version": "4.35.2"
  }
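Both JSON files change only their recorded `transformers_version`. A quick way to confirm which release a checkpoint was saved with, assuming a hypothetical local checkpoint path:

```python
from transformers import AutoConfig, GenerationConfig

path = "path/to/checkpoint"  # hypothetical
config = AutoConfig.from_pretrained(path)
gen_config = GenerationConfig.from_pretrained(path)
print(config.transformers_version, gen_config.transformers_version)  # "4.35.2" after this commit
```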
model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:8aa039cf17575c55f661460560e8f8147866191bb2b51c8fd7ec8b5f04e58ef5
+ size 439557376
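The three lines added here are a Git LFS pointer, not the weights themselves; the `size` field says the real file is 439,557,376 bytes, consistent with a BERT-base model stored in float32 (~110M parameters × 4 bytes). A sketch of inspecting the weights once `git lfs pull` has fetched them into the working tree:

```python
from safetensors.torch import load_file

# Assumes the LFS object has been fetched; otherwise this file is just the pointer.
state_dict = load_file("model.safetensors")
total_params = sum(t.numel() for t in state_dict.values())
print(f"{total_params:,} parameters")  # roughly 110M for BERT-base
```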
special_tokens_map.json CHANGED
@@ -1,7 +1,37 @@
  {
- "cls_token": "[CLS]",
- "mask_token": "[MASK]",
- "pad_token": "[PAD]",
- "sep_token": "[SEP]",
- "unk_token": "[UNK]"
+ "cls_token": {
+   "content": "[CLS]",
+   "lstrip": false,
+   "normalized": false,
+   "rstrip": false,
+   "single_word": false
+ },
+ "mask_token": {
+   "content": "[MASK]",
+   "lstrip": false,
+   "normalized": false,
+   "rstrip": false,
+   "single_word": false
+ },
+ "pad_token": {
+   "content": "[PAD]",
+   "lstrip": false,
+   "normalized": false,
+   "rstrip": false,
+   "single_word": false
+ },
+ "sep_token": {
+   "content": "[SEP]",
+   "lstrip": false,
+   "normalized": false,
+   "rstrip": false,
+   "single_word": false
+ },
+ "unk_token": {
+   "content": "[UNK]",
+   "lstrip": false,
+   "normalized": false,
+   "rstrip": false,
+   "single_word": false
+ }
  }
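This rewrite replaces bare token strings with the full `AddedToken`-style serialization that newer Transformers releases write; the token strings themselves are unchanged. Loaded through `AutoTokenizer`, both formats behave the same, as a quick check shows (the checkpoint path is hypothetical):

```python
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("path/to/checkpoint")  # hypothetical
# special_tokens_map still reports plain strings regardless of the on-disk format
print(tokenizer.special_tokens_map)  # {'cls_token': '[CLS]', 'mask_token': '[MASK]', ...}
print(tokenizer.cls_token_id, tokenizer.sep_token_id)
```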
tokenizer_config.json CHANGED
@@ -1,5 +1,47 @@
  {
    "TOKENIZERS_PARALLELISM": false,
+   "added_tokens_decoder": {
+     "0": {
+       "content": "[MASK]",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "1": {
+       "content": "[PAD]",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "3": {
+       "content": "[UNK]",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "4": {
+       "content": "[CLS]",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "5": {
+       "content": "[SEP]",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     }
+   },
    "clean_up_tokenization_spaces": true,
    "cls_token": "[CLS]",
    "do_basic_tokenize": true,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:d02a894340e02f30a81fcce59bb0cc00774f4dc2e64aeffdde355811f6ee14dd
- size 4027
+ oid sha256:58fc6e5f2eed403814830789fdae13ae6366d8742252ab5d6159aa45e8a8faf4
+ size 4600
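`training_args.bin` is a pickled `TrainingArguments` object, so its size shifts whenever fields change between releases (here 4027 → 4600 bytes across the 4.33 → 4.35 upgrade). It can be inspected directly, with the usual caveat that unpickling requires trusting the file:

```python
import torch

# training_args.bin is a pickle, so only load checkpoints you trust.
args = torch.load("training_args.bin", weights_only=False)
print(args.num_train_epochs, args.lr_scheduler_type, args.fp16)
```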