Commit 77b85ad by phunganhsang
1 Parent(s): 2df6ea2

End of training
README.md ADDED
@@ -0,0 +1,114 @@
+ ---
+ library_name: transformers
+ license: agpl-3.0
+ base_model: vinai/phobert-base-v2
+ tags:
+ - generated_from_trainer
+ metrics:
+ - accuracy
+ - f1
+ model-index:
+ - name: PhoBert_Lexical_Dataset45K
+ results: []
+ ---
+
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
+ should probably proofread and complete it, then remove this comment. -->
+
+ # PhoBert_Lexical_Dataset45K
+
+ This model is a fine-tuned version of [vinai/phobert-base-v2](https://huggingface.co/vinai/phobert-base-v2) on an unknown dataset.
+ It achieves the following results on the evaluation set:
+ - Loss: 0.4880
+ - Accuracy: 0.8851
+ - F1: 0.8858
+
+ ## Model description
+
+ More information needed
+
+ ## Intended uses & limitations
+
+ More information needed
+
+ ## Training and evaluation data
+
+ More information needed
+
+ ## Training procedure
+
+ ### Training hyperparameters
+
+ The following hyperparameters were used during training:
+ - learning_rate: 2e-05
+ - train_batch_size: 64
+ - eval_batch_size: 64
+ - seed: 42
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+ - lr_scheduler_type: linear
+ - num_epochs: 15
+
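The hyperparameter list above maps fairly directly onto `transformers.TrainingArguments`. The sketch below is a reconstruction under that assumption; the output directory, evaluation/save strategy, and logging cadence are not recorded in this commit, so those values are placeholders.

```python
# Hedged reconstruction of the card's hyperparameters as TrainingArguments.
# Only learning rate, batch sizes, seed, optimizer betas/epsilon, scheduler,
# and epoch count come from the card; everything else is an assumption.
from transformers import TrainingArguments

training_args = TrainingArguments(
    output_dir="PhoBert_Lexical_Dataset45K",   # assumed output directory
    learning_rate=2e-5,
    per_device_train_batch_size=64,
    per_device_eval_batch_size=64,
    seed=42,
    adam_beta1=0.9,
    adam_beta2=0.999,
    adam_epsilon=1e-8,
    lr_scheduler_type="linear",
    num_train_epochs=15,
    eval_strategy="steps",                     # the results table evaluates every 200 steps
    eval_steps=200,
)
```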
+ ### Training results
+
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 |
+ |:-------------:|:-------:|:-----:|:---------------:|:--------:|:------:|
+ | No log | 0.2841 | 200 | 0.3476 | 0.8474 | 0.8494 |
+ | No log | 0.5682 | 400 | 0.3035 | 0.8692 | 0.8703 |
+ | No log | 0.8523 | 600 | 0.3132 | 0.8654 | 0.8674 |
+ | 0.3678 | 1.1364 | 800 | 0.2832 | 0.8797 | 0.8797 |
+ | 0.3678 | 1.4205 | 1000 | 0.2805 | 0.8828 | 0.8815 |
+ | 0.3678 | 1.7045 | 1200 | 0.2622 | 0.8862 | 0.8874 |
+ | 0.3678 | 1.9886 | 1400 | 0.2751 | 0.8898 | 0.8889 |
+ | 0.2662 | 2.2727 | 1600 | 0.2627 | 0.8873 | 0.8886 |
+ | 0.2662 | 2.5568 | 1800 | 0.2514 | 0.8945 | 0.8940 |
+ | 0.2662 | 2.8409 | 2000 | 0.2433 | 0.8941 | 0.8949 |
+ | 0.219 | 3.125 | 2200 | 0.2600 | 0.8914 | 0.8922 |
+ | 0.219 | 3.4091 | 2400 | 0.2563 | 0.8933 | 0.8937 |
+ | 0.219 | 3.6932 | 2600 | 0.2592 | 0.8909 | 0.8919 |
+ | 0.219 | 3.9773 | 2800 | 0.2390 | 0.8969 | 0.8974 |
+ | 0.1865 | 4.2614 | 3000 | 0.2925 | 0.8820 | 0.8834 |
+ | 0.1865 | 4.5455 | 3200 | 0.2922 | 0.8871 | 0.8883 |
+ | 0.1865 | 4.8295 | 3400 | 0.2975 | 0.8838 | 0.8854 |
+ | 0.1591 | 5.1136 | 3600 | 0.2935 | 0.8920 | 0.8926 |
+ | 0.1591 | 5.3977 | 3800 | 0.2860 | 0.8893 | 0.8901 |
+ | 0.1591 | 5.6818 | 4000 | 0.2943 | 0.8939 | 0.8940 |
+ | 0.1591 | 5.9659 | 4200 | 0.2898 | 0.8970 | 0.8973 |
+ | 0.1394 | 6.25 | 4400 | 0.3268 | 0.8886 | 0.8886 |
+ | 0.1394 | 6.5341 | 4600 | 0.3399 | 0.8804 | 0.8820 |
+ | 0.1394 | 6.8182 | 4800 | 0.3353 | 0.8887 | 0.8894 |
+ | 0.1159 | 7.1023 | 5000 | 0.3313 | 0.8950 | 0.8956 |
+ | 0.1159 | 7.3864 | 5200 | 0.3496 | 0.8955 | 0.8956 |
+ | 0.1159 | 7.6705 | 5400 | 0.3509 | 0.8920 | 0.8925 |
+ | 0.1159 | 7.9545 | 5600 | 0.3534 | 0.8842 | 0.8855 |
+ | 0.1005 | 8.2386 | 5800 | 0.3529 | 0.8932 | 0.8936 |
+ | 0.1005 | 8.5227 | 6000 | 0.3641 | 0.8914 | 0.8916 |
+ | 0.1005 | 8.8068 | 6200 | 0.3572 | 0.8907 | 0.8911 |
+ | 0.0838 | 9.0909 | 6400 | 0.4026 | 0.8873 | 0.8873 |
+ | 0.0838 | 9.375 | 6600 | 0.4049 | 0.8869 | 0.8876 |
+ | 0.0838 | 9.6591 | 6800 | 0.4024 | 0.8808 | 0.8822 |
+ | 0.0838 | 9.9432 | 7000 | 0.4161 | 0.8874 | 0.8886 |
+ | 0.0732 | 10.2273 | 7200 | 0.4098 | 0.8881 | 0.8885 |
+ | 0.0732 | 10.5114 | 7400 | 0.4010 | 0.8880 | 0.8885 |
+ | 0.0732 | 10.7955 | 7600 | 0.4166 | 0.8890 | 0.8891 |
+ | 0.0616 | 11.0795 | 7800 | 0.4317 | 0.8853 | 0.8859 |
+ | 0.0616 | 11.3636 | 8000 | 0.4323 | 0.8878 | 0.8884 |
+ | 0.0616 | 11.6477 | 8200 | 0.4550 | 0.8862 | 0.8872 |
+ | 0.0616 | 11.9318 | 8400 | 0.4509 | 0.8882 | 0.8890 |
+ | 0.0547 | 12.2159 | 8600 | 0.4463 | 0.8871 | 0.8877 |
+ | 0.0547 | 12.5 | 8800 | 0.4705 | 0.8842 | 0.8849 |
+ | 0.0547 | 12.7841 | 9000 | 0.4663 | 0.8876 | 0.8880 |
+ | 0.0472 | 13.0682 | 9200 | 0.4825 | 0.8867 | 0.8876 |
+ | 0.0472 | 13.3523 | 9400 | 0.4796 | 0.8858 | 0.8864 |
+ | 0.0472 | 13.6364 | 9600 | 0.4856 | 0.8853 | 0.8862 |
+ | 0.0472 | 13.9205 | 9800 | 0.4896 | 0.8840 | 0.8851 |
+ | 0.0433 | 14.2045 | 10000 | 0.4810 | 0.8859 | 0.8864 |
+ | 0.0433 | 14.4886 | 10200 | 0.4900 | 0.8842 | 0.8851 |
+ | 0.0433 | 14.7727 | 10400 | 0.4880 | 0.8851 | 0.8858 |
+
+
+ ### Framework versions
+
+ - Transformers 4.44.2
+ - Pytorch 2.1.2
+ - Datasets 2.20.0
+ - Tokenizers 0.19.1
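The card gives evaluation metrics but no usage snippet. Below is a minimal inference sketch, assuming the checkpoint can be loaded through the standard `AutoModelForSequenceClassification` path and that the repository id is `phunganhsang/PhoBert_Lexical_Dataset45K`; neither is confirmed by this commit, and the custom `PhoBertLexical` architecture named in config.json may require its own model class for the weights to load correctly.

```python
# Hedged inference sketch. The repo id is an assumption; config.json declares a
# custom "PhoBertLexical" architecture, so the generic auto class may not map
# every weight and a custom model class could be required instead.
import torch
from transformers import AutoTokenizer, AutoModelForSequenceClassification

repo_id = "phunganhsang/PhoBert_Lexical_Dataset45K"  # assumed repository id
tokenizer = AutoTokenizer.from_pretrained(repo_id)
model = AutoModelForSequenceClassification.from_pretrained(repo_id)
model.eval()

# PhoBERT-family models expect word-segmented Vietnamese input.
text = "Thông_tin này hoàn_toàn bình_thường ."
inputs = tokenizer(text, return_tensors="pt", truncation=True, max_length=256)
with torch.no_grad():
    logits = model(**inputs).logits
pred = logits.argmax(dim=-1).item()
print(model.config.id2label[pred])  # "Bình thường" or "Tính nhiệm thấp"
```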
added_tokens.json ADDED
@@ -0,0 +1,3 @@
+ {
+ "<mask>": 64000
+ }
bpe.codes ADDED
The diff for this file is too large to render. See raw diff
 
config.json ADDED
@@ -0,0 +1,37 @@
+ {
+ "_name_or_path": "vinai/phobert-base-v2",
+ "architectures": [
+ "PhoBertLexical"
+ ],
+ "attention_probs_dropout_prob": 0.1,
+ "bos_token_id": 0,
+ "classifier_dropout": null,
+ "eos_token_id": 2,
+ "hidden_act": "gelu",
+ "hidden_dropout_prob": 0.1,
+ "hidden_size": 768,
+ "id2label": {
+ "0": "B\u00ecnh th\u01b0\u1eddng",
+ "1": "T\u00ednh nhi\u1ec7m th\u1ea5p"
+ },
+ "initializer_range": 0.02,
+ "intermediate_size": 3072,
+ "label2id": {
+ "B\u00ecnh th\u01b0\u1eddng": 0,
+ "T\u00ednh nhi\u1ec7m th\u1ea5p": 1
+ },
+ "layer_norm_eps": 1e-05,
+ "max_position_embeddings": 258,
+ "model_type": "roberta",
+ "num_attention_heads": 12,
+ "num_classes": 2,
+ "num_hidden_layers": 12,
+ "pad_token_id": 1,
+ "position_embedding_type": "absolute",
+ "tokenizer_class": "PhobertTokenizer",
+ "torch_dtype": "float32",
+ "transformers_version": "4.44.2",
+ "type_vocab_size": 1,
+ "use_cache": true,
+ "vocab_size": 64001
+ }
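The escaped strings in `id2label` decode to Vietnamese class names: "Bình thường" (roughly "normal") and "Tính nhiệm thấp" (roughly "low credibility"). The mapping can be inspected without downloading the weights, as in the sketch below, again assuming the repo id used in the earlier example.

```python
# Minimal sketch: read the classification labels and key sizes from config.json
# only (no model weights). The repo id is an assumption.
from transformers import AutoConfig

config = AutoConfig.from_pretrained("phunganhsang/PhoBert_Lexical_Dataset45K")
print(config.id2label)                 # {0: 'Bình thường', 1: 'Tính nhiệm thấp'}
print(config.max_position_embeddings)  # 258
print(config.vocab_size)               # 64001
```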
model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:66bf97a0d03400e94ef827ea14b689f5f1d371ff76d7964ccf21114b445affab
+ size 538468008
special_tokens_map.json ADDED
@@ -0,0 +1,9 @@
+ {
+ "bos_token": "<s>",
+ "cls_token": "<s>",
+ "eos_token": "</s>",
+ "mask_token": "<mask>",
+ "pad_token": "<pad>",
+ "sep_token": "</s>",
+ "unk_token": "<unk>"
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,54 @@
+ {
+ "added_tokens_decoder": {
+ "0": {
+ "content": "<s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "1": {
+ "content": "<pad>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "2": {
+ "content": "</s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "3": {
+ "content": "<unk>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "64000": {
+ "content": "<mask>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ }
+ },
+ "bos_token": "<s>",
+ "clean_up_tokenization_spaces": true,
+ "cls_token": "<s>",
+ "eos_token": "</s>",
+ "mask_token": "<mask>",
+ "model_max_length": 1000000000000000019884624838656,
+ "pad_token": "<pad>",
+ "sep_token": "</s>",
+ "tokenizer_class": "PhobertTokenizer",
+ "unk_token": "<unk>"
+ }
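The tokenizer files register `PhobertTokenizer` with the standard RoBERTa-style special tokens and an effectively unbounded `model_max_length` (the 258-position limit lives in config.json instead). PhoBERT checkpoints are trained on word-segmented Vietnamese, so raw text is usually segmented before encoding; the sketch below uses `pyvi` for that step, which is an assumption, since this repository does not say which segmenter, if any, was used to build the training data.

```python
# Hedged sketch: word-segment Vietnamese text before PhobertTokenizer.
# pyvi (pip install pyvi) is one common segmenter; it is not confirmed by this repo.
from pyvi import ViTokenizer
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("phunganhsang/PhoBert_Lexical_Dataset45K")  # assumed repo id
raw = "Thông tin này có đáng tin cậy hay không?"
segmented = ViTokenizer.tokenize(raw)  # joins multi-syllable words with underscores
enc = tokenizer(segmented, truncation=True, max_length=256, return_tensors="pt")
print(tokenizer.convert_ids_to_tokens(enc["input_ids"][0]))
```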
training_args.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:b5ca6b40e044ac8c03746c84895aaa1c4a450d33e9ad6858384f8d18dc8910cc
+ size 5176
vocab.txt ADDED
The diff for this file is too large to render. See raw diff