End of training

Browse files

Files changed (8) hide show

README.md +83 -0
config.json +1 -1
generation_config.json +8 -0
model.safetensors +1 -1
runs/Jun03_14-29-44_d532e7250bcf/events.out.tfevents.1717425200.d532e7250bcf.24.0 +3 -0
runs/Jun03_14-29-44_d532e7250bcf/events.out.tfevents.1717465648.d532e7250bcf.24.1 +3 -0
tokenizer_config.json +4 -0
training_args.bin +1 -1

README.md ADDED Viewed

	@@ -0,0 +1,83 @@

+---
+base_model: Zelyanoth/my_fon_translation_model
+tags:
+- generated_from_trainer
+datasets:
+- generator
+metrics:
+- bleu
+model-index:
+- name: my_fon_translation_model
+  results:
+  - task:
+      name: Sequence-to-sequence Language Modeling
+      type: text2text-generation
+    dataset:
+      name: generator
+      type: generator
+      config: default
+      split: train
+      args: default
+    metrics:
+    - name: Bleu
+      type: bleu
+      value: 4.6993
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# my_fon_translation_model
+This model is a fine-tuned version of [Zelyanoth/my_fon_translation_model](https://huggingface.co/Zelyanoth/my_fon_translation_model) on the generator dataset.
+It achieves the following results on the evaluation set (final checkpoint, after epoch 9):
+- Loss: 5.3862
+- Bleu: 4.6993
+- Gen Len: 8.9558
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 1.87e-05
+- train_batch_size: 8
+- eval_batch_size: 8
+- seed: 42
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: linear
+- num_epochs: 9
+### Training results
+| Training Loss | Epoch | Step   | Validation Loss | Bleu   | Gen Len |
+|:-------------:|:-----:|:------:|:---------------:|:------:|:-------:|
+| 1.3141        | 1.0   | 13165  | 5.0069          | 3.3364 | 9.1891  |
+| 1.1534        | 2.0   | 26330  | 5.1888          | 3.7137 | 9.1076  |
+| 1.1158        | 3.0   | 39495  | 5.1695          | 4.1907 | 8.9998  |
+| 0.9801        | 4.0   | 52660  | 5.2281          | 4.2697 | 8.8066  |
+| 0.9410        | 5.0   | 65825  | 5.3425          | 4.3691 | 9.0261  |
+| 0.8676        | 6.0   | 78990  | 5.3371          | 4.0892 | 9.3749  |
+| 0.8247        | 7.0   | 92155  | 5.3622          | 4.4876 | 9.1058  |
+| 0.7925        | 8.0   | 105320 | 5.3538          | 4.7280 | 8.9704  |
+| 0.7639        | 9.0   | 118485 | 5.3862          | 4.6993 | 8.9558  |
+### Framework versions
+- Transformers 4.39.3
+- Pytorch 2.1.2
+- Datasets 2.18.0
+- Tokenizers 0.15.2

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "facebook/nllb-200-distilled-600M",
   "activation_dropout": 0.0,
   "activation_function": "relu",
   "architectures": [

 {
+  "_name_or_path": "Zelyanoth/my_fon_translation_model",
   "activation_dropout": 0.0,
   "activation_function": "relu",
   "architectures": [

generation_config.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+  "bos_token_id": 0,
+  "decoder_start_token_id": 2,
+  "eos_token_id": 2,
+  "max_length": 200,
+  "pad_token_id": 1,
+  "transformers_version": "4.39.3"
+}

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:12e7afa0895df9fe5407e11567f0b10e4042b1118e54a4cb9cecd0760ebd5d75
 size 2460354912

 version https://git-lfs.github.com/spec/v1
+oid sha256:73c59a394f1e8374730089541779b0f587d0aeeb81a3fd5ae7cf0d1d4401bdc3
 size 2460354912

runs/Jun03_14-29-44_d532e7250bcf/events.out.tfevents.1717425200.d532e7250bcf.24.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:03b8b008cb81b285acab91ce9d7990c35b18bddf723493ae63853d38fc6e2896
+size 59699

runs/Jun03_14-29-44_d532e7250bcf/events.out.tfevents.1717465648.d532e7250bcf.24.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4c675917f89de83756c804e23868f6b0ebbfba8fbf99090d5cb229cbc2c36952
+size 465

tokenizer_config.json CHANGED Viewed

@@ -1867,12 +1867,16 @@
   "eos_token": "</s>",
   "legacy_behaviour": false,
   "mask_token": "<mask>",
   "model_max_length": 1024,
   "pad_token": "<pad>",
   "sep_token": "</s>",
   "sp_model_kwargs": {},
   "src_lang": "fon_Latn",
   "tgt_lang": "fra_Latn",
   "tokenizer_class": "NllbTokenizer",
   "unk_token": "<unk>"
 }

   "eos_token": "</s>",
   "legacy_behaviour": false,
   "mask_token": "<mask>",
+  "max_length": 512,
   "model_max_length": 1024,
   "pad_token": "<pad>",
   "sep_token": "</s>",
   "sp_model_kwargs": {},
   "src_lang": "fon_Latn",
+  "stride": 0,
   "tgt_lang": "fra_Latn",
   "tokenizer_class": "NllbTokenizer",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
   "unk_token": "<unk>"
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0baa59cf2a8cd1535166b1cc266c56543e8dab8d8952c7a482ef4e7f13cf0dcb
 size 5112

 version https://git-lfs.github.com/spec/v1
+oid sha256:272cc57eb8a21f9aeb7fc2b7016f258cfb8a4278ee75da9d3d982fb6f8078634
 size 5112