joshcarp committed on
Commit
905dbb1
1 Parent(s): d72d61f

Model save

Browse files
Files changed (3) hide show
  1. README.md +27 -12
  2. generation_config.json +1 -1
  3. model.safetensors +1 -1
README.md CHANGED
@@ -1,8 +1,8 @@
1
  ---
2
  license: mit
 
3
  tags:
4
  - generated_from_trainer
5
- base_model: gpt2
6
  model-index:
7
  - name: gpt2-evy
8
  results: []
@@ -15,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
- - Loss: 1.2879
19
 
20
  ## Model description
21
 
@@ -46,19 +46,34 @@ The following hyperparameters were used during training:
46
 
47
  | Training Loss | Epoch | Step | Validation Loss |
48
  |:-------------:|:-----:|:----:|:---------------:|
49
- | No log | 1.0 | 48 | 1.4347 |
50
- | No log | 2.0 | 96 | 1.2810 |
51
- | 1.3199 | 3.0 | 144 | 1.2442 |
52
- | 1.3199 | 4.0 | 192 | 1.2476 |
53
- | 0.879 | 5.0 | 240 | 1.2303 |
54
- | 0.879 | 6.0 | 288 | 1.2328 |
55
- | 0.7449 | 7.0 | 336 | 1.2577 |
56
- | 0.7449 | 8.0 | 384 | 1.2879 |
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
 
58
 
59
  ### Framework versions
60
 
61
- - Transformers 4.40.2
62
- - Pytorch 2.2.1+cu121
63
  - Datasets 2.19.1
64
  - Tokenizers 0.19.1
 
1
  ---
2
  license: mit
3
+ base_model: gpt2
4
  tags:
5
  - generated_from_trainer
 
6
  model-index:
7
  - name: gpt2-evy
8
  results: []
 
15
 
16
  This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
+ - Loss: 0.5637
19
 
20
  ## Model description
21
 
 
46
 
47
  | Training Loss | Epoch | Step | Validation Loss |
48
  |:-------------:|:-----:|:----:|:---------------:|
49
+ | No log | 1.0 | 31 | 1.1270 |
50
+ | No log | 2.0 | 62 | 0.9170 |
51
+ | No log | 3.0 | 93 | 0.8410 |
52
+ | 1.3727 | 4.0 | 124 | 0.7949 |
53
+ | 1.3727 | 5.0 | 155 | 0.7361 |
54
+ | 1.3727 | 6.0 | 186 | 0.7021 |
55
+ | 0.9077 | 7.0 | 217 | 0.6789 |
56
+ | 0.9077 | 8.0 | 248 | 0.6490 |
57
+ | 0.9077 | 9.0 | 279 | 0.6346 |
58
+ | 0.7106 | 10.0 | 310 | 0.6219 |
59
+ | 0.7106 | 11.0 | 341 | 0.5986 |
60
+ | 0.7106 | 12.0 | 372 | 0.5797 |
61
+ | 0.5814 | 13.0 | 403 | 0.5835 |
62
+ | 0.5814 | 14.0 | 434 | 0.5872 |
63
+ | 0.5814 | 15.0 | 465 | 0.5741 |
64
+ | 0.5814 | 16.0 | 496 | 0.5749 |
65
+ | 0.4916 | 17.0 | 527 | 0.5662 |
66
+ | 0.4916 | 18.0 | 558 | 0.5529 |
67
+ | 0.4916 | 19.0 | 589 | 0.5672 |
68
+ | 0.4005 | 20.0 | 620 | 0.5646 |
69
+ | 0.4005 | 21.0 | 651 | 0.5701 |
70
+ | 0.4005 | 22.0 | 682 | 0.5650 |
71
+ | 0.357 | 23.0 | 713 | 0.5637 |
72
 
73
 
74
  ### Framework versions
75
 
76
+ - Transformers 4.41.0
77
+ - Pytorch 2.3.0+cu121
78
  - Datasets 2.19.1
79
  - Tokenizers 0.19.1
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 50256,
4
  "eos_token_id": 50256,
5
- "transformers_version": "4.40.2"
6
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 50256,
4
  "eos_token_id": 50256,
5
+ "transformers_version": "4.41.0"
6
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e206e896c82a075a90bf2f86649f9387e71855d3224a755c0e77e107618921cc
3
  size 497774208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5c0e35f2d813737a44ac311005bc894f3066454328f76553174304565eb1471
3
  size 497774208