AlekseyKorshuk committed on
Commit
ca209f5
1 Parent(s): 1790f07

huggingartists

Browse files
Files changed (7) hide show
  1. README.md +3 -3
  2. evaluation.txt +1 -1
  3. optimizer.pt +1 -1
  4. rng_state.pth +1 -1
  5. scheduler.pt +1 -1
  6. trainer_state.json +14 -6
  7. training_args.bin +1 -1
README.md CHANGED
@@ -45,15 +45,15 @@ from datasets import load_dataset
45
  dataset = load_dataset("huggingartists/queen")
46
  ```
47
 
48
- [Explore the data](https://wandb.ai/huggingartists/huggingartists/runs/29edwcv0/artifacts), which is tracked with [W&B artifacts](https://docs.wandb.com/artifacts) at every step of the pipeline.
49
 
50
  ## Training procedure
51
 
52
  The model is based on a pre-trained [GPT-2](https://huggingface.co/gpt2) which is fine-tuned on Queen's lyrics.
53
 
54
- Hyperparameters and metrics are recorded in the [W&B training run](https://wandb.ai/huggingartists/huggingartists/runs/135qvcfh) for full transparency and reproducibility.
55
 
56
- At the end of training, [the final model](https://wandb.ai/huggingartists/huggingartists/runs/135qvcfh/artifacts) is logged and versioned.
57
 
58
  ## How to use
59
 
 
45
  dataset = load_dataset("huggingartists/queen")
46
  ```
47
 
48
+ [Explore the data](https://wandb.ai/huggingartists/huggingartists/runs/1odfy5f2/artifacts), which is tracked with [W&B artifacts](https://docs.wandb.com/artifacts) at every step of the pipeline.
49
 
50
  ## Training procedure
51
 
52
  The model is based on a pre-trained [GPT-2](https://huggingface.co/gpt2) which is fine-tuned on Queen's lyrics.
53
 
54
+ Hyperparameters and metrics are recorded in the [W&B training run](https://wandb.ai/huggingartists/huggingartists/runs/n5mutjgn) for full transparency and reproducibility.
55
 
56
+ At the end of training, [the final model](https://wandb.ai/huggingartists/huggingartists/runs/n5mutjgn/artifacts) is logged and versioned.
57
 
58
  ## How to use
59
 
evaluation.txt CHANGED
@@ -1 +1 @@
1
- {"eval_loss": 0.9767317771911621, "eval_runtime": 2.1966, "eval_samples_per_second": 43.704, "eval_steps_per_second": 5.463, "epoch": 12.0}
 
1
+ {"eval_loss": 0.7435600757598877, "eval_runtime": 1.9524, "eval_samples_per_second": 44.56, "eval_steps_per_second": 5.634, "epoch": 2.0}
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ee8cef8141948570d21835c08d084a9b314fbdef3ba8f904e6e203013456a0d
3
  size 995604017
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c66880bc32b68f34b3eb7af0a61b4e00e160a67a148722eca25b7babef5c4229
3
  size 995604017
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:afadc6c82078abf8ebc3154d7c31c5702ef7fa29db799979801c5d8393338a19
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad122a9ca484f0a33b6603349e6dcbd96996d2bf9f426d0ada5eb32987c4387e
3
  size 14503
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d825f1ad452557c55ae3db5704cfc8ff0c2aef068797ec1bf426331ec8788e52
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:243af1ebed26a3a8d0b96be16a026fc3571686ab7c16190d8dea7c3ff4208aee
3
  size 623
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.9767317771911621,
3
- "best_model_checkpoint": "output/queen/checkpoint-68",
4
  "epoch": 1.0,
5
- "global_step": 68,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -92,11 +92,19 @@
92
  "eval_samples_per_second": 46.272,
93
  "eval_steps_per_second": 5.784,
94
  "step": 68
 
 
 
 
 
 
 
 
95
  }
96
  ],
97
- "max_steps": 816,
98
- "num_train_epochs": 12,
99
- "total_flos": 70156910592000.0,
100
  "trial_name": null,
101
  "trial_params": null
102
  }
 
1
  {
2
+ "best_metric": 0.7435600757598877,
3
+ "best_model_checkpoint": "output/queen/checkpoint-69",
4
  "epoch": 1.0,
5
+ "global_step": 69,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
92
  "eval_samples_per_second": 46.272,
93
  "eval_steps_per_second": 5.784,
94
  "step": 68
95
+ },
96
+ {
97
+ "epoch": 1.0,
98
+ "eval_loss": 0.7435600757598877,
99
+ "eval_runtime": 1.811,
100
+ "eval_samples_per_second": 48.039,
101
+ "eval_steps_per_second": 6.074,
102
+ "step": 69
103
  }
104
  ],
105
+ "max_steps": 138,
106
+ "num_train_epochs": 2,
107
+ "total_flos": 70418202624000.0,
108
  "trial_name": null,
109
  "trial_params": null
110
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de2b73e108df809dd60f215a7871329eac5738c939f3a5b41fa7a79d90523567
3
  size 3311
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3276c6263f8b9603729e374cfea7b7138a847c1c3c8a37df36295a1f7cfc5e34
3
  size 3311