File size: 2,041 Bytes
dbfa988
a3a68ac
dbfa988
a3a68ac
dbfa988
a3a68ac
dbfa988
 
 
 
 
 
 
a3a68ac
dbfa988
 
 
 
 
a3a68ac
dbfa988
 
 
 
 
a3a68ac
dbfa988
 
 
 
 
a3a68ac
dbfa988
 
 
 
 
a3a68ac
dbfa988
 
 
 
 
a3a68ac
dbfa988
 
 
 
 
a3a68ac
dbfa988
 
 
 
 
a3a68ac
dbfa988
 
 
 
a3a68ac
 
 
 
 
dbfa988
 
 
a3a68ac
 
 
dbfa988
a3a68ac
 
 
dbfa988
 
 
 
 
 
 
a3a68ac
dbfa988
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
{
  "best_metric": 3.3333333333333335,
  "best_model_checkpoint": "/cosmos/home/sp-operator/ai/training/models/huggingface/scripts/../breeze-listen-dsw-base-te/checkpoint-200",
  "epoch": 99.001,
  "eval_steps": 200,
  "global_step": 200,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 12.0,
      "learning_rate": 4.973833272194737e-06,
      "loss": 1.7212,
      "step": 25
    },
    {
      "epoch": 24.0,
      "learning_rate": 6.195318418690893e-06,
      "loss": 1.1394,
      "step": 50
    },
    {
      "epoch": 37.0,
      "learning_rate": 6.881634451095711e-06,
      "loss": 0.5083,
      "step": 75
    },
    {
      "epoch": 49.0,
      "learning_rate": 7.361221988663844e-06,
      "loss": 0.1183,
      "step": 100
    },
    {
      "epoch": 62.0,
      "learning_rate": 7.730207550743121e-06,
      "loss": 0.022,
      "step": 125
    },
    {
      "epoch": 74.0,
      "learning_rate": 8.03016458599496e-06,
      "loss": 0.005,
      "step": 150
    },
    {
      "epoch": 87.0,
      "learning_rate": 8.282894746203441e-06,
      "loss": 0.0016,
      "step": 175
    },
    {
      "epoch": 99.0,
      "learning_rate": 8.501266121799902e-06,
      "loss": 0.0008,
      "step": 200
    },
    {
      "epoch": 99.0,
      "eval_loss": 0.05462646484375,
      "eval_runtime": 53.8277,
      "eval_samples_per_second": 0.725,
      "eval_steps_per_second": 0.056,
      "eval_wer": 3.3333333333333335,
      "step": 200
    },
    {
      "epoch": 99.0,
      "step": 200,
      "total_flos": 2.2700998962393907e+17,
      "train_loss": 0.0,
      "train_runtime": 2.6625,
      "train_samples_per_second": 24037.247,
      "train_steps_per_second": 751.164
    }
  ],
  "logging_steps": 25,
  "max_steps": 2000,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 9223372036854775807,
  "save_steps": 200,
  "total_flos": 2.2700998962393907e+17,
  "train_batch_size": 32,
  "trial_name": null,
  "trial_params": null
}