stuser2023 committed on
Commit
c85eed8
1 Parent(s): 82d6c7a

Training in progress, epoch 2

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0719fed60e9318276761def82f7efa080ae59ab6c2baf25c074e5ce01b18e5ca
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c77554997fc9372d2f41138d5724d1fb0cf6940cbf2e4a35b5ff66d9db597aaf
3
  size 267832560
run-0/checkpoint-2138/config.json CHANGED
@@ -20,6 +20,6 @@
20
  "sinusoidal_pos_embds": false,
21
  "tie_weights_": true,
22
  "torch_dtype": "float32",
23
- "transformers_version": "4.35.2",
24
  "vocab_size": 30522
25
  }
 
20
  "sinusoidal_pos_embds": false,
21
  "tie_weights_": true,
22
  "torch_dtype": "float32",
23
+ "transformers_version": "4.38.2",
24
  "vocab_size": 30522
25
  }
run-0/checkpoint-2138/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4a449f5ba8d475db833357bb2a8e66d95f049863cfcf9a02e6b387a5e18218e
3
  size 267832560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c77554997fc9372d2f41138d5724d1fb0cf6940cbf2e4a35b5ff66d9db597aaf
3
  size 267832560
run-0/checkpoint-2138/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed069420c568f99a89b1955fe08ef09cb877b068c6d8a9fb7b78bc7e3e9e1704
3
  size 535727290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7c4acbf29aee80bdaedfcc1ecdb85d5eb6e4e2b3b53854a2fe2810c68f8e681
3
  size 535727290
run-0/checkpoint-2138/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:172382e51eea4b612f92e96325ff52d51e3f94993499db917d83eb34dc31402c
3
- size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ecee28ec0d36e12d2a69d8440b854f0bb324c6899b79460571e75a4f0858ec9
3
+ size 14308
run-0/checkpoint-2138/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c60e27aef9e14addcecd59a048c0436b9257803bc2e4a736b74b3d2ea97f1435
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b764fbf1f3cb45f22e3739f3d6144dc33a78eb8bc8dc38b08acdc1f16b7b1adc
3
  size 1064
run-0/checkpoint-2138/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.12300105566407585,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-0/checkpoint-2138",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
@@ -10,57 +10,63 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.47,
13
- "learning_rate": 9.447053301406701e-07,
14
- "loss": 0.6327,
 
15
  "step": 500
16
  },
17
  {
18
  "epoch": 0.94,
19
- "learning_rate": 7.702122880016472e-07,
20
- "loss": 0.5907,
 
21
  "step": 1000
22
  },
23
  {
24
  "epoch": 1.0,
25
- "eval_loss": 0.5891121625900269,
26
- "eval_matthews_correlation": 0.0,
27
- "eval_runtime": 0.6963,
28
- "eval_samples_per_second": 1497.889,
29
- "eval_steps_per_second": 94.785,
30
  "step": 1069
31
  },
32
  {
33
  "epoch": 1.4,
34
- "learning_rate": 5.957192458626242e-07,
35
- "loss": 0.5573,
 
36
  "step": 1500
37
  },
38
  {
39
  "epoch": 1.87,
40
- "learning_rate": 4.2122620372360136e-07,
41
- "loss": 0.5487,
 
42
  "step": 2000
43
  },
44
  {
45
  "epoch": 2.0,
46
- "eval_loss": 0.55595862865448,
47
- "eval_matthews_correlation": 0.12300105566407585,
48
- "eval_runtime": 0.7049,
49
- "eval_samples_per_second": 1479.688,
50
- "eval_steps_per_second": 93.633,
51
  "step": 2138
52
  }
53
  ],
54
  "logging_steps": 500,
55
  "max_steps": 3207,
 
56
  "num_train_epochs": 3,
57
  "save_steps": 500,
58
- "total_flos": 75548589472164.0,
 
59
  "trial_name": null,
60
  "trial_params": {
61
- "learning_rate": 1.119198372279693e-06,
62
  "num_train_epochs": 3,
63
  "per_device_train_batch_size": 8,
64
- "seed": 19
65
  }
66
  }
 
1
  {
2
+ "best_metric": 0.41870797137315424,
3
  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-0/checkpoint-2138",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.47,
13
+ "grad_norm": 5.35684061050415,
14
+ "learning_rate": 2.775809181053764e-06,
15
+ "loss": 0.5956,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.94,
20
+ "grad_norm": 11.188376426696777,
21
+ "learning_rate": 2.263099690648562e-06,
22
+ "loss": 0.5375,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 1.0,
27
+ "eval_loss": 0.5379385948181152,
28
+ "eval_matthews_correlation": 0.29871168199754417,
29
+ "eval_runtime": 0.7649,
30
+ "eval_samples_per_second": 1363.614,
31
+ "eval_steps_per_second": 86.288,
32
  "step": 1069
33
  },
34
  {
35
  "epoch": 1.4,
36
+ "grad_norm": 10.391807556152344,
37
+ "learning_rate": 1.7503902002433598e-06,
38
+ "loss": 0.4937,
39
  "step": 1500
40
  },
41
  {
42
  "epoch": 1.87,
43
+ "grad_norm": 19.357559204101562,
44
+ "learning_rate": 1.2376807098381578e-06,
45
+ "loss": 0.4738,
46
  "step": 2000
47
  },
48
  {
49
  "epoch": 2.0,
50
+ "eval_loss": 0.526983916759491,
51
+ "eval_matthews_correlation": 0.41870797137315424,
52
+ "eval_runtime": 0.7468,
53
+ "eval_samples_per_second": 1396.551,
54
+ "eval_steps_per_second": 88.372,
55
  "step": 2138
56
  }
57
  ],
58
  "logging_steps": 500,
59
  "max_steps": 3207,
60
+ "num_input_tokens_seen": 0,
61
  "num_train_epochs": 3,
62
  "save_steps": 500,
63
+ "total_flos": 75492963513744.0,
64
+ "train_batch_size": 8,
65
  "trial_name": null,
66
  "trial_params": {
67
+ "learning_rate": 3.288518671458966e-06,
68
  "num_train_epochs": 3,
69
  "per_device_train_batch_size": 8,
70
+ "seed": 24
71
  }
72
  }
run-0/checkpoint-2138/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2697eed6b7ac5cb3358c6f6a74efea40e321a5f5e6bfffafbe5f4a6b261625ae
3
- size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d71decb8fd1c3b29f479f69dd55dfb41734b34761f0097d998f78bf9dd25bdb
3
+ size 4984
runs/Mar16_01-46-29_6e5f088ca464/events.out.tfevents.1710553848.6e5f088ca464.226.2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0778b483e02ac32d52ec3b2a5dfa1bb4b42ba00cdcaa3f12b4939d2d6ca472f
3
- size 5345
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac7778f58cb3039c820ca741293fa3121735d684832990ccb4eded482d24e50a
3
+ size 6102