lesso committed on
Commit
a5d4841
·
verified ·
1 Parent(s): b4a01bf

Training in progress, step 3, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -20,12 +20,12 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "up_proj",
24
  "down_proj",
25
- "k_proj",
26
  "q_proj",
27
  "o_proj",
28
- "gate_proj",
29
  "v_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "gate_proj",
24
  "down_proj",
25
+ "up_proj",
26
  "q_proj",
27
  "o_proj",
28
+ "k_proj",
29
  "v_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac4e49830ca4084ef96f5c95d7ee075a79d349858c85e07cc39702093eaa3455
3
  size 80013120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49746f42e10d14a022ce382d0b0f149a2cab0eb4aa73d58370661e1ee25ce37c
3
  size 80013120
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2671111e7f8b7b54f65ad73c945053eefc3d6789e802b6ccdc864b5ab113e011
3
  size 160172858
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b31d967effc0ea305c9e8a5260be0e8e95ca32237e42ccccff7da79ba25713b5
3
  size 160172858
last-checkpoint/trainer_state.json CHANGED
@@ -10,7 +10,7 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.0008097165991902834,
13
- "grad_norm": 5.536149024963379,
14
  "learning_rate": 2e-05,
15
  "loss": 14.12,
16
  "step": 1
@@ -18,14 +18,14 @@
18
  {
19
  "epoch": 0.0008097165991902834,
20
  "eval_loss": 16.039548873901367,
21
- "eval_runtime": 46.298,
22
- "eval_samples_per_second": 5.637,
23
- "eval_steps_per_second": 5.637,
24
  "step": 1
25
  },
26
  {
27
  "epoch": 0.0016194331983805667,
28
- "grad_norm": 5.57291841506958,
29
  "learning_rate": 4e-05,
30
  "loss": 14.9434,
31
  "step": 2
@@ -34,15 +34,15 @@
34
  "epoch": 0.0024291497975708503,
35
  "grad_norm": NaN,
36
  "learning_rate": 4e-05,
37
- "loss": 17.5653,
38
  "step": 3
39
  },
40
  {
41
  "epoch": 0.0024291497975708503,
42
- "eval_loss": 16.010469436645508,
43
- "eval_runtime": 48.2421,
44
- "eval_samples_per_second": 5.41,
45
- "eval_steps_per_second": 5.41,
46
  "step": 3
47
  }
48
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 0.0008097165991902834,
13
+ "grad_norm": 5.4282379150390625,
14
  "learning_rate": 2e-05,
15
  "loss": 14.12,
16
  "step": 1
 
18
  {
19
  "epoch": 0.0008097165991902834,
20
  "eval_loss": 16.039548873901367,
21
+ "eval_runtime": 47.0534,
22
+ "eval_samples_per_second": 5.547,
23
+ "eval_steps_per_second": 5.547,
24
  "step": 1
25
  },
26
  {
27
  "epoch": 0.0016194331983805667,
28
+ "grad_norm": 5.544086456298828,
29
  "learning_rate": 4e-05,
30
  "loss": 14.9434,
31
  "step": 2
 
34
  "epoch": 0.0024291497975708503,
35
  "grad_norm": NaN,
36
  "learning_rate": 4e-05,
37
+ "loss": 17.5639,
38
  "step": 3
39
  },
40
  {
41
  "epoch": 0.0024291497975708503,
42
+ "eval_loss": 16.009519577026367,
43
+ "eval_runtime": 47.55,
44
+ "eval_samples_per_second": 5.489,
45
+ "eval_steps_per_second": 5.489,
46
  "step": 3
47
  }
48
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc7eb56965fd55276c944caeebbd855891392f90553ede8609b47d5de737c680
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba57699bba9b310c57bde7376897c4b366951d205389ca4384cb9831382eab5b
3
  size 6776