willtensora committed on
Commit
1f00c9f
·
verified ·
1 Parent(s): 32797a5

Training in progress, epoch 0, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "q_proj",
24
  "v_proj",
 
 
25
  "o_proj",
26
- "gate_proj",
27
- "up_proj",
28
  "k_proj",
29
- "down_proj"
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "v_proj",
24
+ "q_proj",
25
+ "down_proj",
26
  "o_proj",
 
 
27
  "k_proj",
28
+ "up_proj",
29
+ "gate_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91a9ea1223ba85bbea9348c544be11652f89e0e757979feed1bcb01f6c918891
3
  size 25271744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b49608e88641713ee5a2f11cc0f9b4df4195c3ece8e936a8dd4dced5882d814
3
  size 25271744
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:336c1293365b64ddb78543f3bc45d81537f442d08bc1806978f0ed670257d124
3
  size 13685516
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea761731c07c68e93df9c9f52a0c1f1bc01f318ce497dba7102ff183eda25794
3
  size 13685516
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9999fe17ac6d10df0b24edf483ce019f56daddfb3edc069a21c03ccaa11df1b8
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a833f22f25ea3834727974efdfc06b3927711900cd9acb75c7c0258b248c9673
3
  size 14244
last-checkpoint/trainer_state.json CHANGED
@@ -10,24 +10,24 @@
10
  "log_history": [
11
  {
12
  "epoch": 6.727664155005382e-05,
13
- "grad_norm": 17.90272331237793,
14
  "learning_rate": 0.0001,
15
  "loss": 7.986,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.00013455328310010763,
20
- "grad_norm": 3.7075886726379395,
21
  "learning_rate": 0.0002,
22
  "loss": 2.0306,
23
  "step": 2
24
  },
25
  {
26
  "epoch": 0.00013455328310010763,
27
- "eval_loss": 2.1211705207824707,
28
- "eval_runtime": 5.4013,
29
- "eval_samples_per_second": 27.956,
30
- "eval_steps_per_second": 27.956,
31
  "step": 2
32
  }
33
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 6.727664155005382e-05,
13
+ "grad_norm": 16.59201431274414,
14
  "learning_rate": 0.0001,
15
  "loss": 7.986,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.00013455328310010763,
20
+ "grad_norm": 3.2888948917388916,
21
  "learning_rate": 0.0002,
22
  "loss": 2.0306,
23
  "step": 2
24
  },
25
  {
26
  "epoch": 0.00013455328310010763,
27
+ "eval_loss": 2.1215152740478516,
28
+ "eval_runtime": 5.4188,
29
+ "eval_samples_per_second": 27.866,
30
+ "eval_steps_per_second": 27.866,
31
  "step": 2
32
  }
33
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f7cf9b3f4a9b6aee0af9bb352b3071b1f748975269b94023838baf634daee8c
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b6377427e4e4bf683c90c59945e864e887a68d19ec55ff4999690a80faf10af
3
  size 6776