willtensora committed on
Commit
0358dab
·
verified ·
1 Parent(s): 83137f2

Training in progress, epoch 0, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "up_proj",
24
  "k_proj",
25
- "o_proj",
26
  "down_proj",
27
  "q_proj",
28
- "gate_proj",
29
- "v_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "gate_proj",
24
  "k_proj",
25
+ "v_proj",
26
  "down_proj",
27
  "q_proj",
28
+ "o_proj",
29
+ "up_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f25359b683e22b03b52ac4093c485073114aedd358f879a11e84cf90e49a4a93
3
  size 9048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e91ecc3215812954a830f1f723d3eedc0c15dbb2e729c236a25ebebff95a5ea
3
  size 9048
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ded90c3181b31ec9bbc4afc53a003b8495f6c9234eeca06d2be815e87a774daf
3
  size 28134
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a3417c1810d1006c9fdc86a246e24fb6fb6a16f833a1c9b9fddfd514117cd35
3
  size 28134
last-checkpoint/trainer_state.json CHANGED
@@ -10,17 +10,17 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.0002666666666666667,
13
- "grad_norm": 0.018526403233408928,
14
  "learning_rate": 0.0,
15
  "loss": 11.9308,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.0002666666666666667,
20
- "eval_loss": 11.933902740478516,
21
- "eval_runtime": 0.0582,
22
- "eval_samples_per_second": 275.089,
23
- "eval_steps_per_second": 68.772,
24
  "step": 1
25
  }
26
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 0.0002666666666666667,
13
+ "grad_norm": 0.02039993554353714,
14
  "learning_rate": 0.0,
15
  "loss": 11.9308,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.0002666666666666667,
20
+ "eval_loss": 11.933893203735352,
21
+ "eval_runtime": 0.0595,
22
+ "eval_samples_per_second": 269.009,
23
+ "eval_steps_per_second": 67.252,
24
  "step": 1
25
  }
26
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbe6e9ba442b0bc5f9aa6ba82a0cda937bd3591b0b1cf9d2912657df85f80600
3
  size 6776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4262191338f57e0cb296b0162fc58ae0cec82361790f58f1dc600363293ba4aa
3
  size 6776