jssky committed on
Commit
ea139aa
1 Parent(s): c4f66c9

Training in progress, step 10, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:99d1f1b94a3a9b94941cf858fb3821dcb4031dca53de45a34a9bc5d94e9b94cb
3
  size 73911112
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65c0efd3867c28a57d9a7229e3d2efbcbb30c5b7f59f4921b03b5c78c36ef2d5
3
  size 73911112
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7af4808ac012592bf59bbeb49e07ccc22677aeb0e20b31fceb18a0fc8a94f611
3
  size 37965300
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2df70deb4bed64976588dbf287d4ff4f2c2fc5cf6e6ced9196520cd691b760f
3
  size 37965300
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1881ec4d999362af1e52c36de1e218d3800542004d7f7c7edd42a089b7296ccc
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dbb2e8ac6910520ef7694e04efc0c3d22d47c0a6764ae2a666b6a667647ed1d
3
  size 15984
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00d02bbc0fa1d27820c289ea283e0155cafcbd62fa1759df4850d0a715649da0
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a64ea9853e527aeaa3e3e8ab63280f7a104d71f06cbc00b6586cb1151066797
3
  size 15984
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c73827ec09ff37ba195a38bf7f08f0537cea0c0a55db5d2fc0d29f759ccdcccb
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb597193ff9d2e676d231c4c21c97756a564739529ec012a7405fe102e2d6bf0
3
  size 15984
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4822c4ae863c6a81149f37fecf8fc589c5a0e68b5f03747420a5cc6ab7af0d14
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8844277a61aa266c1286de806f9fbc3a0e4ffe07a5d322e90f868a6bef7c6200
3
  size 15984
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e9b440498b750929a8558219fefc2e4ad160122931aa3d6799fc4f65cdd7304
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:516bda9bd375b4dbffe21ea5098d3ba187c60e9ac82d932b20a8bdf7f85f5e7f
3
  size 15984
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f0c18fbbe129f61ea282f7dbcc97540666d69c89e3f1cc4842d356efb45d0d6
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6da94ae89efb6930839681ba2aa052a5e83a69a0af729ccfc303f5699e7189e8
3
  size 15984
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a99554429161338da1a7001f3a511ce540238038412b9c31276e6f7379ad186a
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8788fd8bf5c71109ab3d1b1b8fb5df84005194baadaf8d32a3898477ae2e1c3e
3
  size 15984
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e39d4edd2882a248daa72fe9c907359ed8ef2a193dbcaec84663291acb998ec0
3
  size 15984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b5cb477ad7cfcb7f3e9b4e0628a58437296983ffbd992ed46c97df77959dad1
3
  size 15984
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26a93b2a1f4b5368650119fe6e0d6eec6d19cda6badeba4d21943ab48964fa00
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c8e6b04902f17ae368c3e6cfd97a31ad4de2f025d673daea8c033ce0e260946
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.0026344676180021956,
5
  "eval_steps": 3,
6
- "global_step": 9,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -102,6 +102,13 @@
102
  "eval_samples_per_second": 79.998,
103
  "eval_steps_per_second": 10.01,
104
  "step": 9
 
 
 
 
 
 
 
105
  }
106
  ],
107
  "logging_steps": 1,
@@ -116,12 +123,12 @@
116
  "should_evaluate": false,
117
  "should_log": false,
118
  "should_save": true,
119
- "should_training_stop": false
120
  },
121
  "attributes": {}
122
  }
123
  },
124
- "total_flos": 9405135625125888.0,
125
  "train_batch_size": 1,
126
  "trial_name": null,
127
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.0029271862422246614,
5
  "eval_steps": 3,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
102
  "eval_samples_per_second": 79.998,
103
  "eval_steps_per_second": 10.01,
104
  "step": 9
105
+ },
106
+ {
107
+ "epoch": 0.0029271862422246614,
108
+ "grad_norm": 3.3299129009246826,
109
+ "learning_rate": 0.00018,
110
+ "loss": 6.7157,
111
+ "step": 10
112
  }
113
  ],
114
  "logging_steps": 1,
 
123
  "should_evaluate": false,
124
  "should_log": false,
125
  "should_save": true,
126
+ "should_training_stop": true
127
  },
128
  "attributes": {}
129
  }
130
  },
131
+ "total_flos": 1.045015069458432e+16,
132
  "train_batch_size": 1,
133
  "trial_name": null,
134
  "trial_params": null