aapot
commited on
Commit
•
d5f3c4c
1
Parent(s):
bf90457
Add 920k train step and HF flax model
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- checkpoint_920000/checkpoint +3 -0
- checkpoint_920000/state.param_states.decoder.decoder_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.decoder_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray +3 -0
- checkpoint_920000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0 +3 -0
- checkpoint_920000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray +3 -0
checkpoint_920000/checkpoint
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab0add48bd3eab85f7f3b60d01124ea06657bcea101fa0266044520e6d5dacbf
|
3 |
+
size 6520637
|
checkpoint_920000/state.param_states.decoder.decoder_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.decoder_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:250a8645dad199b469c760c132d021082101ab66dadf93aad988b001a4412909
|
3 |
+
size 2660
|
checkpoint_920000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_0.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6807c97f1bd1c6f2db6f31a5f7d2f28b8539dde7069a8d1a114c2d698d9ddb0f
|
3 |
+
size 2757
|
checkpoint_920000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_0.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43e52613d75e8a2d2488487c6c7a8e0b64643f2ecff3f875c060f645fd3f1669
|
3 |
+
size 2753
|
checkpoint_920000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7e1edbeb9c5ec22f89809f30b43ed95f72f2c7689c802173da451ccee234d97
|
3 |
+
size 2812
|
checkpoint_920000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_1.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:788f8295dd3151135c0c9e86f60996ceab540a2cfc0b32432719fcfe2bc6ab01
|
3 |
+
size 2766
|
checkpoint_920000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_1.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c20f4388dfcfce046c4876e52caddeb5aa1c283094808b6b4aff4f37f432cf47
|
3 |
+
size 2771
|
checkpoint_920000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_1.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cec2286ba86fcbb6e478df3175c8ed9ba01511c5f74b623c5dc8f7f009458a9e
|
3 |
+
size 2833
|
checkpoint_920000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_10.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:722a9658f13769fbddd48f6d1611caeeb27ab54063f40f255e3b576ab6a8cfd5
|
3 |
+
size 2780
|
checkpoint_920000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_10.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75c70654c223f3d69c88191536bc85242f8224eace19d0f2d3e658028808cec8
|
3 |
+
size 2797
|
checkpoint_920000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_10.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5845d2c2095ac93f26c5c29d49eb60c9f20f9892ac1f3ca8b8e6b79115432e4c
|
3 |
+
size 2805
|
checkpoint_920000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_11.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ac9227199a7fe910a8ec1cd8baad217077a3b0e0a2ad603f42145e7bc1a7e24
|
3 |
+
size 2773
|
checkpoint_920000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_11.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1a021a139126283e91db2ef83aebb113d4f8a0405a439303b2c5593be18f888
|
3 |
+
size 2789
|
checkpoint_920000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9a98c05d3231e14c3841fb016d27e2dcfe9c32ea4609bbb9331693970554a7e
|
3 |
+
size 2842
|
checkpoint_920000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_12.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09c1ddcd2a5f2e4f666fe384d0884347cb791758f167e284907e2f13daa90582
|
3 |
+
size 2751
|
checkpoint_920000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_12.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2381a6b0ca92837f48d0078c123bfb9294e4f9441de8e148643cf1ff8dd42cf9
|
3 |
+
size 2744
|
checkpoint_920000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_12.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:502e23824cc173b972985c34598308c6b9457edffd36a4d72bcc8041b6b6314f
|
3 |
+
size 2756
|
checkpoint_920000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_13.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b25d9313860152c909595d23d32bdde57301c01fd8d2cc19e3e2b494297f476d
|
3 |
+
size 2792
|
checkpoint_920000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_13.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0381a0be3873d85342e77976b88693cb399caa3bc91282d9b8fda80dd7e7501
|
3 |
+
size 2719
|
checkpoint_920000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_13.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:054b0bcbc9e3e84d3fee9ac0e409865b3a4367d6c4e5a48ac9c3d54d222068d1
|
3 |
+
size 2763
|
checkpoint_920000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_14.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6213f81e32ae5b458e8aced933053b3fc9f84671daa02a6f37d85ac376ec286a
|
3 |
+
size 2783
|
checkpoint_920000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_14.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e66c3a8e8d7857eaf2889e77d0fdd14873f68e4033393f6710188e20db7d339
|
3 |
+
size 2747
|
checkpoint_920000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c485b95b2d1f47bf90625f82ff850a4dba45782dc2ebe1c00b50858bb611f495
|
3 |
+
size 2762
|
checkpoint_920000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64f02f8042f9584a76052423ef56333b077297ddcec13c71d92ec257e5c808bb
|
3 |
+
size 2732
|
checkpoint_920000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|
checkpoint_920000/state.param_states.decoder.layers_15.pre_mlp_layer_norm.scale.v/0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0227b9dde599395bb132893ccb5065cdaefb19579820751cdf6025e1285055d5
|
3 |
+
size 2761
|
checkpoint_920000/state.param_states.decoder.layers_15.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:daaea0b8b1a0dcfac0b0d9f58d65a2da57a63bbfb167fa23901e6a9fc9155af8
|
3 |
+
size 168
|