diff --git a/ndarray-cache.json b/ndarray-cache.json
new file mode 100644
index 0000000000000000000000000000000000000000..22309a34402fd0d5e837c0dc4d2821de4965902b
--- /dev/null
+++ b/ndarray-cache.json
@@ -0,0 +1,7275 @@
+{
+ "metadata": {
+ "ParamSize": 565
+ },
+ "records": [
+ {
+ "dataPath": "params_shard_0.bin",
+ "format": "raw-shard",
+ "nbytes": 327680000,
+ "records": [
+ {
+ "name": "param_0",
+ "shape": [
+ 32000,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 327680000,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_1.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_1",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_2.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_7",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_3.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_10",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_4.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_15",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_5.bin",
+ "format": "raw-shard",
+ "nbytes": 25497600,
+ "records": [
+ {
+ "name": "param_2",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_3",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 1228800
+ },
+ {
+ "name": "param_4",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 2457600
+ },
+ {
+ "name": "param_5",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 15564800
+ },
+ {
+ "name": "param_6",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 15974400
+ },
+ {
+ "name": "param_8",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16384000
+ },
+ {
+ "name": "param_9",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 18595840
+ },
+ {
+ "name": "param_11",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 20807680
+ },
+ {
+ "name": "param_12",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 21913600
+ },
+ {
+ "name": "param_13",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 23019520
+ },
+ {
+ "name": "param_14",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 23029760
+ },
+ {
+ "name": "param_16",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 23040000
+ },
+ {
+ "name": "param_17",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 24268800
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_6.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_21",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_7.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_24",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_8.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_29",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_9.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_18",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_19",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_20",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_22",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_23",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_25",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_26",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_27",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_28",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_30",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_31",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_10.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_35",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_11.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_38",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_12.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_43",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_13.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_32",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_33",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_34",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_36",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_37",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_39",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_40",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_41",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_42",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_44",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_45",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_14.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_49",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_15.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_52",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_16.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_57",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_17.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_46",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_47",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_48",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_50",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_51",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_53",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_54",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_55",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_56",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_58",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_59",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_18.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_63",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_19.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_66",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_20.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_71",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_21.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_60",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_61",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_62",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_64",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_65",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_67",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_68",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_69",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_70",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_72",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_73",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_22.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_77",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_23.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_80",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_24.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_85",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_25.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_74",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_75",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_76",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_78",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_79",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_81",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_82",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_83",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_84",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_86",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_87",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_26.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_91",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_27.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_94",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_28.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_99",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_29.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_88",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_89",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_90",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_92",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_93",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_95",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_96",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_97",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_98",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_100",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_101",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_30.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_105",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_31.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_108",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_32.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_113",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_33.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_102",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_103",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_104",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_106",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_107",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_109",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_110",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_111",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_112",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_114",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_115",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_34.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_119",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_35.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_122",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_36.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_127",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_37.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_116",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_117",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_118",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_120",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_121",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_123",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_124",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_125",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_126",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_128",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_129",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_38.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_133",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_39.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_136",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_40.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_141",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_41.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_130",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_131",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_132",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_134",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_135",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_137",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_138",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_139",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_140",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_142",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_143",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_42.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_147",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_43.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_150",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_44.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_155",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_45.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_144",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_145",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_146",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_148",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_149",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_151",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_152",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_153",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_154",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_156",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_157",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_46.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_161",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_47.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_164",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_48.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_169",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_49.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_158",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_159",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_160",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_162",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_163",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_165",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_166",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_167",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_168",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_170",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_171",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_50.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_175",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_51.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_178",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_52.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_183",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_53.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_172",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_173",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_174",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_176",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_177",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_179",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_180",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_181",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_182",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_184",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_185",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_54.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_189",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_55.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_192",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_56.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_197",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_57.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_186",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_187",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_188",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_190",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_191",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_193",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_194",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_195",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_196",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_198",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_199",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_58.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_203",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_59.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_206",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_60.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_211",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_61.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_200",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_201",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_202",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_204",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_205",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_207",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_208",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_209",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_210",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_212",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_213",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_62.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_217",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_63.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_220",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_64.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_225",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_65.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_214",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_215",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_216",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_218",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_219",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_221",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_222",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_223",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_224",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_226",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_227",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_66.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_231",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_67.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_234",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_68.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_239",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_69.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_228",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_229",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_230",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_232",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_233",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_235",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_236",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_237",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_238",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_240",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_241",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_70.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_245",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_71.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_248",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_72.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_253",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_73.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_242",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_243",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_244",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_246",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_247",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_249",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_250",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_251",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_252",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_254",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_255",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_74.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_259",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_75.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_262",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_76.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_267",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_77.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_256",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_257",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_258",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_260",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_261",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_263",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_264",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_265",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_266",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_268",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_269",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_78.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_273",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_79.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_276",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_80.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_281",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_81.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_270",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_271",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_272",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_274",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_275",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_277",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_278",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_279",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_280",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_282",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_283",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_82.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_287",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_83.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_290",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_84.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_295",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_85.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_284",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_285",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_286",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_288",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_289",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_291",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_292",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_293",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_294",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_296",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_297",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_86.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_301",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_87.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_304",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_88.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_309",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_89.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_298",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_299",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_300",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_302",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_303",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_305",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_306",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_307",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_308",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_310",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_311",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_90.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_315",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_91.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_318",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_92.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_323",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_93.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_312",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_313",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_314",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_316",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_317",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_319",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_320",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_321",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_322",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_324",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_325",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_94.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_329",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_95.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_332",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_96.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_337",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_97.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_326",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_327",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_328",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_330",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_331",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_333",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_334",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_335",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_336",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_338",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_339",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_98.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_343",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_99.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_346",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_100.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_351",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_101.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_340",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_341",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_342",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_344",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_345",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_347",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_348",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_349",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_350",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_352",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_353",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_102.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_357",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_103.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_360",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_104.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_365",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_105.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_354",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_355",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_356",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_358",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_359",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_361",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_362",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_363",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_364",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_366",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_367",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_106.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_371",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_107.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_374",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_108.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_379",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_109.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_368",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_369",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_370",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_372",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_373",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_375",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_376",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_377",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_378",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_380",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_381",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_110.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_385",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_111.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_388",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_112.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_393",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_113.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_382",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_383",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_384",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_386",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_387",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_389",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_390",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_391",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_392",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_394",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_395",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_114.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_399",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_115.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_402",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_116.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_407",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_117.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_396",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_397",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_398",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_400",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_401",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_403",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_404",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_405",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_406",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_408",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_409",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_118.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_413",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_119.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_416",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_120.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_421",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_121.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_410",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_411",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_412",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_414",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_415",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_417",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_418",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_419",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_420",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_422",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_423",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_122.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_427",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_123.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_430",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_124.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_435",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_125.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_424",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_425",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_426",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_428",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_429",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_431",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_432",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_433",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_434",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_436",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_437",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_126.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_441",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_127.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_444",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_128.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_449",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_129.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_438",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_439",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_440",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_442",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_443",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_445",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_446",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_447",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_448",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_450",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_451",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_130.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_455",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_131.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_458",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_132.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_463",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_133.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_452",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_453",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_454",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_456",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_457",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_459",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_460",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_461",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_462",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_464",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_465",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_134.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_469",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_135.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_472",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_136.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_477",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_137.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_466",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_467",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_468",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_470",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_471",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_473",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_474",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_475",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_476",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_478",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_479",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_138.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_483",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_139.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_486",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_140.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_491",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_141.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_480",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_481",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_482",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_484",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_485",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_487",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_488",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_489",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_490",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_492",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_493",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_142.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_497",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_143.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_500",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_144.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_505",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_145.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_494",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_495",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_496",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_498",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_499",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_501",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_502",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_503",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_504",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_506",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_507",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_146.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_511",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_147.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_514",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_148.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_519",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_149.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_508",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_509",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_510",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_512",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_513",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_515",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_516",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_517",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_518",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_520",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_521",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_150.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_525",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_151.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_528",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_152.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_533",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_153.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_522",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_523",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_524",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_526",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_527",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_529",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_530",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_531",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_532",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_534",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_535",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_154.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_539",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_155.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_542",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_156.bin",
+ "format": "raw-shard",
+ "nbytes": 39321600,
+ "records": [
+ {
+ "name": "param_547",
+ "shape": [
+ 15360,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 39321600,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_157.bin",
+ "format": "raw-shard",
+ "nbytes": 23040000,
+ "records": [
+ {
+ "name": "param_536",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_537",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_538",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_540",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_541",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_543",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_544",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_545",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_546",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_548",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_549",
+ "shape": [
+ 15360,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1228800,
+ "byteOffset": 21811200
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_158.bin",
+ "format": "raw-shard",
+ "nbytes": 70778880,
+ "records": [
+ {
+ "name": "param_553",
+ "shape": [
+ 27648,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 70778880,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_159.bin",
+ "format": "raw-shard",
+ "nbytes": 35389440,
+ "records": [
+ {
+ "name": "param_556",
+ "shape": [
+ 5120,
+ 1728
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 35389440,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_160.bin",
+ "format": "raw-shard",
+ "nbytes": 327680000,
+ "records": [
+ {
+ "name": "param_562",
+ "shape": [
+ 32000,
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 327680000,
+ "byteOffset": 0
+ }
+ ]
+ },
+ {
+ "dataPath": "params_shard_161.bin",
+ "format": "raw-shard",
+ "nbytes": 21641216,
+ "records": [
+ {
+ "name": "param_550",
+ "shape": [
+ 5120,
+ 640
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 13107200,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_551",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13107200
+ },
+ {
+ "name": "param_552",
+ "shape": [
+ 5120,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 409600,
+ "byteOffset": 13516800
+ },
+ {
+ "name": "param_554",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 13926400
+ },
+ {
+ "name": "param_555",
+ "shape": [
+ 27648,
+ 40
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 2211840,
+ "byteOffset": 16138240
+ },
+ {
+ "name": "param_557",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 18350080
+ },
+ {
+ "name": "param_558",
+ "shape": [
+ 5120,
+ 108
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1105920,
+ "byteOffset": 19456000
+ },
+ {
+ "name": "param_559",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20561920
+ },
+ {
+ "name": "param_560",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20572160
+ },
+ {
+ "name": "param_561",
+ "shape": [
+ 5120
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 10240,
+ "byteOffset": 20582400
+ },
+ {
+ "name": "param_563",
+ "shape": [
+ 2048,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 524288,
+ "byteOffset": 20592640
+ },
+ {
+ "name": "param_564",
+ "shape": [
+ 2048,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 524288,
+ "byteOffset": 21116928
+ }
+ ]
+ }
+ ]
+}
\ No newline at end of file
diff --git a/params_shard_0.bin b/params_shard_0.bin
new file mode 100644
index 0000000000000000000000000000000000000000..93481e627138571c7ce6beecc3102fdd2a6bcf58
--- /dev/null
+++ b/params_shard_0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:805cb841e53af199f048b2272d93c4bc2bad4bd9bb865429a3c1fbb5b29a2516
+size 327680000
diff --git a/params_shard_1.bin b/params_shard_1.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7b1fa4aeb03f00fec77bd64fb51a4d9bdeed39cb
--- /dev/null
+++ b/params_shard_1.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:61f07cb1b6a92770b88b7747ed92749cd79bd88dabc072a00ea9ddb53cdee771
+size 39321600
diff --git a/params_shard_10.bin b/params_shard_10.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ee1e661c27424dc0def503945da43ed75a48efbd
--- /dev/null
+++ b/params_shard_10.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:48783dd2a0ae931c8c9b8b4a897e73d610593a034def55814c663780c045df60
+size 70778880
diff --git a/params_shard_100.bin b/params_shard_100.bin
new file mode 100644
index 0000000000000000000000000000000000000000..598d95c2d44ffcfd2cec35ff94396c06306b442b
--- /dev/null
+++ b/params_shard_100.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e90fca277a6f74949cc5e25befcb181856d2102895c3dcaf1410059541877e04
+size 39321600
diff --git a/params_shard_101.bin b/params_shard_101.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dc385fb727af9add4a1e523a62c0cff470133778
--- /dev/null
+++ b/params_shard_101.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2339894ab48dcf655b5a1d31da74350814168de45bceba27b9c3fcf85e730080
+size 23040000
diff --git a/params_shard_102.bin b/params_shard_102.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3be27aa8ff62723d515bfbc3ea0171cbbf4fcab1
--- /dev/null
+++ b/params_shard_102.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:23ab90a5fcb85b4d0cff9613057a6bd8006ce0f6ca59cee5a64788e75663d98b
+size 70778880
diff --git a/params_shard_103.bin b/params_shard_103.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9a8e908d3b3591a886fa6d59f94b677811e56029
--- /dev/null
+++ b/params_shard_103.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d61dd64d3a6b5c1ad45671165233e5e6f6cde0e057ee681117b3f600b71e987e
+size 35389440
diff --git a/params_shard_104.bin b/params_shard_104.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0c4ae76f7877e3a67a002e2b17ef69200a73670b
--- /dev/null
+++ b/params_shard_104.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3c2f7b342a36d609ffeddb0203175b13914ea072bb17940700b0bf8e61fa42da
+size 39321600
diff --git a/params_shard_105.bin b/params_shard_105.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e653bf32e8572fa7d975f9ed67e75ab34ec18717
--- /dev/null
+++ b/params_shard_105.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8cf778ffd59ae011885295df6b63bd76e7386e642d9002c90c76e77ffcedd081
+size 23040000
diff --git a/params_shard_106.bin b/params_shard_106.bin
new file mode 100644
index 0000000000000000000000000000000000000000..daf10a0e81c6ecee26f97441885dd8a7e55b608a
--- /dev/null
+++ b/params_shard_106.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:00452225b75ca94abd5e5ce5f0915e540abf2b6e9e6eccafdcd85befec60cac9
+size 70778880
diff --git a/params_shard_107.bin b/params_shard_107.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0b0a9f944bfc3dc424a1130a8b982c17c99fc39d
--- /dev/null
+++ b/params_shard_107.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:47f6d455fd8a88aff685dab3687ad34023f92d62f906e4fa8bf01d219d2f0aac
+size 35389440
diff --git a/params_shard_108.bin b/params_shard_108.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b39df3e472998b64f59426b68463097004d3dec1
--- /dev/null
+++ b/params_shard_108.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bb4689714ee7e489ab99a9b74edc2ad76d191464066d9a900fb294e116dd0468
+size 39321600
diff --git a/params_shard_109.bin b/params_shard_109.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cec0b7025136baf57e5308201df7cd0c5efb451f
--- /dev/null
+++ b/params_shard_109.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a6e62a3e0bad7334040af48c3269c3d835b411a39efe3b0a2c12a10551d104c9
+size 23040000
diff --git a/params_shard_11.bin b/params_shard_11.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a34e764c335e5814dcf32d9ccbf37f0628dcfa25
--- /dev/null
+++ b/params_shard_11.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3055295cbb58e5f2e251c33c70ae7071f7235c39eed51156575afc889370dd3c
+size 35389440
diff --git a/params_shard_110.bin b/params_shard_110.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0ec595eb688c4f96e9c347bb096678ae36215a60
--- /dev/null
+++ b/params_shard_110.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:59d626eead2daba4dca14453b5baeff26f138861a0184c71eafadf9d69581bd9
+size 70778880
diff --git a/params_shard_111.bin b/params_shard_111.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4ed77f8ce9f426ae6f92bc2904cffd222e7f96f1
--- /dev/null
+++ b/params_shard_111.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7f2772dbe0d2f0238a6891983074dadf13640be9e28039e1985f739a4b4c5f77
+size 35389440
diff --git a/params_shard_112.bin b/params_shard_112.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8a5c621dec633b99b000848146fed8d328567375
--- /dev/null
+++ b/params_shard_112.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f50792facd10234fe7c8e5eccfb022d1c76da7ac3afca519f7ef9e75d6038109
+size 39321600
diff --git a/params_shard_113.bin b/params_shard_113.bin
new file mode 100644
index 0000000000000000000000000000000000000000..642ea60c6bf724a55e453feff265050afbeced69
--- /dev/null
+++ b/params_shard_113.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6b1757fd79f26b3022d1bc808048e1ca3980100b5c0f54907e5564de13349abc
+size 23040000
diff --git a/params_shard_114.bin b/params_shard_114.bin
new file mode 100644
index 0000000000000000000000000000000000000000..68366b94368d3e7db6fa7555b48a1108dda3f04e
--- /dev/null
+++ b/params_shard_114.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:25feb11e60752b350a158a9ae9542534c3eb2c2775b90fcf47313cfed9599f1f
+size 70778880
diff --git a/params_shard_115.bin b/params_shard_115.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5766e0af7f6f7f88bd0ec5518d2d484e68f3189c
--- /dev/null
+++ b/params_shard_115.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:736cac6ee7a0e2efcadbd9b6beb9befaa625fda247a4b5b44850c3e257b58985
+size 35389440
diff --git a/params_shard_116.bin b/params_shard_116.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2411d5af7a62764f0bf9b203ff0d858c474e8074
--- /dev/null
+++ b/params_shard_116.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be0904bdbe8931c3998692c3799087561bc964740f0efc1ae2c06b40c30e5d28
+size 39321600
diff --git a/params_shard_117.bin b/params_shard_117.bin
new file mode 100644
index 0000000000000000000000000000000000000000..25a942ff7e999826658cd9e32e3ebea44c57251a
--- /dev/null
+++ b/params_shard_117.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c8da5460fe7334760b832953cca59fe0b881e9369e8d62b0cb88a37cbfab1572
+size 23040000
diff --git a/params_shard_118.bin b/params_shard_118.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4db8b18e4b2e6373cca88054aa15f773b7018db3
--- /dev/null
+++ b/params_shard_118.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:210890129a3f6eda85280db348ae7cdfdf89e423c9c8fa639d2b4c83e33a7f8b
+size 70778880
diff --git a/params_shard_119.bin b/params_shard_119.bin
new file mode 100644
index 0000000000000000000000000000000000000000..01e614d7b1680d678117ffa8ecd3328e0f2c00bd
--- /dev/null
+++ b/params_shard_119.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ddbb1abbcce09177d1673b7c786885bd102ac370d8785099e53bcbc5b907a3e1
+size 35389440
diff --git a/params_shard_12.bin b/params_shard_12.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9e1835fc6a1fed01c883d1b3a18022e0683932f1
--- /dev/null
+++ b/params_shard_12.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8a503a7ecb362c2c9a7ea39773801a9140d7755a9c0594b3a36af1789b01b091
+size 39321600
diff --git a/params_shard_120.bin b/params_shard_120.bin
new file mode 100644
index 0000000000000000000000000000000000000000..91ea6ac88bb291549314eb2f757cbac9788e8d8c
--- /dev/null
+++ b/params_shard_120.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:36a0e85fbacf7f24b43830ba0d08d3d4689abcfa36878b690f34d93cfbbcde28
+size 39321600
diff --git a/params_shard_121.bin b/params_shard_121.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1c5ed5f08530c915e8edf431104561e746e0ae75
--- /dev/null
+++ b/params_shard_121.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:794aaed7d877ab860c6d4e5da05de973b4e199da1a2c19373e02bb1e8f15fa53
+size 23040000
diff --git a/params_shard_122.bin b/params_shard_122.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d62fb0f09d511e01d001fac60a5e8c0c052517fc
--- /dev/null
+++ b/params_shard_122.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b74254179b3546b67e6aab202538fd780ac63b143923d0b5dff38507b7e14298
+size 70778880
diff --git a/params_shard_123.bin b/params_shard_123.bin
new file mode 100644
index 0000000000000000000000000000000000000000..480115be99084cb8dbf669903593dcb35002d230
--- /dev/null
+++ b/params_shard_123.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a3acf65b6a4af9a34dd46f1e0027337eeb5b7f9f7cbcbeaca42ba02895ffd646
+size 35389440
diff --git a/params_shard_124.bin b/params_shard_124.bin
new file mode 100644
index 0000000000000000000000000000000000000000..55fe3577946e841d3c34ea416832d606217ffe60
--- /dev/null
+++ b/params_shard_124.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e97915e33118be1cbaf9badba040bb1844583a988265f9f1e1f3f250dd0e8652
+size 39321600
diff --git a/params_shard_125.bin b/params_shard_125.bin
new file mode 100644
index 0000000000000000000000000000000000000000..494f7eb4c4f492b7a102d3d5f805c8d6df4419f1
--- /dev/null
+++ b/params_shard_125.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1ebc3886b91f40715f76ebfb250784dd023617f2c4dcd2fc004e7df600396b63
+size 23040000
diff --git a/params_shard_126.bin b/params_shard_126.bin
new file mode 100644
index 0000000000000000000000000000000000000000..dcbe29943b66a87eb461330f0dfaed1a459962ed
--- /dev/null
+++ b/params_shard_126.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fb3e23d6cfab313eacec1504a117bd902556195d50d8d774b0099a2ae2cd0a04
+size 70778880
diff --git a/params_shard_127.bin b/params_shard_127.bin
new file mode 100644
index 0000000000000000000000000000000000000000..07a2262ea7b17c07ca1f269bd41d0c253ea515a5
--- /dev/null
+++ b/params_shard_127.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:74db10d2ed1048bcb5f9d1e8be6debab22ff56ebb08a21da0ba802e962ab7fd6
+size 35389440
diff --git a/params_shard_128.bin b/params_shard_128.bin
new file mode 100644
index 0000000000000000000000000000000000000000..992dee9b808bd99609dcf8097162a451b45f50a7
--- /dev/null
+++ b/params_shard_128.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d10c347ab2bd769e3463323fb0743772b15ff283482b3791da4fc3842f57d1d5
+size 39321600
diff --git a/params_shard_129.bin b/params_shard_129.bin
new file mode 100644
index 0000000000000000000000000000000000000000..989a222849d6cf452b3422a6f6338de9f984dbdb
--- /dev/null
+++ b/params_shard_129.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ccfe098dce446262aee9e5a58965838019d134d45f401adf334320f3ac171939
+size 23040000
diff --git a/params_shard_13.bin b/params_shard_13.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5eb1e8a0dfeeb3e098cbdd1294885a6dc44c582c
--- /dev/null
+++ b/params_shard_13.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:52ab78f015dc1bd9406a11741363b8c256a8bc73de5e77be7b6200610e6cd340
+size 23040000
diff --git a/params_shard_130.bin b/params_shard_130.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c500d71cc131f2a1c73ad054145ad8d616cfdc2c
--- /dev/null
+++ b/params_shard_130.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:53b1f82a9644654f37792d41e23fe3319727362837cf7dfcd08b9b43a3ee7803
+size 70778880
diff --git a/params_shard_131.bin b/params_shard_131.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2c8fee4180391a864b99dca23539f31231eb6d3a
--- /dev/null
+++ b/params_shard_131.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d2c93e3bce70e954eec665b0ce16c4bf45cd11dede900c0970d52921f9287b3a
+size 35389440
diff --git a/params_shard_132.bin b/params_shard_132.bin
new file mode 100644
index 0000000000000000000000000000000000000000..60642cc76af79458579c68f08db58a17b5ed28f5
--- /dev/null
+++ b/params_shard_132.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a22bf6788023006a3ae2d0485afe108ac4da1b286cbf9e1e846fa56fc74ef5dc
+size 39321600
diff --git a/params_shard_133.bin b/params_shard_133.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9541d87c8a2fdd01a9108ae1313cb675cf0b8adc
--- /dev/null
+++ b/params_shard_133.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:83cc07de06fe170ae0ce59b23959c9f0b0d06656531b7305a77a43db65f185b0
+size 23040000
diff --git a/params_shard_134.bin b/params_shard_134.bin
new file mode 100644
index 0000000000000000000000000000000000000000..38db9ec98dde711236a9cc1aac65fef7a61819f1
--- /dev/null
+++ b/params_shard_134.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:33c10ef609745610303a4e1d15f900f275351a1fd0881ce958a1d05eb5dfbdae
+size 70778880
diff --git a/params_shard_135.bin b/params_shard_135.bin
new file mode 100644
index 0000000000000000000000000000000000000000..92af751cd30b1f488306070f1998d74a104271a1
--- /dev/null
+++ b/params_shard_135.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5e488aa74804fdd975f82c96c61714f34f1d70835adf20f2ec82071e5adff4b6
+size 35389440
diff --git a/params_shard_136.bin b/params_shard_136.bin
new file mode 100644
index 0000000000000000000000000000000000000000..26b448c925d255b3dadee5ec69788425d03e175e
--- /dev/null
+++ b/params_shard_136.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:91ba3b9fcd904297b5bdf92630b310229159caae417092ca48ab023af13c57c4
+size 39321600
diff --git a/params_shard_137.bin b/params_shard_137.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ec7748f114b44aafefa81b8f0a3185b0bb7ad6b2
--- /dev/null
+++ b/params_shard_137.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb575b43e73c3b32376cd4c4206a29aa9d0676aabc3237727b26edc2906b6afd
+size 23040000
diff --git a/params_shard_138.bin b/params_shard_138.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eb478956272097014db894ac2cbe41b0a4156b13
--- /dev/null
+++ b/params_shard_138.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b83f7a48af674088ad3a860d7641e33e58a2e480b037417e4b5875dd25c54362
+size 70778880
diff --git a/params_shard_139.bin b/params_shard_139.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7d054b4341b13ed002d71357f173237f58bc25f5
--- /dev/null
+++ b/params_shard_139.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a05a0a0672fa762b4685d970b8115e5b68789201be5e5cbd593bd1fa1ad83b3a
+size 35389440
diff --git a/params_shard_14.bin b/params_shard_14.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7317ccccf45c313a93d4d7d55959d9d477303617
--- /dev/null
+++ b/params_shard_14.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c24ba3f2f3ca324f8f6192939687cb6b75a09a8cfa0d6995998b5c8ecb5ecfb6
+size 70778880
diff --git a/params_shard_140.bin b/params_shard_140.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9250cdb79b95a0eb4a7e2ce25ec725128edfab06
--- /dev/null
+++ b/params_shard_140.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8ee0fcf13167b4a4f1ac15da16eb228ac29d55434ca51dc95838437045ed4c8b
+size 39321600
diff --git a/params_shard_141.bin b/params_shard_141.bin
new file mode 100644
index 0000000000000000000000000000000000000000..84f1cbf57f6175183a0f3b02db0541ace1e4e1cd
--- /dev/null
+++ b/params_shard_141.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8d5c1b16bd885aa49396642700d1a3a45120a6b3b5b55f6b7dcac21ee6576017
+size 23040000
diff --git a/params_shard_142.bin b/params_shard_142.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0f0eb961a90185081771962417bfa1e07a99586d
--- /dev/null
+++ b/params_shard_142.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a9e9358a1256b9840886898c9d1dd1d97ca1094579658c9e05fa19cd0095a80b
+size 70778880
diff --git a/params_shard_143.bin b/params_shard_143.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1813f990a996a9470847c7274e2ed3f720d42ebc
--- /dev/null
+++ b/params_shard_143.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f4b3bad28cab1f519cfbd2edca8be64383f6514db2a3d8bc1605061f525c32c3
+size 35389440
diff --git a/params_shard_144.bin b/params_shard_144.bin
new file mode 100644
index 0000000000000000000000000000000000000000..19d6c33c1122faa89556606f00e142b0b25d105e
--- /dev/null
+++ b/params_shard_144.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:731c66bd1c17131e84f8f396f3d07723bafa5b7dea970699f40152513acdafad
+size 39321600
diff --git a/params_shard_145.bin b/params_shard_145.bin
new file mode 100644
index 0000000000000000000000000000000000000000..863bccffc3f5bdd9a1465e5925e516c247c13bfa
--- /dev/null
+++ b/params_shard_145.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:41a9cd8abbd66d206fe4e4bd55166a7137dc1f6d0ba401662e1e86a9b0f3ce28
+size 23040000
diff --git a/params_shard_146.bin b/params_shard_146.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ca5157b7c7ef48491d8bbfb5e6a2f9e858466ced
--- /dev/null
+++ b/params_shard_146.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:26b89fc978f09d8d81f39ce6e9e372ad76df26da05f275031d4e0f201f2d4fee
+size 70778880
diff --git a/params_shard_147.bin b/params_shard_147.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d6782f9d67b1a95928045f495c777e3a670b03c3
--- /dev/null
+++ b/params_shard_147.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:27cf4d19d1c6d0d4a9fab52d14e49ebc398fce7a91c37f1c3e02d022c4d48374
+size 35389440
diff --git a/params_shard_148.bin b/params_shard_148.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4f1ce900cf8d6767adbcbac43fb5c4532b000acb
--- /dev/null
+++ b/params_shard_148.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ddcdc881ca84861c497172a6b228754ef04ab1d5bb31870e1683a6d0acec70d0
+size 39321600
diff --git a/params_shard_149.bin b/params_shard_149.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6f52b94140d808fd5bebb74906ac32434e970da1
--- /dev/null
+++ b/params_shard_149.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5202fc4a20c62df9f9708b7f9ef641abc6d062b9666e675deee3fe6183e27ed7
+size 23040000
diff --git a/params_shard_15.bin b/params_shard_15.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3605579cafe862d91ee4b347fedcf57a6399d1d0
--- /dev/null
+++ b/params_shard_15.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:290ca1ee1524010bf318efa52d4c65b6d76b2d8c9fdae7b8b4a736cd16e5285a
+size 35389440
diff --git a/params_shard_150.bin b/params_shard_150.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cd224e2a4009edb13794a7e559138507065e0683
--- /dev/null
+++ b/params_shard_150.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c4ab6396a2660e36f9094dbe423be08c3ebcfd1b394c0d3e5306a42477342c59
+size 70778880
diff --git a/params_shard_151.bin b/params_shard_151.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4e621bed57517549fb6caad673cb47497bdb8eb2
--- /dev/null
+++ b/params_shard_151.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a8d546b6d05d18ee68033bf0d6d69bc362e0e8ce89ed92ea49c51df748834da4
+size 35389440
diff --git a/params_shard_152.bin b/params_shard_152.bin
new file mode 100644
index 0000000000000000000000000000000000000000..661fa86540cc35e033dd2534b609f3d3ed8c517f
--- /dev/null
+++ b/params_shard_152.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:076cff08128a7fc5ae0c1ea92f031d9da358dacaf2e5a2fc934fd79f6c9e5ae9
+size 39321600
diff --git a/params_shard_153.bin b/params_shard_153.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bee83c02a46cfb1fc03912a26f55ba62db779aaf
--- /dev/null
+++ b/params_shard_153.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9a019141238d8100231117641327e05b5e6d3b1822e0fe3a8137f75392320799
+size 23040000
diff --git a/params_shard_154.bin b/params_shard_154.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1afb4ab59d8d4516557aa873b09334f542790b27
--- /dev/null
+++ b/params_shard_154.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:81b751a81b469026cddcae5a773932058384518c67f5c8e05953941f1969eba9
+size 70778880
diff --git a/params_shard_155.bin b/params_shard_155.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d97aee5ba21bc73f1ec2d4895f691c595baf71c5
--- /dev/null
+++ b/params_shard_155.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:77fff75c1acd7ef6e95a3b3579c418a1cebb8c130fa113faf0f2e94251804787
+size 35389440
diff --git a/params_shard_156.bin b/params_shard_156.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f93120335a11fbd0cd394dceab5af169ce157a3f
--- /dev/null
+++ b/params_shard_156.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:53c36b5cc1f759e98665a579103a563652f3f7e1337a5587de301d4b9c0d45c4
+size 39321600
diff --git a/params_shard_157.bin b/params_shard_157.bin
new file mode 100644
index 0000000000000000000000000000000000000000..30f5b3e4f907998c0cbf5dabc3497e0266ef2897
--- /dev/null
+++ b/params_shard_157.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:62360e0d72d93263b467cdb80403288edd534b30b2deaf0a7e45aa2ad0870522
+size 23040000
diff --git a/params_shard_158.bin b/params_shard_158.bin
new file mode 100644
index 0000000000000000000000000000000000000000..f5d2d4fac5e7efc7d2e8d50d364f86c63cd45588
--- /dev/null
+++ b/params_shard_158.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7a145367ca897ee9192ef445331d161687f4a9f7a8e89d7ec9681739730ea968
+size 70778880
diff --git a/params_shard_159.bin b/params_shard_159.bin
new file mode 100644
index 0000000000000000000000000000000000000000..109fc2e47a5e05b5ed8a550bacaddfc08875c4cc
--- /dev/null
+++ b/params_shard_159.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:35d6c1df4438ceaad388224577497a6719826d40646329eebf510c402453f997
+size 35389440
diff --git a/params_shard_16.bin b/params_shard_16.bin
new file mode 100644
index 0000000000000000000000000000000000000000..19de00c6385df315ff9ee6268e3960ec1d6df078
--- /dev/null
+++ b/params_shard_16.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a8186f8f3e769ead1697364819d5066f2a099fcd43fddff24adeea82305c1098
+size 39321600
diff --git a/params_shard_160.bin b/params_shard_160.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7d481998685118200d59eb0c780f50dbe629dd40
--- /dev/null
+++ b/params_shard_160.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:579b07243ca8d3f02877ae9804eb75beadf4be7bc8d77f48da576c7919080519
+size 327680000
diff --git a/params_shard_161.bin b/params_shard_161.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4f746559c9f8e99ce421a24ac50a1a0cf9f2e362
--- /dev/null
+++ b/params_shard_161.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:453b1a9e59baa9bf1788ebb512764ca37b24ec8a16cb2f3fb1339953741e427c
+size 21641216
diff --git a/params_shard_17.bin b/params_shard_17.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8a8ea78bd945ab15cc9d6b414d423da723cd1ca8
--- /dev/null
+++ b/params_shard_17.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c1a09fef31f9b727f03c3271f2472b8aaacc19c6f837f7b750530b3d57687096
+size 23040000
diff --git a/params_shard_18.bin b/params_shard_18.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4d56089b17fd1bd4e9de4c0de92ba3b337f15679
--- /dev/null
+++ b/params_shard_18.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:38140d091e6739bbb8052d8e6b1ff43d21a87c6932088a6495f7bf34b2937f23
+size 70778880
diff --git a/params_shard_19.bin b/params_shard_19.bin
new file mode 100644
index 0000000000000000000000000000000000000000..33e2e0f5695c51a4aee437d1a9b701c9a2081aa7
--- /dev/null
+++ b/params_shard_19.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:33ef422a0a8c1846f06367861dd74f382841cfe8d3080b0605c50a0f6a87253c
+size 35389440
diff --git a/params_shard_2.bin b/params_shard_2.bin
new file mode 100644
index 0000000000000000000000000000000000000000..45f9653ff98111788d98c22dac8d4fc4782c4e32
--- /dev/null
+++ b/params_shard_2.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e771a148dd627dafa1a217c8dea5100e14b8f46fed854972b2e7c925e260bc94
+size 70778880
diff --git a/params_shard_20.bin b/params_shard_20.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9f620e3b0e01a954528e88802384232daeb775dc
--- /dev/null
+++ b/params_shard_20.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fc2a33a1f1d310405b6b9447a1b545db9fe4a3fa632917a39161431efd9bf982
+size 39321600
diff --git a/params_shard_21.bin b/params_shard_21.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7fb484f65d492d28697d0b0f786c2ee458cdc201
--- /dev/null
+++ b/params_shard_21.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8e00e3e50f9893e4322ad1e9ca0749a1db2d928c568b1cffe85f07bc611d3aa7
+size 23040000
diff --git a/params_shard_22.bin b/params_shard_22.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d781a8848b66b4ca8f13d6e4d89128b84726190c
--- /dev/null
+++ b/params_shard_22.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d740241577bc8efb7c6d2b7eb2b89037cace2a1cd3c18e72a291566e1f17c191
+size 70778880
diff --git a/params_shard_23.bin b/params_shard_23.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e971662ae5559592fc739f86df7a5e8c8562c5ae
--- /dev/null
+++ b/params_shard_23.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:04d7594a4b5bfe15d8b6028174df661e0cd2450eadeeacbe1d389ffefacaa149
+size 35389440
diff --git a/params_shard_24.bin b/params_shard_24.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1c7c0ddd3b4c79d538d98136758d967b1325e8ae
--- /dev/null
+++ b/params_shard_24.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6814015e417bb4f17c72a1e4edba0c7675a1907ad54c2c39e203fea83084e39c
+size 39321600
diff --git a/params_shard_25.bin b/params_shard_25.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b96315c7f599dbc2e86cef732d65bc5d372a06b9
--- /dev/null
+++ b/params_shard_25.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1e2e5e51f6993576d98dc21fcfc28a7fe10649b8942a6ff802fc9ff4479d3fc1
+size 23040000
diff --git a/params_shard_26.bin b/params_shard_26.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a980aa69980449d238587a3912656b3b91e26f65
--- /dev/null
+++ b/params_shard_26.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5ad7862e1e9190f069b64abc000751e99e02f27ca09a49a664dd5ec50241903e
+size 70778880
diff --git a/params_shard_27.bin b/params_shard_27.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0cda944924d7f3ee672b03c5ff18f8eeddab01b6
--- /dev/null
+++ b/params_shard_27.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d73d1d9d521246a475870c30674e6a37b3c6c047e5b01e46789b71255f6fe818
+size 35389440
diff --git a/params_shard_28.bin b/params_shard_28.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c3cd9a3dd8d55332d701f8e44b42a6786c163a68
--- /dev/null
+++ b/params_shard_28.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:07e1ad37e9499b4b5730c5f98b252701defe6b7920939afd82d17f8d082038bf
+size 39321600
diff --git a/params_shard_29.bin b/params_shard_29.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8357d9eb4fd47f241e439a309e53a0d5efba7d43
--- /dev/null
+++ b/params_shard_29.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:88cda58681f2394688ef06559834b2da0e70e0129131797fc250ba48f408d4cf
+size 23040000
diff --git a/params_shard_3.bin b/params_shard_3.bin
new file mode 100644
index 0000000000000000000000000000000000000000..da0ab1531086efd61af9f3ce8e6fcbbf34125ff4
--- /dev/null
+++ b/params_shard_3.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:902734089e4aa372c27fa8d688effa2c1b582fd0475410bcb4bb93f42a85f28f
+size 35389440
diff --git a/params_shard_30.bin b/params_shard_30.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2573412e4475d22c6bde189e46ee9a6cf2322aaa
--- /dev/null
+++ b/params_shard_30.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d4dfa42ed2624d89f4a226eb2e400f67e1aabeab1b3df8c2cee620fdb05f25e
+size 70778880
diff --git a/params_shard_31.bin b/params_shard_31.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2617e84741fb51a224e67f42d4ec0e53b7c02394
--- /dev/null
+++ b/params_shard_31.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b6f25cfe743feb4df87effddf9f00b71b00a19c02636b992d2c635a5d149c2e7
+size 35389440
diff --git a/params_shard_32.bin b/params_shard_32.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e21dec8c230eeeab12dbfefae8c9460bb7b40b51
--- /dev/null
+++ b/params_shard_32.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9d0fe2ef672937671ab1a348fa1e1fca06e9d6980e86984a3bc6d3a0944d62b7
+size 39321600
diff --git a/params_shard_33.bin b/params_shard_33.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d86642f9f3e67a09175f8d5c9157ba8986542dd5
--- /dev/null
+++ b/params_shard_33.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6608d9de5aeae08290f55e5fb1ae526d4ee898a73d1e20c990d78de4dc1ee004
+size 23040000
diff --git a/params_shard_34.bin b/params_shard_34.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bcceece10ae4fdaf9daede9c08b9717287fb6566
--- /dev/null
+++ b/params_shard_34.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3ece9ae6801008284dfddd6ae7f0c1ecbb9ee40ff11fb31063b9cc3f557e9dd8
+size 70778880
diff --git a/params_shard_35.bin b/params_shard_35.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c38c723e08d7a37ab78bb196a76f90e22db3c28c
--- /dev/null
+++ b/params_shard_35.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6756f5081f4d943e552fc969101fabc2f8b78da51452081be819c8fd41b27239
+size 35389440
diff --git a/params_shard_36.bin b/params_shard_36.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1cf38fbf1c4c86ea897eb6ad71b992f2b617b7d1
--- /dev/null
+++ b/params_shard_36.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e3a5a790056445822f1087d66a651dc9652ec6ea7036061e58f7c279e323fde9
+size 39321600
diff --git a/params_shard_37.bin b/params_shard_37.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5ecd7ce6de442b478ceba2b0fc262ba517b844fd
--- /dev/null
+++ b/params_shard_37.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d0adb8c402f82514b794de21db1a096b5d0e026f55f330cd94817d3359e34109
+size 23040000
diff --git a/params_shard_38.bin b/params_shard_38.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8323f6cfa7755af689278566ddf40d09fe988713
--- /dev/null
+++ b/params_shard_38.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3d2f81d50cdf6d455558be7d1a49da1ce8971b39a84535cf193620635af372bc
+size 70778880
diff --git a/params_shard_39.bin b/params_shard_39.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1d45964ee69b0b14c424a0d5ec6992d098123e16
--- /dev/null
+++ b/params_shard_39.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:42e5bb2d2ee46cfcf78d3db7151daef1253d68e24c08b3f5333735b1db9c3e79
+size 35389440
diff --git a/params_shard_4.bin b/params_shard_4.bin
new file mode 100644
index 0000000000000000000000000000000000000000..08f2b9dda76e708d2ccecaa5f8cb46064b1d2f1f
--- /dev/null
+++ b/params_shard_4.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4fb204aa8a7ea4f343dd1082d43c4542ad7b9cbc89aab007cd968517ef32944a
+size 39321600
diff --git a/params_shard_40.bin b/params_shard_40.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8790177251d87c92fa0851f44d56449cb6c53b66
--- /dev/null
+++ b/params_shard_40.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c0a192cfddfb8a49fa22b355822cd4053451c0bd3eb0a79cb6756dd031c9fd7a
+size 39321600
diff --git a/params_shard_41.bin b/params_shard_41.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4e19b21cb337e2107e106c01d691407761c4f216
--- /dev/null
+++ b/params_shard_41.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a2053818b112a03d757305950b6aa33d52f48f7f67a9fee5fdee3c1055895bfa
+size 23040000
diff --git a/params_shard_42.bin b/params_shard_42.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1aa26b34511f08e8f87bddefcc22f5f768b03ab9
--- /dev/null
+++ b/params_shard_42.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:467e6d2a525b62bb50b9867f26fe628d73301d0340f0e43b94f3e52d3d732c55
+size 70778880
diff --git a/params_shard_43.bin b/params_shard_43.bin
new file mode 100644
index 0000000000000000000000000000000000000000..712f9dd70dea9ae1865d424122eaeb64f48e01fd
--- /dev/null
+++ b/params_shard_43.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:87005ce235ddb4eb1875be030a4f0a6660122e97a3836a5f15fa34bc864146bc
+size 35389440
diff --git a/params_shard_44.bin b/params_shard_44.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6932eea1ac23672125af8f3d0857e44a26128c51
--- /dev/null
+++ b/params_shard_44.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c26d6cae3f744ded76f55fdd482a94a1caf5083cc2b9edb3452269236e40fbbb
+size 39321600
diff --git a/params_shard_45.bin b/params_shard_45.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c1759ac973fcbe161d63d116db9ae68037c3b509
--- /dev/null
+++ b/params_shard_45.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:13375e59873cb2866243c755be8908af0856b81e0b839af8a1ff8fa322b0112e
+size 23040000
diff --git a/params_shard_46.bin b/params_shard_46.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7c9df0e2224e4edb2cbc86a3001a2251543b1192
--- /dev/null
+++ b/params_shard_46.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ed0d657370fdb80d659397cfb8226be5c0dd57419b8fa814add7112b27d4ea85
+size 70778880
diff --git a/params_shard_47.bin b/params_shard_47.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6650fc53e4561535045747791e527f91059dd10e
--- /dev/null
+++ b/params_shard_47.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6e4740679f38e3e9396fd98975861da2657a88f8daaaac54ad9230e9de8c13cd
+size 35389440
diff --git a/params_shard_48.bin b/params_shard_48.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d4af54264a1b4488bab9eb2111b9d2e8c3566d9d
--- /dev/null
+++ b/params_shard_48.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:28544ff71d7f9a922ed102a1e672d0c258d2efec9d530ef5d57464b640878a12
+size 39321600
diff --git a/params_shard_49.bin b/params_shard_49.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3e795f686bce443d0351241151ae26ea4867d229
--- /dev/null
+++ b/params_shard_49.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4ddf589c134c620d69a197808fcea57828ab8b89b24b372e1d4f53ee75a905f7
+size 23040000
diff --git a/params_shard_5.bin b/params_shard_5.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b2a00a9125919fa2fc258d839bb5b87138d10d65
--- /dev/null
+++ b/params_shard_5.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e0b02c008a485f6f0e802cb0955a4ced2b49b593917da7d11111362e2b5647fa
+size 25497600
diff --git a/params_shard_50.bin b/params_shard_50.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6c155c67305b2080f8c9a69f44a9c712adfe369e
--- /dev/null
+++ b/params_shard_50.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:55cf411715687aae13e435794bfc40358c3ed1cdf8e2c832e26dcb8c393f656a
+size 70778880
diff --git a/params_shard_51.bin b/params_shard_51.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7558099d34d0d828ca8941b7efd4ad060f1cac7e
--- /dev/null
+++ b/params_shard_51.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b0085fcc2d3869c85221bff39ecfe2e3de64c7fc809f4c9fd12d5ee3d6f19e81
+size 35389440
diff --git a/params_shard_52.bin b/params_shard_52.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9ed504a6cc1c5ee5972964d6b753fa31f0479f5c
--- /dev/null
+++ b/params_shard_52.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:22dff3f00b3315ba516568fa2905cfc5e808db183faf37704a968524b1492a19
+size 39321600
diff --git a/params_shard_53.bin b/params_shard_53.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8cebd336caf54b97e3a933a28dff5696e3a52da6
--- /dev/null
+++ b/params_shard_53.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:942451981d0b99df0cef04fa7e6a849eed6cdf188139ecc2b2da259c306bc887
+size 23040000
diff --git a/params_shard_54.bin b/params_shard_54.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e76e45f0bb55482f58398d7eebdd61aeaa74cbf7
--- /dev/null
+++ b/params_shard_54.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b45aa8630425165c3eedd1cc0d6874df04ef65eec6713e422ecbfddbdda132b8
+size 70778880
diff --git a/params_shard_55.bin b/params_shard_55.bin
new file mode 100644
index 0000000000000000000000000000000000000000..710443bffb389cc9e8a8277abffdbf5953542472
--- /dev/null
+++ b/params_shard_55.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ee9b59dac9ad66371f8473b326a850bf18d2c2508caa771b1a9ed2429e588fdc
+size 35389440
diff --git a/params_shard_56.bin b/params_shard_56.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ae0738ff7bc02846e479bcd2c70daa32b211f7d6
--- /dev/null
+++ b/params_shard_56.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e4a91423977483f7e0bf13a493513c4884b471aaaec46fdac99d2b35ab2cf190
+size 39321600
diff --git a/params_shard_57.bin b/params_shard_57.bin
new file mode 100644
index 0000000000000000000000000000000000000000..41450604ef0f4f4b5aa3698b30dab20bd217618e
--- /dev/null
+++ b/params_shard_57.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:61dacec8dcfd6ea28a08921c60ea42715767e8443cd279d9769717647286d4df
+size 23040000
diff --git a/params_shard_58.bin b/params_shard_58.bin
new file mode 100644
index 0000000000000000000000000000000000000000..eb76f2e624686af6412d317f6bb14f5b8360f58d
--- /dev/null
+++ b/params_shard_58.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfaffea66a3679838f89309af73f79191a7a71dfb32bee67c310f7dd96a60d04
+size 70778880
diff --git a/params_shard_59.bin b/params_shard_59.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b3dafac27b49f8d1b2c48fcfde3d57ca5942365b
--- /dev/null
+++ b/params_shard_59.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bcf20d3f34327a8328ed7d790d10e89d24b4aabf42f23f2e443ef2957ac46134
+size 35389440
diff --git a/params_shard_6.bin b/params_shard_6.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a7765c94184b772adce43871cff6e484aa6aaa5e
--- /dev/null
+++ b/params_shard_6.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f799935528e98e220c265af7c943246fe7b109c346e17a609683f5c2fc8dd834
+size 70778880
diff --git a/params_shard_60.bin b/params_shard_60.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bfedb527a33545159e8736dabe6a033701820c39
--- /dev/null
+++ b/params_shard_60.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7080a8e30b51259dc57f76a82e01a7dbbbec97f0e112698d79a09fae05326564
+size 39321600
diff --git a/params_shard_61.bin b/params_shard_61.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5ac272cee0b56d6e4d5db50a8cd792b1cbfd9fd2
--- /dev/null
+++ b/params_shard_61.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b32c6dd0c7cf8a05a96173d7f046f9c861c1f99c7e61a26b33b4873a0b48b05f
+size 23040000
diff --git a/params_shard_62.bin b/params_shard_62.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1d62e9eb9bbfd1415e8d248184298f18f9c82db4
--- /dev/null
+++ b/params_shard_62.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:56c13108b32c2581b1b719f2746943ed679909ac8268338b91e6bf709af72573
+size 70778880
diff --git a/params_shard_63.bin b/params_shard_63.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4b3e8ee3c8b48aad4eb878eff0668a087d0fc785
--- /dev/null
+++ b/params_shard_63.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cab2ad9fb19794aa8a4c6410bf63476b9973bc737e672a257dfe9b22a7044223
+size 35389440
diff --git a/params_shard_64.bin b/params_shard_64.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0021c3d545e2a7d3a1d2fbfafdd63719849397d9
--- /dev/null
+++ b/params_shard_64.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ce0516e272484e98a0e82f64c3e03e58544ab0b2cf1b962d19dc9eda223538ed
+size 39321600
diff --git a/params_shard_65.bin b/params_shard_65.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a3fefc7ce81884ce25038f0e9032f650722531c8
--- /dev/null
+++ b/params_shard_65.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:162357aa2ce5b95b24086d642019b8b3d5ab7c5791f4f045ffbecc2101b24619
+size 23040000
diff --git a/params_shard_66.bin b/params_shard_66.bin
new file mode 100644
index 0000000000000000000000000000000000000000..02c3e369a28ed5a5e47eeb5f2d092a9d5fae1678
--- /dev/null
+++ b/params_shard_66.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6ef67c097849f7e1245bdcaae2cc69d9912a1fb9ee0cfd92fe3cb6e6e320a2b2
+size 70778880
diff --git a/params_shard_67.bin b/params_shard_67.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ad1f70ba80f94599a4fcd3ef2bb2a7956413fcb6
--- /dev/null
+++ b/params_shard_67.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:78644c37f6657513fc9be0f32fa9816902129dd88e5c0d0ba929fccbbc253ed6
+size 35389440
diff --git a/params_shard_68.bin b/params_shard_68.bin
new file mode 100644
index 0000000000000000000000000000000000000000..70ed1ae4f3002cfd2db395f753cbc29899fb8105
--- /dev/null
+++ b/params_shard_68.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:80148b3661c918b943eb6034f4df34f2f2d67673a9c0e0a0ce3ca964cda3f036
+size 39321600
diff --git a/params_shard_69.bin b/params_shard_69.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e822c6066212092f51ef5730696681acee3bf2ba
--- /dev/null
+++ b/params_shard_69.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2404c8012584183c1769547209955a14bcd06463b929526fbe2784e403ffb717
+size 23040000
diff --git a/params_shard_7.bin b/params_shard_7.bin
new file mode 100644
index 0000000000000000000000000000000000000000..54d11027f0b264bd1e7b193ea43e67647534820f
--- /dev/null
+++ b/params_shard_7.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ecf7cd52ed338df9f82feb95db473957e4781974d2d03b7f19eaa7dcc6fbf29c
+size 35389440
diff --git a/params_shard_70.bin b/params_shard_70.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7410fc561ef7507543b5a6c1d8fc450841fd4dd3
--- /dev/null
+++ b/params_shard_70.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:416fc3b1dc6ac3f8d0197373a1009b1900c68f82e1888ae5941716a8965b3028
+size 70778880
diff --git a/params_shard_71.bin b/params_shard_71.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b4f03697d2261730c89629cdcb61feaa5d08c363
--- /dev/null
+++ b/params_shard_71.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a7bfdd2d6c7186b8362d933ea13600e5b98eebfc458744bb92fa8726024b3742
+size 35389440
diff --git a/params_shard_72.bin b/params_shard_72.bin
new file mode 100644
index 0000000000000000000000000000000000000000..234cd50e1fcb93f1716a5c90b2e21ebb0c123cdb
--- /dev/null
+++ b/params_shard_72.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:edf72d470fde3c37e30f0c63369dc237fef87a0c78a05afe138ebccb00d04298
+size 39321600
diff --git a/params_shard_73.bin b/params_shard_73.bin
new file mode 100644
index 0000000000000000000000000000000000000000..198c4d2947ca6d2414534bf6f4258cd364b0891d
--- /dev/null
+++ b/params_shard_73.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2c8f2acf9b2a12cba10e3edd3a662dcb172e260d2e54aec4cb7f1c2278ffd4b4
+size 23040000
diff --git a/params_shard_74.bin b/params_shard_74.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b2966ee7e435cbbd2fb58d14e3b9b1db4bbcd079
--- /dev/null
+++ b/params_shard_74.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:17cc9b571bcf2829c5e3c57e7c1cd896b7df00a8e3c5e06f7e914348232a261d
+size 70778880
diff --git a/params_shard_75.bin b/params_shard_75.bin
new file mode 100644
index 0000000000000000000000000000000000000000..45ba50f6785660793dbc350926efb893fee30520
--- /dev/null
+++ b/params_shard_75.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e94557ed03641f702b6c026a35cc3d1e0836c70efb7cbbeb4c8b21f904c44978
+size 35389440
diff --git a/params_shard_76.bin b/params_shard_76.bin
new file mode 100644
index 0000000000000000000000000000000000000000..13fe60bc3830095dfedf8e7e2288bc5f5e6d87d2
--- /dev/null
+++ b/params_shard_76.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c88d32637affa2004e697f6acea03b7a4c5013d3894707123b26b160223fddd
+size 39321600
diff --git a/params_shard_77.bin b/params_shard_77.bin
new file mode 100644
index 0000000000000000000000000000000000000000..34ce9ba87867f4ecb45742bf527024f0c2686f90
--- /dev/null
+++ b/params_shard_77.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f331def8b958bacfa2f8b1cdc9cb06572b45290c8646bc13005831fd1c774276
+size 23040000
diff --git a/params_shard_78.bin b/params_shard_78.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c27bb6acffcad469fde120b40c77c8ea444eeff4
--- /dev/null
+++ b/params_shard_78.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d6abd5cdb64260b751888e2c665447225a72669222ce780cb47660b0c10e612a
+size 70778880
diff --git a/params_shard_79.bin b/params_shard_79.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7453d5f594a9f6e0e768bd03c2ee458dd64c89f1
--- /dev/null
+++ b/params_shard_79.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8c15b2789fe1eaf562877317af118580308a6a25e53e72eed3ee9349e72c98d0
+size 35389440
diff --git a/params_shard_8.bin b/params_shard_8.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4a203f13bc639715b417b2ba096ade7eae352a82
--- /dev/null
+++ b/params_shard_8.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f2b5b736ffb597d0731d0047d2f4b830e24f18830337ccd2695552585d843029
+size 39321600
diff --git a/params_shard_80.bin b/params_shard_80.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9d06802e41fe6d36ae1b40c5198dfd65cecf75bf
--- /dev/null
+++ b/params_shard_80.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:51d4b16020796798b517ddac26e4c5857d5de281916908c4166512ba20d5ccee
+size 39321600
diff --git a/params_shard_81.bin b/params_shard_81.bin
new file mode 100644
index 0000000000000000000000000000000000000000..40adbb83f2c00399793500937a5d44df7c0907bf
--- /dev/null
+++ b/params_shard_81.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3219ef4df52b5c2fc6936f16e3d443b4d3b3d3715e39273096ea708e86d542ba
+size 23040000
diff --git a/params_shard_82.bin b/params_shard_82.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1b0bb6e148c8a27c4e9c502d5b94103c88097c20
--- /dev/null
+++ b/params_shard_82.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1b4d82280c51287f505e266e95f0d11942524c0046f34df6cc6f41c2d65b70c2
+size 70778880
diff --git a/params_shard_83.bin b/params_shard_83.bin
new file mode 100644
index 0000000000000000000000000000000000000000..3f66cc218bac3d74aeb032f30c887ccbab987c9a
--- /dev/null
+++ b/params_shard_83.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4d3ee6a34492e6b9b3cb3980e0e38d19381ba92d5396b0293bccc2d265a1849a
+size 35389440
diff --git a/params_shard_84.bin b/params_shard_84.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0eeb1e0f00b2aee6f58769c4781bf6c54731804d
--- /dev/null
+++ b/params_shard_84.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:85428d150166333a7a6cd7b777a12aefebfbdec7ec30b90a6a4a4b1a000d195e
+size 39321600
diff --git a/params_shard_85.bin b/params_shard_85.bin
new file mode 100644
index 0000000000000000000000000000000000000000..80a0032e6b6cf6d4b6f27428f2668e23ccc4a2d0
--- /dev/null
+++ b/params_shard_85.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:763c4fdb13ca32234cd568d95c5d8fde9c1c49570bbf10bc061e564a6a1ae6ba
+size 23040000
diff --git a/params_shard_86.bin b/params_shard_86.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e148a135b214aa413da18d4e14594bc79d6411f4
--- /dev/null
+++ b/params_shard_86.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9b40d2c8736bcde2a3f1cf40ca7954a191c77e288d7a03445f757d978e527f09
+size 70778880
diff --git a/params_shard_87.bin b/params_shard_87.bin
new file mode 100644
index 0000000000000000000000000000000000000000..54e3b96b76055b5c0ae5b1215b98ce91249d4f4e
--- /dev/null
+++ b/params_shard_87.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:65313dcf3938b4366b9b3880986f46444409b18e399ea2713038f6ad02f6d059
+size 35389440
diff --git a/params_shard_88.bin b/params_shard_88.bin
new file mode 100644
index 0000000000000000000000000000000000000000..58101e31c6db82ce6a76845fded33450cc953b76
--- /dev/null
+++ b/params_shard_88.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d0f35e84fe4499b2084ea9d46a9f63eb91ecb108bf68ff5600bcf367f639b90
+size 39321600
diff --git a/params_shard_89.bin b/params_shard_89.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c71a7de880f971f77a63a8a72041c6da14be96a8
--- /dev/null
+++ b/params_shard_89.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fe08d5893a67eb82b23f1759838c557e23028e85077d1d1984d77e30b3a2d3e1
+size 23040000
diff --git a/params_shard_9.bin b/params_shard_9.bin
new file mode 100644
index 0000000000000000000000000000000000000000..474020fd70d0022efd47e0fbf2ab41e2e5a58805
--- /dev/null
+++ b/params_shard_9.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cf162d12b60735c7c531ebdbe8d4c1858a1a937988ffc58d289afaf0255408d6
+size 23040000
diff --git a/params_shard_90.bin b/params_shard_90.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4a3b5104b03309e441409a35765d81ba342cf8e3
--- /dev/null
+++ b/params_shard_90.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:112551dccf1ac86ce486ff40bd2d8f2197aa19b1c008fae5721e9671c994df75
+size 70778880
diff --git a/params_shard_91.bin b/params_shard_91.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0179988d054bf7c256a64653976f6fc97e4ce22a
--- /dev/null
+++ b/params_shard_91.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:22268f1c87b1640e3781ff65ad8a6617325a3f0f3e908e45970e5118d1f8d044
+size 35389440
diff --git a/params_shard_92.bin b/params_shard_92.bin
new file mode 100644
index 0000000000000000000000000000000000000000..88aa902f3ecc992724e2629c2e1740ab5bd394eb
--- /dev/null
+++ b/params_shard_92.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a635df4e8b52252a3b0df640879fe1b6536d7b1a647a456e57274445a88425b0
+size 39321600
diff --git a/params_shard_93.bin b/params_shard_93.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2098a80e3a2f8867831a7f466c1a537b8a839e30
--- /dev/null
+++ b/params_shard_93.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c4ba179cfdeb59b8cb040c0a5a51459ebdb01eb7141262151c79a39c036d8e6e
+size 23040000
diff --git a/params_shard_94.bin b/params_shard_94.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e686b43e32b329801eea1aa0ae8e7578ad8151f4
--- /dev/null
+++ b/params_shard_94.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c4032ab57f7bf15ae6edd7c31a195077b5a7401dda96bb6cb4df38432764375a
+size 70778880
diff --git a/params_shard_95.bin b/params_shard_95.bin
new file mode 100644
index 0000000000000000000000000000000000000000..257c6304210d4cf99ff3da06171fd899f2c18f9a
--- /dev/null
+++ b/params_shard_95.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d2e8bdb6073c493a453e5af9e37d0864fd9bb4f959815ced0a25ff8844f79036
+size 35389440
diff --git a/params_shard_96.bin b/params_shard_96.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2ae00a4e57f21bc1dbb66d20ae9482e49c05fd67
--- /dev/null
+++ b/params_shard_96.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7df3cee65890a261673facb0d68759796bf78e0bac4be54e357ca26bcc66fe54
+size 39321600
diff --git a/params_shard_97.bin b/params_shard_97.bin
new file mode 100644
index 0000000000000000000000000000000000000000..6c2456c5f18197079a8fb70a6653f4cfa6e0c2f0
--- /dev/null
+++ b/params_shard_97.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c498a4f12fb7d44746779b71d24bb0c946f34d366c88d2292cc52a439e53a5ee
+size 23040000
diff --git a/params_shard_98.bin b/params_shard_98.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7a6505f99f27b43f93299451348e0c6a7b5adaf8
--- /dev/null
+++ b/params_shard_98.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3548f79e8d92a7c032688362098acf9830402876909029ce045badf395eb6406
+size 70778880
diff --git a/params_shard_99.bin b/params_shard_99.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0ac0ca95ed994cc347401c28ebe74834392d3751
--- /dev/null
+++ b/params_shard_99.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:de45a7fc13ff426ed70c5696133ecbbf8ff8d44a167cf32db2370cde67d34ed4
+size 35389440
diff --git a/private-llm-config.json b/private-llm-config.json
new file mode 100644
index 0000000000000000000000000000000000000000..77fb5425213023566dd6c2aabcde50ffe7dd894a
--- /dev/null
+++ b/private-llm-config.json
@@ -0,0 +1,19 @@
+{
+ "model_lib": "spicyboros-13b-2.2-w4a16g128asym",
+ "local_id": "spicyboros-13b-2.2-w4a16g128asym",
+ "conv_template": "vicuna_v1.1",
+ "temperature": 0.7,
+ "repetition_penalty": 1.0,
+ "top_p": 0.95,
+ "mean_gen_len": 128,
+ "max_gen_len": 512,
+ "max_window_size": 3072,
+ "num_shards": 1,
+ "shift_fill_factor": 0.3,
+ "tokenizer_files": [
+ "tokenizer.model"
+ ],
+ "model_category": "llama",
+ "model_name": "spicyboros-13b-2.2",
+ "vocab_size": 32000
+}
diff --git a/tokenizer.model b/tokenizer.model
new file mode 100644
index 0000000000000000000000000000000000000000..6c00c742ce03c627d6cd5b795984876fa49fa899
--- /dev/null
+++ b/tokenizer.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
+size 499723
diff --git a/tokenizer_config.json b/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..16ada5c0af25aea4028bc3982cf88d7a6fbc0f93
--- /dev/null
+++ b/tokenizer_config.json
@@ -0,0 +1,37 @@
+{
+ "add_bos_token": true,
+ "add_eos_token": false,
+ "bos_token": {
+ "__type": "AddedToken",
+ "content": "<s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "clean_up_tokenization_spaces": false,
+ "eos_token": {
+ "__type": "AddedToken",
+ "content": "</s>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "legacy": false,
+ "model_max_length": 1000000000000000019884624838656,
+ "pad_token": null,
+ "padding_side": "right",
+ "sp_model_kwargs": {},
+ "spaces_between_special_tokens": false,
+ "tokenizer_class": "LlamaTokenizer",
+ "unk_token": {
+ "__type": "AddedToken",
+ "content": "<unk>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false
+ },
+ "use_default_system_prompt": true
+}