Upload improved model weights.

Browse files

Files changed (7) hide show

onnx/decoder_model.onnx +1 -1
onnx/decoder_model_merged.onnx +1 -1
onnx/decoder_model_merged_quantized.onnx +1 -1
onnx/decoder_model_quantized.onnx +1 -1
onnx/decoder_with_past_model.onnx +1 -1
onnx/decoder_with_past_model_quantized.onnx +1 -1
quantize_config.json +52 -52

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:203088c58b43ed3d529666bd1e8b7abf84c8c4bc33a929b181cce280776b5bd2
 size 499275976

 version https://git-lfs.github.com/spec/v1
+oid sha256:04797f6f61f2ac95d7e53467d7b880005af0e7d6e23ac7af61c8966d387479a8
 size 499275976

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:33238cfce1785c347e0ac7134f2500fadfa7f5af6e537a7bb2a769d9e4217260
 size 500799139

 version https://git-lfs.github.com/spec/v1
+oid sha256:b064a9a5e6c51608025266be8ba9d6ccf0ba588b6476a2498f29164ddadc41b1
 size 500799139

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:da6257be48d422fe7b0a71e2be74b1cec2f1d7637d9ec552c8f9e5ea4102de32
 size 128730727

 version https://git-lfs.github.com/spec/v1
+oid sha256:28ec91a265697bed4cdd4d560c83d6eafb7911ed51e7c3e3f6dc77395309884e
 size 128730727

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0fc84ac6c0b3de482208b865e23c05f718d116587abeca70cee52bc607c78db8
 size 126971841

 version https://git-lfs.github.com/spec/v1
+oid sha256:00d7b62491d00c106617e73bdb3568d8e864700a1b8d6668d6dbdf2b70ab5016
 size 126971841

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bccf364af191d522910eac476249a8f386489fe79287e9b30de307420129275b
 size 499282782

 version https://git-lfs.github.com/spec/v1
+oid sha256:c44ea42f606fdcb678b4a8637c6c23e9e826c692f54f8b17d60d53b25459b2bc
 size 499282782

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b4a108612c823b5ad4c00257dc6937fe3beca7ef4494944761360e080f563ef9
 size 126980889

 version https://git-lfs.github.com/spec/v1
+oid sha256:f7cffc5fce24929f862e04df1188478fa565dc03049ec61a2350b9d04f080398
 size 126980889

quantize_config.json CHANGED Viewed

@@ -4,92 +4,92 @@
     "per_model_config": {
         "decoder_model": {
             "op_types": [
-                "Shape",
                 "Pow",
                 "Concat",
                 "Div",
-                "Add",
-                "Cast",
-                "Slice",
                 "Sub",
-                "Gather",
                 "ConstantOfShape",
-                "MatMul",
                 "Reshape",
                 "Where",
-                "Unsqueeze",
-                "Tanh",
-                "Transpose",
-                "Squeeze",
-                "Softmax",
-                "ReduceMean",
-                "Constant",
-                "Mul",
-                "Split",
                 "Sqrt",
-                "Range",
-                "Gemm"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
-                "Shape",
                 "Pow",
-                "If",
                 "Concat",
                 "Div",
-                "Add",
-                "Cast",
-                "Slice",
                 "Sub",
-                "Gather",
                 "ConstantOfShape",
-                "MatMul",
                 "Reshape",
                 "Where",
-                "Unsqueeze",
-                "Tanh",
-                "Transpose",
-                "Squeeze",
-                "Softmax",
-                "ReduceMean",
-                "Constant",
-                "Mul",
-                "Split",
                 "Sqrt",
-                "Range",
-                "Gemm"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
-                "Shape",
                 "Pow",
                 "Concat",
                 "Div",
-                "Add",
-                "Cast",
-                "Slice",
                 "Sub",
-                "Gather",
                 "ConstantOfShape",
-                "MatMul",
                 "Reshape",
                 "Where",
-                "Unsqueeze",
-                "Tanh",
-                "Transpose",
-                "Squeeze",
-                "Softmax",
-                "ReduceMean",
-                "Constant",
-                "Mul",
-                "Split",
                 "Sqrt",
-                "Range",
-                "Gemm"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "decoder_model": {
             "op_types": [
+                "Slice",
+                "Gemm",
+                "Split",
                 "Pow",
                 "Concat",
+                "Transpose",
+                "Gather",
+                "Tanh",
+                "Softmax",
+                "Mul",
                 "Div",
+                "ReduceMean",
+                "Range",
                 "Sub",
                 "ConstantOfShape",
                 "Reshape",
+                "MatMul",
                 "Where",
+                "Cast",
                 "Sqrt",
+                "Shape",
+                "Squeeze",
+                "Add",
+                "Unsqueeze",
+                "Constant"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
+                "Slice",
+                "Gemm",
+                "Split",
                 "Pow",
                 "Concat",
+                "Transpose",
+                "Gather",
+                "Tanh",
+                "Softmax",
+                "If",
+                "Mul",
                 "Div",
+                "ReduceMean",
+                "Range",
                 "Sub",
                 "ConstantOfShape",
                 "Reshape",
+                "MatMul",
                 "Where",
+                "Cast",
                 "Sqrt",
+                "Shape",
+                "Squeeze",
+                "Add",
+                "Unsqueeze",
+                "Constant"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Slice",
+                "Gemm",
+                "Split",
                 "Pow",
                 "Concat",
+                "Transpose",
+                "Gather",
+                "Tanh",
+                "Softmax",
+                "Mul",
                 "Div",
+                "ReduceMean",
+                "Range",
                 "Sub",
                 "ConstantOfShape",
                 "Reshape",
+                "MatMul",
                 "Where",
+                "Cast",
                 "Sqrt",
+                "Shape",
+                "Squeeze",
+                "Add",
+                "Unsqueeze",
+                "Constant"
             ],
             "weight_type": "QInt8"
         }