Upload Transformers-compatible ONNX weights

Files changed (3) hide show

onnx/model.onnx ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:09b950b371030de9003824baa66457f2e8fc4f96fe87a34cc4c3b242b2864d8b
+size 33741738

onnx/model_quantized.onnx ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:f9888cd09b6cb062a8c65f94758c57bffbcfcc5792e1022923bc8abf05d499ee
+size 8973119

onnx/quantize_config.json ADDED Viewed

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "model": {
+            "op_types": [
+                "Add",
+                "Mul",
+                "Concat",
+                "AveragePool",
+                "Conv",
+                "Sigmoid",
+                "Unsqueeze",
+                "Gather",
+                "GlobalAveragePool",
+                "Shape",
+                "Pad",
+                "Reshape",
+                "Constant",
+                "Gemm"
+            ],
+            "weight_type": "QUInt8"
+        }
+    }
+}