Xenova HF staff committed on
Commit
a8c5612
1 Parent(s): 558944c

Upload Transformers-compatible ONNX weights

Browse files
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09b950b371030de9003824baa66457f2e8fc4f96fe87a34cc4c3b242b2864d8b
3
+ size 33741738
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9888cd09b6cb062a8c65f94758c57bffbcfcc5792e1022923bc8abf05d499ee
3
+ size 8973119
onnx/quantize_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": true,
3
+ "reduce_range": true,
4
+ "per_model_config": {
5
+ "model": {
6
+ "op_types": [
7
+ "Add",
8
+ "Mul",
9
+ "Concat",
10
+ "AveragePool",
11
+ "Conv",
12
+ "Sigmoid",
13
+ "Unsqueeze",
14
+ "Gather",
15
+ "GlobalAveragePool",
16
+ "Shape",
17
+ "Pad",
18
+ "Reshape",
19
+ "Constant",
20
+ "Gemm"
21
+ ],
22
+ "weight_type": "QUInt8"
23
+ }
24
+ }
25
+ }