johnomeara committed on
Commit
ab7110b
·
verified ·
1 Parent(s): 1f63835

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. onnx/model_quantized.onnx +2 -2
  2. ort_config.json +25 -6
onnx/model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a3bda057b541217345984a0574ca39c22eba4ef02daf1656cc1033ab1fc4f20
3
- size 24417500
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:089213f71783e3a0a41eee1db4af6a1d7bfc5272c35076879e0fd9fea323248a
3
+ size 24625229
ort_config.json CHANGED
@@ -11,21 +11,40 @@
11
  "nodes_to_exclude": [],
12
  "nodes_to_quantize": [],
13
  "operators_to_quantize": [
 
 
 
14
  "Conv",
 
 
 
 
15
  "MatMul",
16
- "Attention",
17
- "LSTM",
18
- "Gather",
19
  "Transpose",
20
- "EmbedLayerNormalization"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21
  ],
22
- "per_channel": false,
23
  "qdq_add_pair_to_weight": false,
24
  "qdq_dedicated_pair": false,
25
  "qdq_op_type_per_channel_support_to_axis": {
26
  "MatMul": 1
27
  },
28
- "reduce_range": false,
29
  "weights_dtype": "QUInt8",
30
  "weights_symmetric": true
31
  },
 
11
  "nodes_to_exclude": [],
12
  "nodes_to_quantize": [],
13
  "operators_to_quantize": [
14
+ "Concat",
15
+ "Constant",
16
+ "Resize",
17
  "Conv",
18
+ "Div",
19
+ "Unsqueeze",
20
+ "Shape",
21
+ "Gemm",
22
  "MatMul",
 
 
 
23
  "Transpose",
24
+ "Pow",
25
+ "Softmax",
26
+ "Slice",
27
+ "Where",
28
+ "Expand",
29
+ "ReduceMean",
30
+ "Mul",
31
+ "Add",
32
+ "Sqrt",
33
+ "Gather",
34
+ "Sub",
35
+ "ConstantOfShape",
36
+ "Reshape",
37
+ "Equal",
38
+ "Identity",
39
+ "Erf"
40
  ],
41
+ "per_channel": true,
42
  "qdq_add_pair_to_weight": false,
43
  "qdq_dedicated_pair": false,
44
  "qdq_op_type_per_channel_support_to_axis": {
45
  "MatMul": 1
46
  },
47
+ "reduce_range": true,
48
  "weights_dtype": "QUInt8",
49
  "weights_symmetric": true
50
  },