onnx/quantize_config.json
527 B · 24 lines · json Raw
1 {
2 "per_channel": false,
3 "reduce_range": false,
4 "per_model_config": {
5 "model": {
6 "op_types": [
7 "Concat",
8 "MaxPool",
9 "Resize",
10 "Conv",
11 "Unsqueeze",
12 "Cast",
13 "Shape",
14 "Relu",
15 "Sigmoid",
16 "Gather",
17 "Constant",
18 "Slice",
19 "Add"
20 ],
21 "weight_type": "QUInt8"
22 }
23 }
24 }