Xenova/wav2vec2-base-960h

Automatic Speech Recognition

Transformers.js

ONNX

wav2vec2

Model card · Files and versions · Community

Xenova (HF staff) committed on Mar 20

Commit

27103eb

•

1 Parent(s): d0cc1bf

Update quantize_config.json

Browse files

Files changed (1) hide show

quantize_config.json +102 -28

quantize_config.json CHANGED Viewed

@@ -1,31 +1,105 @@
 {
-    "per_channel": true,
-    "reduce_range": true,
-    "per_model_config": {
-        "model": {
-            "op_types": [
-                "Unsqueeze",
-                "Softmax",
-                "Add",
-                "Mul",
-                "Reshape",
-                "Pow",
-                "InstanceNormalization",
-                "Shape",
-                "Constant",
-                "MatMul",
-                "ReduceMean",
-                "Erf",
-                "Sqrt",
-                "Div",
-                "Gather",
-                "Concat",
-                "Slice",
-                "Sub",
-                "Conv",
-                "Transpose"
-            ],
-            "weight_type": "QUInt8"
-        }
     }
 }

 {
+    "fp16": {},
+    "q8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "Concat",
+                    "Constant",
+                    "Conv",
+                    "Div",
+                    "Erf",
+                    "Gather",
+                    "InstanceNormalization",
+                    "MatMul",
+                    "Mul",
+                    "Pow",
+                    "ReduceMean",
+                    "Reshape",
+                    "Shape",
+                    "Slice",
+                    "Softmax",
+                    "Sqrt",
+                    "Sub",
+                    "Transpose",
+                    "Unsqueeze"
+                ],
+                "weight_type": "QUInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "int8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "Concat",
+                    "Constant",
+                    "Conv",
+                    "Div",
+                    "Erf",
+                    "Gather",
+                    "InstanceNormalization",
+                    "MatMul",
+                    "Mul",
+                    "Pow",
+                    "ReduceMean",
+                    "Reshape",
+                    "Shape",
+                    "Slice",
+                    "Softmax",
+                    "Sqrt",
+                    "Sub",
+                    "Transpose",
+                    "Unsqueeze"
+                ],
+                "weight_type": "QInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "uint8": {
+        "per_model_config": {
+            "model": {
+                "op_types": [
+                    "Add",
+                    "Concat",
+                    "Constant",
+                    "Conv",
+                    "Div",
+                    "Erf",
+                    "Gather",
+                    "InstanceNormalization",
+                    "MatMul",
+                    "Mul",
+                    "Pow",
+                    "ReduceMean",
+                    "Reshape",
+                    "Shape",
+                    "Slice",
+                    "Softmax",
+                    "Sqrt",
+                    "Sub",
+                    "Transpose",
+                    "Unsqueeze"
+                ],
+                "weight_type": "QUInt8"
+            }
+        },
+        "per_channel": false,
+        "reduce_range": false
+    },
+    "q4": {
+        "block_size": 32,
+        "is_symmetric": true,
+        "accuracy_level": null
+    },
+    "bnb4": {
+        "block_size": 64,
+        "quant_type": 1
     }
 }