Skip to content

Commit c06b0ef

Browse files
committed
Only support int8 dtype for quant operators
1 parent 8cfa858 commit c06b0ef

File tree

1 file changed

+10
-2
lines changed

1 file changed

+10
-2
lines changed

backends/xnnpack/partition/config/xnnpack_config.py

Lines changed: 10 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -10,12 +10,17 @@
 old  new
  10   10    from typing import List, Optional
  11   11
  12   12    import torch
       13 +  from torch.export import ExportedProgram
       14 +  from executorch.backends.xnnpack.utils.quant_utils import (
       15 +      is_quant,
       16 +      is_dequant,
       17 +      is_qparam,
       18 +  )
  13   19    from executorch.exir.backend.canonical_partitioners.config_partitioner import (
  14   20        format_target_name,
  15   21        PartitionerConfig,
  16   22    )
  17   23    from executorch.exir.backend.utils import WhyNoPartition
  18      -  from torch.export import ExportedProgram
  19   24
  20   25    logger = logging.getLogger(__name__)
  21   26    why = WhyNoPartition(logger=logger)
@@ -220,9 +225,12 @@ def _check_node_has_valid_dtype(self, node):
 old  new
 220  225            valid_dtypes = {
 221  226                torch.float32,
 222  227                torch.float16,
 223      -              torch.int8,
 224  228                torch.qint8,
 225  229            }
      230 +          # Only allow int8 for quantization operations
      231 +          if is_quant(node) or is_dequant(node) or is_qparam(node):
      232 +              valid_dtypes.add(torch.int8)
      233 +
 226  234            if (
 227  235                node.op != "placeholder"
 228  236                and node.op != "call_function"
0 commit comments

Comments
 (0)