From 3432700c5ba23132ddd3ed62e2f7a842fe8516bf Mon Sep 17 00:00:00 2001 From: dlyakhov Date: Mon, 21 Jul 2025 17:54:58 +0200 Subject: [PATCH] [TorchFX] Use torchao for quantize_pt2e API when possible --- .../torch/fx/quantization/qdq_parameters.py | 42 + .../torch/fx/quantization/quantize_model.py | 7 +- .../torch/fx/quantization/quantize_pt2e.py | 15 +- .../quantizer/openvino_quantizer.py | 27 +- .../quantizer/torch_ao_adapter.py | 25 +- .../experimental/torch/fx/transformations.py | 108 +- .../algorithms/min_max/torch_fx_backend.py | 49 +- .../XNNPACKQuantizer/mobilenet_v3_small.dot | 1056 ----- .../mobilenet_v3_small_ref_qconfig.json | 1352 ------ .../data/fx/XNNPACKQuantizer/resnet18.dot | 385 -- .../resnet18_ref_qconfig.json | 424 -- .../data/fx/XNNPACKQuantizer/swin_v2_t.dot | 3906 ----------------- .../swin_v2_t_ref_qconfig.json | 2813 ------------ .../synthetic_transformer.dot | 45 - .../synthetic_transformer_ref_qconfig.json | 46 - .../torch2/data/fx/XNNPACKQuantizer/unet.dot | 421 -- .../fx/XNNPACKQuantizer/unet_ref_qconfig.json | 451 -- .../data/fx/XNNPACKQuantizer/vit_b_16.dot | 2121 --------- .../vit_b_16_ref_qconfig.json | 1764 -------- .../XNNPACKQuantizer/yolo11n_sdpa_block.dot | 57 - .../yolo11n_sdpa_block_ref_qconfig.json | 30 - .../mobilenet_v3_small.dot | 144 +- .../resnet18.dot | 84 +- .../swin_v2_t.dot | 212 +- .../synthetic_transformer.dot | 8 +- .../unet.dot | 92 +- .../vit_b_16.dot | 200 +- .../yolo11n_sdpa_block.dot | 4 +- tests/torch2/fx/helpers.py | 4 +- .../fx/test_calculation_quantizer_params.py | 42 +- tests/torch2/fx/test_model_transformer.py | 44 +- tests/torch2/fx/test_quantizer.py | 48 +- 32 files changed, 616 insertions(+), 15410 deletions(-) create mode 100644 src/nncf/experimental/torch/fx/quantization/qdq_parameters.py delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/mobilenet_v3_small.dot delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/mobilenet_v3_small_ref_qconfig.json delete mode 100644 
tests/torch2/data/fx/XNNPACKQuantizer/resnet18.dot delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/resnet18_ref_qconfig.json delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/swin_v2_t.dot delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/swin_v2_t_ref_qconfig.json delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/synthetic_transformer.dot delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/synthetic_transformer_ref_qconfig.json delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/unet.dot delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/unet_ref_qconfig.json delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/vit_b_16.dot delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/vit_b_16_ref_qconfig.json delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/yolo11n_sdpa_block.dot delete mode 100644 tests/torch2/data/fx/XNNPACKQuantizer/yolo11n_sdpa_block_ref_qconfig.json diff --git a/src/nncf/experimental/torch/fx/quantization/qdq_parameters.py b/src/nncf/experimental/torch/fx/quantization/qdq_parameters.py new file mode 100644 index 00000000000..eb2c3121339 --- /dev/null +++ b/src/nncf/experimental/torch/fx/quantization/qdq_parameters.py @@ -0,0 +1,42 @@ +# Copyright (c) 2025 Intel Corporation +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# http://www.apache.org/licenses/LICENSE-2.0 +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+ +from dataclasses import dataclass + +import torch + + +@dataclass +class TorchQDQParameters: + """ + Stores the quantization parameters required for + creation of a PyTorch quantize-dequantize pair. + + :param quant_min: Minimum quant value. + :type quant_min: int + :param quant_max: Maximum quant value. + :type quant_max: int + :param scale: Defines the scale factor used for quantization. + :type scale: torch.Tensor + :param zero_point: Specifies the quantized value to which 0 in floating point maps to. + :type zero_point: torch.Tensor + :param is_per_channel: Whether quantization is applied per channel. + :type is_per_channel: bool + :param ch_axis: Channel axis used for per-channel quantization. + :type ch_axis: int + """ + + quant_min: int + quant_max: int + scale: torch.Tensor + zero_point: torch.Tensor + is_per_channel: bool + ch_axis: int diff --git a/src/nncf/experimental/torch/fx/quantization/quantize_model.py b/src/nncf/experimental/torch/fx/quantization/quantize_model.py index 6daa6b5bc34..f08ba6fbeaa 100644 --- a/src/nncf/experimental/torch/fx/quantization/quantize_model.py +++ b/src/nncf/experimental/torch/fx/quantization/quantize_model.py @@ -17,6 +17,7 @@ from torch.ao.quantization.pt2e.port_metadata_pass import PortNodeMetaForQDQ from torch.ao.quantization.pt2e.qat_utils import _fold_conv_bn_qat from torch.ao.quantization.pt2e.utils import _disallow_eval_train +from torch.ao.quantization.pt2e.utils import _fuse_conv_bn_ from torch.fx import GraphModule from torch.fx.passes.infra.pass_manager import PassManager @@ -27,7 +28,6 @@ from nncf.data import Dataset from nncf.experimental.torch.fx.quantization.backend_parameters import is_weight_compression_needed from nncf.experimental.torch.fx.transformations import DuplicateDQPassNoAnnotations -from nncf.experimental.torch.fx.transformations import apply_quantization_transformations from nncf.experimental.torch.fx.transformations import compress_post_quantize_transformation from 
nncf.experimental.torch.fx.transformations import fq_weights_transformation from nncf.parameters import BackupMode @@ -87,8 +87,9 @@ def quantize_impl( advanced_parameters=advanced_parameters, ) - # To make it easier for bias correction algorithms. - apply_quantization_transformations(copied_model) + # Fuse batch norms to convolutions bias + # the same way it is done in torchao + _fuse_conv_bn_(copied_model) nncf_graph = NNCFGraphFactory.create(copied_model) quantized_model = quantization_algorithm.apply(copied_model, nncf_graph, dataset=calibration_dataset) diff --git a/src/nncf/experimental/torch/fx/quantization/quantize_pt2e.py b/src/nncf/experimental/torch/fx/quantization/quantize_pt2e.py index 3f0b3186310..e23259fb862 100644 --- a/src/nncf/experimental/torch/fx/quantization/quantize_pt2e.py +++ b/src/nncf/experimental/torch/fx/quantization/quantize_pt2e.py @@ -14,10 +14,6 @@ import torch import torch.fx -from torch.ao.quantization.pt2e.port_metadata_pass import PortNodeMetaForQDQ -from torch.ao.quantization.pt2e.utils import _disallow_eval_train -from torch.ao.quantization.pt2e.utils import _fuse_conv_bn_ -from torch.ao.quantization.quantizer import Quantizer from torch.fx import GraphModule from torch.fx.passes.infra.pass_manager import PassManager @@ -38,6 +34,17 @@ from nncf.quantization.advanced_parameters import AdvancedSmoothQuantParameters from nncf.quantization.range_estimator import RangeEstimatorParameters +try: + from torchao.quantization.pt2e.quantizer import Quantizer + from torchao.quantization.pt2e.quantizer.port_metadata_pass import PortNodeMetaForQDQ + from torchao.quantization.pt2e.utils import _disallow_eval_train + from torchao.quantization.pt2e.utils import _fuse_conv_bn_ +except ImportError: + from torch.ao.quantization.pt2e.port_metadata_pass import PortNodeMetaForQDQ + from torch.ao.quantization.pt2e.utils import _disallow_eval_train + from torch.ao.quantization.pt2e.utils import _fuse_conv_bn_ + from torch.ao.quantization.quantizer import 
Quantizer + @api(canonical_alias="nncf.experimental.torch.fx.quantize_pt2e") def quantize_pt2e( diff --git a/src/nncf/experimental/torch/fx/quantization/quantizer/openvino_quantizer.py b/src/nncf/experimental/torch/fx/quantization/quantizer/openvino_quantizer.py index 55611a7d095..26a955a8903 100644 --- a/src/nncf/experimental/torch/fx/quantization/quantizer/openvino_quantizer.py +++ b/src/nncf/experimental/torch/fx/quantization/quantizer/openvino_quantizer.py @@ -13,14 +13,6 @@ from typing import Optional, Union import torch.fx -from torch.ao.quantization.observer import HistogramObserver -from torch.ao.quantization.observer import PerChannelMinMaxObserver -from torch.ao.quantization.quantizer.quantizer import EdgeOrNode -from torch.ao.quantization.quantizer.quantizer import QuantizationAnnotation as TorchAOQuantizationAnnotation -from torch.ao.quantization.quantizer.quantizer import QuantizationSpec as TorchAOQuantizationSpec -from torch.ao.quantization.quantizer.quantizer import QuantizationSpecBase as TorchAOQuantizationSpecBase -from torch.ao.quantization.quantizer.quantizer import Quantizer as TorchAOQuantizer -from torch.ao.quantization.quantizer.quantizer import SharedQuantizationSpec as TorchAOSharedQuantizationSpec import nncf from nncf import IgnoredScope @@ -43,6 +35,25 @@ from nncf.quantization.algorithms.min_max.algorithm import MinMaxQuantization from nncf.torch.model_graph_manager import get_weight_tensor_port_ids +try: + from torchao.quantization.pt2e.observer import HistogramObserver + from torchao.quantization.pt2e.observer import PerChannelMinMaxObserver + from torchao.quantization.pt2e.quantizer.quantizer import EdgeOrNode + from torchao.quantization.pt2e.quantizer.quantizer import QuantizationAnnotation as TorchAOQuantizationAnnotation + from torchao.quantization.pt2e.quantizer.quantizer import QuantizationSpec as TorchAOQuantizationSpec + from torchao.quantization.pt2e.quantizer.quantizer import QuantizationSpecBase as 
TorchAOQuantizationSpecBase + from torchao.quantization.pt2e.quantizer.quantizer import Quantizer as TorchAOQuantizer + from torchao.quantization.pt2e.quantizer.quantizer import SharedQuantizationSpec as TorchAOSharedQuantizationSpec +except ImportError: + from torch.ao.quantization.observer import HistogramObserver + from torch.ao.quantization.observer import PerChannelMinMaxObserver + from torch.ao.quantization.quantizer.quantizer import EdgeOrNode + from torch.ao.quantization.quantizer.quantizer import QuantizationAnnotation as TorchAOQuantizationAnnotation + from torch.ao.quantization.quantizer.quantizer import QuantizationSpec as TorchAOQuantizationSpec + from torch.ao.quantization.quantizer.quantizer import QuantizationSpecBase as TorchAOQuantizationSpecBase + from torch.ao.quantization.quantizer.quantizer import Quantizer as TorchAOQuantizer + from torch.ao.quantization.quantizer.quantizer import SharedQuantizationSpec as TorchAOSharedQuantizationSpec + QUANT_ANNOTATION_KEY = "quantization_annotation" diff --git a/src/nncf/experimental/torch/fx/quantization/quantizer/torch_ao_adapter.py b/src/nncf/experimental/torch/fx/quantization/quantizer/torch_ao_adapter.py index af5f0358edd..46d455147b0 100644 --- a/src/nncf/experimental/torch/fx/quantization/quantizer/torch_ao_adapter.py +++ b/src/nncf/experimental/torch/fx/quantization/quantizer/torch_ao_adapter.py @@ -15,11 +15,6 @@ import torch import torch.fx -from torch.ao.quantization.pt2e.prepare import _get_edge_or_node_to_group_id -from torch.ao.quantization.pt2e.prepare import _get_edge_or_node_to_qspec -from torch.ao.quantization.quantizer import Quantizer as TorchAOQuantizer -from torch.ao.quantization.quantizer.quantizer import QuantizationSpec -from torch.ao.quantization.quantizer.quantizer import SharedQuantizationSpec import nncf from nncf.common.graph.graph import NNCFGraph @@ -34,12 +29,26 @@ from nncf.experimental.torch.fx.nncf_graph_builder import GraphConverter from nncf.tensor.definitions import 
TensorDataType +try: + from torchao.quantization.pt2e.prepare import _get_edge_or_node_to_group_id + from torchao.quantization.pt2e.prepare import _get_edge_or_node_to_qspec + from torchao.quantization.pt2e.quantizer import Quantizer as TorchAOQuantizer + from torchao.quantization.pt2e.quantizer.quantizer import QuantizationSpec + from torchao.quantization.pt2e.quantizer.quantizer import SharedQuantizationSpec +except ImportError: + from torch.ao.quantization.pt2e.prepare import _get_edge_or_node_to_group_id + from torch.ao.quantization.pt2e.prepare import _get_edge_or_node_to_qspec + from torch.ao.quantization.quantizer import Quantizer as TorchAOQuantizer + from torch.ao.quantization.quantizer.quantizer import QuantizationSpec + from torch.ao.quantization.quantizer.quantizer import SharedQuantizationSpec + + EdgeOrNode = Union[tuple[torch.fx.Node, torch.fx.Node]] class TorchAOQuantizerAdapter(Quantizer): """ - Implementation of the NNCF Quantizer interface for any given torch.ao quantizer. + Implementation of the NNCF Quantizer interface for any given torchao quantizer. """ def __init__(self, quantizer: TorchAOQuantizer): @@ -120,7 +129,7 @@ def _get_node_args(node: torch.fx.Node) -> tuple[Any, ...]: def get_quantizer_config_from_annotated_model(annotated: torch.fx.GraphModule) -> SingleConfigQuantizerSetup: """ Process a torch.fx.GraphModule annotated with quantization specifications - (e.g., via torch.ao observers) and generates a corresponding NNCF quantization setup object, + (e.g., via torchao observers) and generates a corresponding NNCF quantization setup object, which maps quantization configurations to graph edges. :param annotated: A torch.fx.GraphModule that has been annotated with Torch quantization observers. 
@@ -149,7 +158,7 @@ def get_quantizer_config_from_annotated_model(annotated: torch.fx.GraphModule) - if qspec is None: continue if not isinstance(qspec, QuantizationSpec): - msg = f"Unknown torch.ao quantization spec: {qspec}" + msg = f"Unknown torchao quantization spec: {qspec}" raise nncf.InternalError(msg) if qspec.qscheme in [torch.per_channel_affine, torch.per_channel_symmetric]: diff --git a/src/nncf/experimental/torch/fx/transformations.py b/src/nncf/experimental/torch/fx/transformations.py index b2720262e81..2e7099e64cb 100644 --- a/src/nncf/experimental/torch/fx/transformations.py +++ b/src/nncf/experimental/torch/fx/transformations.py @@ -15,12 +15,9 @@ import torch import torch.fx -from torch.ao.quantization.fx.utils import create_getattr_from_value -from torch.ao.quantization.pt2e.utils import _fuse_conv_bn_ from torch.fx.node import map_arg from torch.fx.passes.infra.pass_base import PassBase from torch.fx.passes.infra.pass_base import PassResult -from torch.quantization.fake_quantize import FakeQuantize import nncf import nncf.torch @@ -29,6 +26,7 @@ from nncf.experimental.torch.fx.constant_folding import constant_fold from nncf.experimental.torch.fx.node_utils import get_graph_node_by_name from nncf.experimental.torch.fx.node_utils import get_tensor_constant_from_node +from nncf.experimental.torch.fx.quantization.qdq_parameters import TorchQDQParameters from nncf.torch.graph.transformations.commands import PTTargetPoint TransformationFNType = Callable[[torch.fx.GraphModule], None] @@ -223,16 +221,16 @@ def constant_update_fn( def qdq_insertion_transformation_builder( - quantizer: FakeQuantize, target_points: list[PTTargetPoint] + parameters: TorchQDQParameters, target_points: list[PTTargetPoint] ) -> TransformationFNType: """ - Returns transformation which inserts quantize-dequantize operations with parameters - inherited from the given quantizer to each given target point. 
+ Returns transformation which inserts quantize-dequantize operations with + the given parameters to each given target point. - :param quantizer: Quantizer module to inherit quantization parameters from. + :param parameters: Quantization parameters. :param target_points: List of target point used to insert quantize-dequantize pairs. - :return: Transformation which inserts quantize-dequantize operations with parameters - inherited from the given quantizer to each given target point. + :return: Transformation which inserts quantize-dequantize operations with + the given parameters to each given target point. """ def qdq_insertion_transformation(model: torch.fx.GraphModule): @@ -243,7 +241,7 @@ def qdq_insertion_transformation(model: torch.fx.GraphModule): ) raise nncf.InternalError(msg) for target_point in target_points: - insert_one_qdq(model, target_point, quantizer) + insert_one_qdq(model, target_point, parameters) return qdq_insertion_transformation @@ -311,38 +309,38 @@ def output_insertion_transformation(model: torch.fx.GraphModule): return output_insertion_transformation -def insert_one_qdq(model: torch.fx.GraphModule, target_point: PTTargetPoint, quantizer: FakeQuantize): +def insert_one_qdq(model: torch.fx.GraphModule, target_point: PTTargetPoint, parameters: TorchQDQParameters): """ Inserts quantize-dequantize after the target node to the target model. :param model: Target model. :param target_node: Target node, quantizer-dequantizer pair is inserted just after the target node. - :param quantizer: Quantizer module to inherit quantization parameters from. + :param parameters: Quantization parameters. """ - # Copied from torch.ao.quantization.quantize_pt2e.convert_pt2e + # Copied from torchao.quantization.pt2e.quantize_pt2e.convert_pt2e # 1. 
extract information for inserting q/dq node from activation_post_process node_type = "call_function" quantize_op: Optional[Callable] = None - dtype = torch.int8 if quantizer.quant_min < 0 else torch.uint8 - if quantizer.is_per_channel: + dtype = torch.int8 if parameters.quant_min < 0 else torch.uint8 + if parameters.is_per_channel: qparams = { - "_scale_": quantizer.scale, - "_zero_point_": quantizer.zero_point, - "_axis_": quantizer.ch_axis, - "_quant_min_": quantizer.quant_min, - "_quant_max_": quantizer.quant_max, + "_scale_": parameters.scale, + "_zero_point_": parameters.zero_point, + "_axis_": parameters.ch_axis, + "_quant_min_": parameters.quant_min, + "_quant_max_": parameters.quant_max, "_dtype_": dtype, } quantize_op = torch.ops.quantized_decomposed.quantize_per_channel.default dequantize_op = torch.ops.quantized_decomposed.dequantize_per_channel.default else: qparams = { - "_scale_": float(quantizer.scale), - "_zero_point_": int(quantizer.zero_point), - "_quant_min_": quantizer.quant_min, - "_quant_max_": quantizer.quant_max, + "_scale_": float(parameters.scale), + "_zero_point_": int(parameters.zero_point), + "_quant_min_": parameters.quant_min, + "_quant_max_": parameters.quant_max, "_dtype_": dtype, } quantize_op = torch.ops.quantized_decomposed.quantize_per_tensor.default @@ -721,19 +719,6 @@ def match_filters(match, original_graph, graph): _set_meta_for_matches(model, matches) -def apply_quantization_transformations(model: torch.fx.GraphModule) -> None: - """ - Applies quantization transformations to the model. - - :param model: Model to apply transformations to. - """ - # BatchNorm operations have 3 output ports, - # to make it easier for algorithms to work - # with the target graph BatchNorm operations - # are being fused - _fuse_conv_bn_(model) - - def fold_constant_except_qdq(model: torch.fx.GraphModule): """ Performs constant folding avoiding quantize-dequantize pattern. 
@@ -826,3 +811,52 @@ def call(self, graph_module: torch.fx.GraphModule) -> PassResult: graph_module.graph.eliminate_dead_code() graph_module.recompile() return PassResult(graph_module, True) + + +def get_device(module: torch.nn.Module) -> torch.device: + """ + Retrieves device of the first parameter of the given module. + If there are no parameters - returns CPU device. + + :param module: A torch.nn.Module instance. + :return: A device of the first parameter of the given module. + If there are no parameters - returns CPU device. + """ + try: + named_param = next(module.parameters()) + except StopIteration: + named_param = None + if named_param is None: + return torch.device("cpu") + return named_param.device + + +def create_getattr_from_value(module: torch.nn.Module, graph: torch.fx.Graph, prefix: str, value: Any) -> torch.fx.Node: + """ + Given a value of any type, creates a getattr node corresponding to the value and + registers the value as a buffer to the module. + + :param module: A torch.nn.Module instance. + :param graph: A torch.fx.Graph instance. + :param prefix: A string to use as a name prefix for the new getattr node. + :param value: A value + :return: A getattr node corresponding to the given value. 
+ """ + + def get_new_attr_name(module: torch.nn.Module, prefix: str): + def get_attr_name(i: int): + return prefix + str(i) + + i = 0 + attr_name = get_attr_name(i) + while hasattr(module, attr_name): + i += 1 + attr_name = get_attr_name(i) + return attr_name + + attr_name = get_new_attr_name(module, prefix.replace(".", "_")) + device = get_device(module) + new_value = value.detach().clone() if isinstance(value, torch.Tensor) else torch.tensor(value, device=device) + module.register_buffer(attr_name, new_value) + attr_node = graph.create_node("get_attr", attr_name) + return attr_node diff --git a/src/nncf/quantization/algorithms/min_max/torch_fx_backend.py b/src/nncf/quantization/algorithms/min_max/torch_fx_backend.py index eb14a764c8f..00ebbee14d4 100644 --- a/src/nncf/quantization/algorithms/min_max/torch_fx_backend.py +++ b/src/nncf/quantization/algorithms/min_max/torch_fx_backend.py @@ -12,7 +12,6 @@ from typing import Optional import torch -from torch.quantization.fake_quantize import FakeQuantize import nncf import nncf.torch.graph.operator_metatypes as om @@ -30,6 +29,7 @@ from nncf.experimental.common.tensor_statistics.collectors import TensorReducerBase from nncf.experimental.torch.fx.commands import FXApplyTransformationCommand from nncf.experimental.torch.fx.model_utils import get_target_point +from nncf.experimental.torch.fx.quantization.qdq_parameters import TorchQDQParameters from nncf.experimental.torch.fx.transformations import qdq_insertion_transformation_builder from nncf.parameters import ModelType from nncf.parameters import TargetDevice @@ -180,11 +180,11 @@ def _get_channel_axis(is_weight_quantizer: bool) -> int: return 1 @staticmethod - def _create_quantizer( + def _get_torch_qdq_params( quantizer_config: QuantizerConfig, parameters: FakeQuantizeParameters, is_weight_quantizer: bool, - ) -> FakeQuantize: + ) -> TorchQDQParameters: per_channel = quantizer_config.per_channel dtype = None if isinstance(quantizer_config, TypedQuantizerConfig): 
@@ -203,11 +203,6 @@ def _create_quantizer( else TensorDataType.uint8 ) - if per_channel: - observer = torch.ao.quantization.observer.PerChannelMinMaxObserver - else: - observer = torch.ao.quantization.observer.MinMaxObserver - if dtype is TensorDataType.int8: level_high = 127 level_low = -128 @@ -221,11 +216,6 @@ def _create_quantizer( else: level_high -= 1 - if quantizer_config.mode == QuantizationScheme.SYMMETRIC: - qscheme = torch.per_channel_symmetric if per_channel else torch.per_tensor_symmetric - else: - qscheme = torch.per_channel_affine if per_channel else torch.per_tensor_affine - scale, zero_point = get_scale_zp_from_input_low_input_high( level_low, level_high, parameters.input_low.data, parameters.input_high.data ) @@ -233,23 +223,18 @@ def _create_quantizer( scale = scale.view(-1) zero_point = zero_point.view(-1) - fakequantizer = FakeQuantize( - observer=observer, - quant_max=level_high, - quant_min=level_low, - dtype=torch.qint8 if dtype is TensorDataType.int8 else torch.quint8, - qscheme=qscheme, - eps=1e-16, - ) - - fakequantizer.scale = scale - fakequantizer.zero_point = zero_point + ch_axis = -1 if per_channel: - fakequantizer.ch_axis = FXMinMaxAlgoBackend._get_channel_axis(is_weight_quantizer) + ch_axis = FXMinMaxAlgoBackend._get_channel_axis(is_weight_quantizer) - # Disable observer to save parameters - fakequantizer.disable_observer() - return fakequantizer + return TorchQDQParameters( + quant_min=level_low, + quant_max=level_high, + scale=scale, + zero_point=zero_point, + is_per_channel=per_channel, + ch_axis=ch_axis, + ) @staticmethod def create_quantizer_insertion_command( @@ -258,10 +243,10 @@ def create_quantizer_insertion_command( quantizer_config: QuantizerConfig, parameters: FakeQuantizeParameters, ) -> FXApplyTransformationCommand: - quantizer = FXMinMaxAlgoBackend._create_quantizer( + torch_qdq_params = FXMinMaxAlgoBackend._get_torch_qdq_params( quantizer_config, parameters, target_point.is_weight_target_point() ) - transformation = 
qdq_insertion_transformation_builder(quantizer, [target_point]) + transformation = qdq_insertion_transformation_builder(torch_qdq_params, [target_point]) return FXApplyTransformationCommand(transformation) @staticmethod @@ -271,13 +256,13 @@ def create_unified_scales_quantizers_insertion_commands( quantizer_config: QuantizerConfig, parameters: FakeQuantizeParameters, ) -> list[PTSharedFnInsertionCommand]: - quantizer = FXMinMaxAlgoBackend._create_quantizer( + torch_qdq_params = FXMinMaxAlgoBackend._get_torch_qdq_params( quantizer_config, parameters, target_points[0].is_weight_target_point() ) transformations = [] for tp in target_points: - transformation = qdq_insertion_transformation_builder(quantizer, [tp]) + transformation = qdq_insertion_transformation_builder(torch_qdq_params, [tp]) transformations.append(FXApplyTransformationCommand(transformation)) return transformations diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/mobilenet_v3_small.dot b/tests/torch2/data/fx/XNNPACKQuantizer/mobilenet_v3_small.dot deleted file mode 100644 index 14a75494691..00000000000 --- a/tests/torch2/data/fx/XNNPACKQuantizer/mobilenet_v3_small.dot +++ /dev/null @@ -1,1056 +0,0 @@ -strict digraph { -"0 features_1_block_1_fc1_bias" [id=0, type="get_attr"]; -"1 features_1_block_1_fc2_bias" [id=1, type="get_attr"]; -"2 features_4_block_2_fc1_bias" [id=2, type="get_attr"]; -"3 features_4_block_2_fc2_bias" [id=3, type="get_attr"]; -"4 features_5_block_2_fc1_bias" [id=4, type="get_attr"]; -"5 features_5_block_2_fc2_bias" [id=5, type="get_attr"]; -"6 features_6_block_2_fc1_bias" [id=6, type="get_attr"]; -"7 features_6_block_2_fc2_bias" [id=7, type="get_attr"]; -"8 features_7_block_2_fc1_bias" [id=8, type="get_attr"]; -"9 features_7_block_2_fc2_bias" [id=9, type="get_attr"]; -"10 features_8_block_2_fc1_bias" [id=10, type="get_attr"]; -"11 features_8_block_2_fc2_bias" [id=11, type="get_attr"]; -"12 features_9_block_2_fc1_bias" [id=12, type="get_attr"]; -"13 features_9_block_2_fc2_bias" 
[id=13, type="get_attr"]; -"14 features_10_block_2_fc1_bias" [id=14, type="get_attr"]; -"15 features_10_block_2_fc2_bias" [id=15, type="get_attr"]; -"16 features_11_block_2_fc1_bias" [id=16, type="get_attr"]; -"17 features_11_block_2_fc2_bias" [id=17, type="get_attr"]; -"18 classifier_0_bias" [id=18, type="get_attr"]; -"19 classifier_3_bias" [id=19, type="get_attr"]; -"20 x" [id=20, type=input]; -"21 quantize_per_tensor_0" [id=21, type="quantize_per_tensor"]; -"22 dequantize_per_tensor_1" [id=22, type="dequantize_per_tensor"]; -"23 features_0_0_weight_bias" [id=23, type="get_attr"]; -"24 _frozen_param0" [id=24, type="get_attr"]; -"25 dequantize_per_tensor_2" [id=25, type="dequantize_per_tensor"]; -"26 conv2d" [id=26, type=conv2d]; -"27 quantize_per_tensor_3" [id=27, type="quantize_per_tensor"]; -"28 dequantize_per_tensor_4" [id=28, type="dequantize_per_tensor"]; -"29 hardswish_" [id=29, type="hardswish_"]; -"30 quantize_per_tensor_5" [id=30, type="quantize_per_tensor"]; -"31 dequantize_per_tensor_6" [id=31, type="dequantize_per_tensor"]; -"32 features_1_block_0_0_weight_bias" [id=32, type="get_attr"]; -"33 _frozen_param1" [id=33, type="get_attr"]; -"34 dequantize_per_tensor_7" [id=34, type="dequantize_per_tensor"]; -"35 conv2d_1" [id=35, type=conv2d]; -"36 relu_" [id=36, type="relu_"]; -"37 quantize_per_tensor_8" [id=37, type="quantize_per_tensor"]; -"38 dequantize_per_tensor_9" [id=38, type="dequantize_per_tensor"]; -"39 dequantize_per_tensor_10" [id=39, type="dequantize_per_tensor"]; -"40 adaptive_avg_pool2d" [id=40, type="adaptive_avg_pool2d"]; -"41 quantize_per_tensor_11" [id=41, type="quantize_per_tensor"]; -"42 dequantize_per_tensor_12" [id=42, type="dequantize_per_tensor"]; -"43 _frozen_param2" [id=43, type="get_attr"]; -"44 dequantize_per_tensor_13" [id=44, type="dequantize_per_tensor"]; -"45 conv2d_2" [id=45, type=conv2d]; -"46 relu" [id=46, type=relu]; -"47 quantize_per_tensor_14" [id=47, type="quantize_per_tensor"]; -"48 dequantize_per_tensor_15" [id=48, 
type="dequantize_per_tensor"]; -"49 _frozen_param3" [id=49, type="get_attr"]; -"50 dequantize_per_tensor_16" [id=50, type="dequantize_per_tensor"]; -"51 conv2d_3" [id=51, type=conv2d]; -"52 quantize_per_tensor_17" [id=52, type="quantize_per_tensor"]; -"53 dequantize_per_tensor_18" [id=53, type="dequantize_per_tensor"]; -"54 hardsigmoid" [id=54, type=hardsigmoid]; -"55 quantize_per_tensor_19" [id=55, type="quantize_per_tensor"]; -"56 dequantize_per_tensor_20" [id=56, type="dequantize_per_tensor"]; -"57 mul" [id=57, type=mul]; -"58 quantize_per_tensor_21" [id=58, type="quantize_per_tensor"]; -"59 dequantize_per_tensor_22" [id=59, type="dequantize_per_tensor"]; -"60 features_1_block_2_0_weight_bias" [id=60, type="get_attr"]; -"61 _frozen_param4" [id=61, type="get_attr"]; -"62 dequantize_per_tensor_23" [id=62, type="dequantize_per_tensor"]; -"63 conv2d_4" [id=63, type=conv2d]; -"64 quantize_per_tensor_24" [id=64, type="quantize_per_tensor"]; -"65 dequantize_per_tensor_25" [id=65, type="dequantize_per_tensor"]; -"66 features_2_block_0_0_weight_bias" [id=66, type="get_attr"]; -"67 _frozen_param5" [id=67, type="get_attr"]; -"68 dequantize_per_tensor_26" [id=68, type="dequantize_per_tensor"]; -"69 conv2d_5" [id=69, type=conv2d]; -"70 relu__1" [id=70, type="relu_"]; -"71 quantize_per_tensor_27" [id=71, type="quantize_per_tensor"]; -"72 dequantize_per_tensor_28" [id=72, type="dequantize_per_tensor"]; -"73 features_2_block_1_0_weight_bias" [id=73, type="get_attr"]; -"74 _frozen_param6" [id=74, type="get_attr"]; -"75 dequantize_per_tensor_29" [id=75, type="dequantize_per_tensor"]; -"76 conv2d_6" [id=76, type=conv2d]; -"77 relu__2" [id=77, type="relu_"]; -"78 quantize_per_tensor_30" [id=78, type="quantize_per_tensor"]; -"79 dequantize_per_tensor_31" [id=79, type="dequantize_per_tensor"]; -"80 features_2_block_2_0_weight_bias" [id=80, type="get_attr"]; -"81 _frozen_param7" [id=81, type="get_attr"]; -"82 dequantize_per_tensor_32" [id=82, type="dequantize_per_tensor"]; -"83 
conv2d_7" [id=83, type=conv2d]; -"84 quantize_per_tensor_33" [id=84, type="quantize_per_tensor"]; -"85 dequantize_per_tensor_34" [id=85, type="dequantize_per_tensor"]; -"86 dequantize_per_tensor_35" [id=86, type="dequantize_per_tensor"]; -"87 features_3_block_0_0_weight_bias" [id=87, type="get_attr"]; -"88 _frozen_param8" [id=88, type="get_attr"]; -"89 dequantize_per_tensor_36" [id=89, type="dequantize_per_tensor"]; -"90 conv2d_8" [id=90, type=conv2d]; -"91 relu__3" [id=91, type="relu_"]; -"92 quantize_per_tensor_37" [id=92, type="quantize_per_tensor"]; -"93 dequantize_per_tensor_38" [id=93, type="dequantize_per_tensor"]; -"94 features_3_block_1_0_weight_bias" [id=94, type="get_attr"]; -"95 _frozen_param9" [id=95, type="get_attr"]; -"96 dequantize_per_tensor_39" [id=96, type="dequantize_per_tensor"]; -"97 conv2d_9" [id=97, type=conv2d]; -"98 relu__4" [id=98, type="relu_"]; -"99 quantize_per_tensor_40" [id=99, type="quantize_per_tensor"]; -"100 dequantize_per_tensor_41" [id=100, type="dequantize_per_tensor"]; -"101 features_3_block_2_0_weight_bias" [id=101, type="get_attr"]; -"102 _frozen_param10" [id=102, type="get_attr"]; -"103 dequantize_per_tensor_42" [id=103, type="dequantize_per_tensor"]; -"104 conv2d_10" [id=104, type=conv2d]; -"105 quantize_per_tensor_43" [id=105, type="quantize_per_tensor"]; -"106 dequantize_per_tensor_44" [id=106, type="dequantize_per_tensor"]; -"107 add_" [id=107, type="add_"]; -"108 quantize_per_tensor_45" [id=108, type="quantize_per_tensor"]; -"109 dequantize_per_tensor_46" [id=109, type="dequantize_per_tensor"]; -"110 features_4_block_0_0_weight_bias" [id=110, type="get_attr"]; -"111 _frozen_param11" [id=111, type="get_attr"]; -"112 dequantize_per_tensor_47" [id=112, type="dequantize_per_tensor"]; -"113 conv2d_11" [id=113, type=conv2d]; -"114 quantize_per_tensor_48" [id=114, type="quantize_per_tensor"]; -"115 dequantize_per_tensor_49" [id=115, type="dequantize_per_tensor"]; -"116 hardswish__1" [id=116, type="hardswish_"]; -"117 
quantize_per_tensor_50" [id=117, type="quantize_per_tensor"]; -"118 dequantize_per_tensor_51" [id=118, type="dequantize_per_tensor"]; -"119 features_4_block_1_0_weight_bias" [id=119, type="get_attr"]; -"120 _frozen_param12" [id=120, type="get_attr"]; -"121 dequantize_per_tensor_52" [id=121, type="dequantize_per_tensor"]; -"122 conv2d_12" [id=122, type=conv2d]; -"123 quantize_per_tensor_53" [id=123, type="quantize_per_tensor"]; -"124 dequantize_per_tensor_54" [id=124, type="dequantize_per_tensor"]; -"125 hardswish__2" [id=125, type="hardswish_"]; -"126 quantize_per_tensor_55" [id=126, type="quantize_per_tensor"]; -"127 dequantize_per_tensor_56" [id=127, type="dequantize_per_tensor"]; -"128 dequantize_per_tensor_57" [id=128, type="dequantize_per_tensor"]; -"129 adaptive_avg_pool2d_1" [id=129, type="adaptive_avg_pool2d"]; -"130 quantize_per_tensor_58" [id=130, type="quantize_per_tensor"]; -"131 dequantize_per_tensor_59" [id=131, type="dequantize_per_tensor"]; -"132 _frozen_param13" [id=132, type="get_attr"]; -"133 dequantize_per_tensor_60" [id=133, type="dequantize_per_tensor"]; -"134 conv2d_13" [id=134, type=conv2d]; -"135 relu_1" [id=135, type=relu]; -"136 quantize_per_tensor_61" [id=136, type="quantize_per_tensor"]; -"137 dequantize_per_tensor_62" [id=137, type="dequantize_per_tensor"]; -"138 _frozen_param14" [id=138, type="get_attr"]; -"139 dequantize_per_tensor_63" [id=139, type="dequantize_per_tensor"]; -"140 conv2d_14" [id=140, type=conv2d]; -"141 quantize_per_tensor_64" [id=141, type="quantize_per_tensor"]; -"142 dequantize_per_tensor_65" [id=142, type="dequantize_per_tensor"]; -"143 hardsigmoid_1" [id=143, type=hardsigmoid]; -"144 quantize_per_tensor_66" [id=144, type="quantize_per_tensor"]; -"145 dequantize_per_tensor_67" [id=145, type="dequantize_per_tensor"]; -"146 mul_1" [id=146, type=mul]; -"147 quantize_per_tensor_68" [id=147, type="quantize_per_tensor"]; -"148 dequantize_per_tensor_69" [id=148, type="dequantize_per_tensor"]; -"149 
features_4_block_3_0_weight_bias" [id=149, type="get_attr"]; -"150 _frozen_param15" [id=150, type="get_attr"]; -"151 dequantize_per_tensor_70" [id=151, type="dequantize_per_tensor"]; -"152 conv2d_15" [id=152, type=conv2d]; -"153 quantize_per_tensor_71" [id=153, type="quantize_per_tensor"]; -"154 dequantize_per_tensor_72" [id=154, type="dequantize_per_tensor"]; -"155 dequantize_per_tensor_73" [id=155, type="dequantize_per_tensor"]; -"156 features_5_block_0_0_weight_bias" [id=156, type="get_attr"]; -"157 _frozen_param16" [id=157, type="get_attr"]; -"158 dequantize_per_tensor_74" [id=158, type="dequantize_per_tensor"]; -"159 conv2d_16" [id=159, type=conv2d]; -"160 quantize_per_tensor_75" [id=160, type="quantize_per_tensor"]; -"161 dequantize_per_tensor_76" [id=161, type="dequantize_per_tensor"]; -"162 hardswish__3" [id=162, type="hardswish_"]; -"163 quantize_per_tensor_77" [id=163, type="quantize_per_tensor"]; -"164 dequantize_per_tensor_78" [id=164, type="dequantize_per_tensor"]; -"165 features_5_block_1_0_weight_bias" [id=165, type="get_attr"]; -"166 _frozen_param17" [id=166, type="get_attr"]; -"167 dequantize_per_tensor_79" [id=167, type="dequantize_per_tensor"]; -"168 conv2d_17" [id=168, type=conv2d]; -"169 quantize_per_tensor_80" [id=169, type="quantize_per_tensor"]; -"170 dequantize_per_tensor_81" [id=170, type="dequantize_per_tensor"]; -"171 hardswish__4" [id=171, type="hardswish_"]; -"172 quantize_per_tensor_82" [id=172, type="quantize_per_tensor"]; -"173 dequantize_per_tensor_83" [id=173, type="dequantize_per_tensor"]; -"174 dequantize_per_tensor_84" [id=174, type="dequantize_per_tensor"]; -"175 adaptive_avg_pool2d_2" [id=175, type="adaptive_avg_pool2d"]; -"176 quantize_per_tensor_85" [id=176, type="quantize_per_tensor"]; -"177 dequantize_per_tensor_86" [id=177, type="dequantize_per_tensor"]; -"178 _frozen_param18" [id=178, type="get_attr"]; -"179 dequantize_per_tensor_87" [id=179, type="dequantize_per_tensor"]; -"180 conv2d_18" [id=180, type=conv2d]; -"181 
relu_2" [id=181, type=relu]; -"182 quantize_per_tensor_88" [id=182, type="quantize_per_tensor"]; -"183 dequantize_per_tensor_89" [id=183, type="dequantize_per_tensor"]; -"184 _frozen_param19" [id=184, type="get_attr"]; -"185 dequantize_per_tensor_90" [id=185, type="dequantize_per_tensor"]; -"186 conv2d_19" [id=186, type=conv2d]; -"187 quantize_per_tensor_91" [id=187, type="quantize_per_tensor"]; -"188 dequantize_per_tensor_92" [id=188, type="dequantize_per_tensor"]; -"189 hardsigmoid_2" [id=189, type=hardsigmoid]; -"190 quantize_per_tensor_93" [id=190, type="quantize_per_tensor"]; -"191 dequantize_per_tensor_94" [id=191, type="dequantize_per_tensor"]; -"192 mul_2" [id=192, type=mul]; -"193 quantize_per_tensor_95" [id=193, type="quantize_per_tensor"]; -"194 dequantize_per_tensor_96" [id=194, type="dequantize_per_tensor"]; -"195 features_5_block_3_0_weight_bias" [id=195, type="get_attr"]; -"196 _frozen_param20" [id=196, type="get_attr"]; -"197 dequantize_per_tensor_97" [id=197, type="dequantize_per_tensor"]; -"198 conv2d_20" [id=198, type=conv2d]; -"199 quantize_per_tensor_98" [id=199, type="quantize_per_tensor"]; -"200 dequantize_per_tensor_99" [id=200, type="dequantize_per_tensor"]; -"201 add__1" [id=201, type="add_"]; -"202 quantize_per_tensor_100" [id=202, type="quantize_per_tensor"]; -"203 dequantize_per_tensor_101" [id=203, type="dequantize_per_tensor"]; -"204 dequantize_per_tensor_102" [id=204, type="dequantize_per_tensor"]; -"205 features_6_block_0_0_weight_bias" [id=205, type="get_attr"]; -"206 _frozen_param21" [id=206, type="get_attr"]; -"207 dequantize_per_tensor_103" [id=207, type="dequantize_per_tensor"]; -"208 conv2d_21" [id=208, type=conv2d]; -"209 quantize_per_tensor_104" [id=209, type="quantize_per_tensor"]; -"210 dequantize_per_tensor_105" [id=210, type="dequantize_per_tensor"]; -"211 hardswish__5" [id=211, type="hardswish_"]; -"212 quantize_per_tensor_106" [id=212, type="quantize_per_tensor"]; -"213 dequantize_per_tensor_107" [id=213, 
type="dequantize_per_tensor"]; -"214 features_6_block_1_0_weight_bias" [id=214, type="get_attr"]; -"215 _frozen_param22" [id=215, type="get_attr"]; -"216 dequantize_per_tensor_108" [id=216, type="dequantize_per_tensor"]; -"217 conv2d_22" [id=217, type=conv2d]; -"218 quantize_per_tensor_109" [id=218, type="quantize_per_tensor"]; -"219 dequantize_per_tensor_110" [id=219, type="dequantize_per_tensor"]; -"220 hardswish__6" [id=220, type="hardswish_"]; -"221 quantize_per_tensor_111" [id=221, type="quantize_per_tensor"]; -"222 dequantize_per_tensor_112" [id=222, type="dequantize_per_tensor"]; -"223 dequantize_per_tensor_113" [id=223, type="dequantize_per_tensor"]; -"224 adaptive_avg_pool2d_3" [id=224, type="adaptive_avg_pool2d"]; -"225 quantize_per_tensor_114" [id=225, type="quantize_per_tensor"]; -"226 dequantize_per_tensor_115" [id=226, type="dequantize_per_tensor"]; -"227 _frozen_param23" [id=227, type="get_attr"]; -"228 dequantize_per_tensor_116" [id=228, type="dequantize_per_tensor"]; -"229 conv2d_23" [id=229, type=conv2d]; -"230 relu_3" [id=230, type=relu]; -"231 quantize_per_tensor_117" [id=231, type="quantize_per_tensor"]; -"232 dequantize_per_tensor_118" [id=232, type="dequantize_per_tensor"]; -"233 _frozen_param24" [id=233, type="get_attr"]; -"234 dequantize_per_tensor_119" [id=234, type="dequantize_per_tensor"]; -"235 conv2d_24" [id=235, type=conv2d]; -"236 quantize_per_tensor_120" [id=236, type="quantize_per_tensor"]; -"237 dequantize_per_tensor_121" [id=237, type="dequantize_per_tensor"]; -"238 hardsigmoid_3" [id=238, type=hardsigmoid]; -"239 quantize_per_tensor_122" [id=239, type="quantize_per_tensor"]; -"240 dequantize_per_tensor_123" [id=240, type="dequantize_per_tensor"]; -"241 mul_3" [id=241, type=mul]; -"242 quantize_per_tensor_124" [id=242, type="quantize_per_tensor"]; -"243 dequantize_per_tensor_125" [id=243, type="dequantize_per_tensor"]; -"244 features_6_block_3_0_weight_bias" [id=244, type="get_attr"]; -"245 _frozen_param25" [id=245, 
type="get_attr"]; -"246 dequantize_per_tensor_126" [id=246, type="dequantize_per_tensor"]; -"247 conv2d_25" [id=247, type=conv2d]; -"248 quantize_per_tensor_127" [id=248, type="quantize_per_tensor"]; -"249 dequantize_per_tensor_128" [id=249, type="dequantize_per_tensor"]; -"250 add__2" [id=250, type="add_"]; -"251 quantize_per_tensor_129" [id=251, type="quantize_per_tensor"]; -"252 dequantize_per_tensor_130" [id=252, type="dequantize_per_tensor"]; -"253 features_7_block_0_0_weight_bias" [id=253, type="get_attr"]; -"254 _frozen_param26" [id=254, type="get_attr"]; -"255 dequantize_per_tensor_131" [id=255, type="dequantize_per_tensor"]; -"256 conv2d_26" [id=256, type=conv2d]; -"257 quantize_per_tensor_132" [id=257, type="quantize_per_tensor"]; -"258 dequantize_per_tensor_133" [id=258, type="dequantize_per_tensor"]; -"259 hardswish__7" [id=259, type="hardswish_"]; -"260 quantize_per_tensor_134" [id=260, type="quantize_per_tensor"]; -"261 dequantize_per_tensor_135" [id=261, type="dequantize_per_tensor"]; -"262 features_7_block_1_0_weight_bias" [id=262, type="get_attr"]; -"263 _frozen_param27" [id=263, type="get_attr"]; -"264 dequantize_per_tensor_136" [id=264, type="dequantize_per_tensor"]; -"265 conv2d_27" [id=265, type=conv2d]; -"266 quantize_per_tensor_137" [id=266, type="quantize_per_tensor"]; -"267 dequantize_per_tensor_138" [id=267, type="dequantize_per_tensor"]; -"268 hardswish__8" [id=268, type="hardswish_"]; -"269 quantize_per_tensor_139" [id=269, type="quantize_per_tensor"]; -"270 dequantize_per_tensor_140" [id=270, type="dequantize_per_tensor"]; -"271 dequantize_per_tensor_141" [id=271, type="dequantize_per_tensor"]; -"272 adaptive_avg_pool2d_4" [id=272, type="adaptive_avg_pool2d"]; -"273 quantize_per_tensor_142" [id=273, type="quantize_per_tensor"]; -"274 dequantize_per_tensor_143" [id=274, type="dequantize_per_tensor"]; -"275 _frozen_param28" [id=275, type="get_attr"]; -"276 dequantize_per_tensor_144" [id=276, type="dequantize_per_tensor"]; -"277 conv2d_28" 
[id=277, type=conv2d]; -"278 relu_4" [id=278, type=relu]; -"279 quantize_per_tensor_145" [id=279, type="quantize_per_tensor"]; -"280 dequantize_per_tensor_146" [id=280, type="dequantize_per_tensor"]; -"281 _frozen_param29" [id=281, type="get_attr"]; -"282 dequantize_per_tensor_147" [id=282, type="dequantize_per_tensor"]; -"283 conv2d_29" [id=283, type=conv2d]; -"284 quantize_per_tensor_148" [id=284, type="quantize_per_tensor"]; -"285 dequantize_per_tensor_149" [id=285, type="dequantize_per_tensor"]; -"286 hardsigmoid_4" [id=286, type=hardsigmoid]; -"287 quantize_per_tensor_150" [id=287, type="quantize_per_tensor"]; -"288 dequantize_per_tensor_151" [id=288, type="dequantize_per_tensor"]; -"289 mul_4" [id=289, type=mul]; -"290 quantize_per_tensor_152" [id=290, type="quantize_per_tensor"]; -"291 dequantize_per_tensor_153" [id=291, type="dequantize_per_tensor"]; -"292 features_7_block_3_0_weight_bias" [id=292, type="get_attr"]; -"293 _frozen_param30" [id=293, type="get_attr"]; -"294 dequantize_per_tensor_154" [id=294, type="dequantize_per_tensor"]; -"295 conv2d_30" [id=295, type=conv2d]; -"296 quantize_per_tensor_155" [id=296, type="quantize_per_tensor"]; -"297 dequantize_per_tensor_156" [id=297, type="dequantize_per_tensor"]; -"298 dequantize_per_tensor_157" [id=298, type="dequantize_per_tensor"]; -"299 features_8_block_0_0_weight_bias" [id=299, type="get_attr"]; -"300 _frozen_param31" [id=300, type="get_attr"]; -"301 dequantize_per_tensor_158" [id=301, type="dequantize_per_tensor"]; -"302 conv2d_31" [id=302, type=conv2d]; -"303 quantize_per_tensor_159" [id=303, type="quantize_per_tensor"]; -"304 dequantize_per_tensor_160" [id=304, type="dequantize_per_tensor"]; -"305 hardswish__9" [id=305, type="hardswish_"]; -"306 quantize_per_tensor_161" [id=306, type="quantize_per_tensor"]; -"307 dequantize_per_tensor_162" [id=307, type="dequantize_per_tensor"]; -"308 features_8_block_1_0_weight_bias" [id=308, type="get_attr"]; -"309 _frozen_param32" [id=309, type="get_attr"]; 
-"310 dequantize_per_tensor_163" [id=310, type="dequantize_per_tensor"]; -"311 conv2d_32" [id=311, type=conv2d]; -"312 quantize_per_tensor_164" [id=312, type="quantize_per_tensor"]; -"313 dequantize_per_tensor_165" [id=313, type="dequantize_per_tensor"]; -"314 hardswish__10" [id=314, type="hardswish_"]; -"315 quantize_per_tensor_166" [id=315, type="quantize_per_tensor"]; -"316 dequantize_per_tensor_167" [id=316, type="dequantize_per_tensor"]; -"317 dequantize_per_tensor_168" [id=317, type="dequantize_per_tensor"]; -"318 adaptive_avg_pool2d_5" [id=318, type="adaptive_avg_pool2d"]; -"319 quantize_per_tensor_169" [id=319, type="quantize_per_tensor"]; -"320 dequantize_per_tensor_170" [id=320, type="dequantize_per_tensor"]; -"321 _frozen_param33" [id=321, type="get_attr"]; -"322 dequantize_per_tensor_171" [id=322, type="dequantize_per_tensor"]; -"323 conv2d_33" [id=323, type=conv2d]; -"324 relu_5" [id=324, type=relu]; -"325 quantize_per_tensor_172" [id=325, type="quantize_per_tensor"]; -"326 dequantize_per_tensor_173" [id=326, type="dequantize_per_tensor"]; -"327 _frozen_param34" [id=327, type="get_attr"]; -"328 dequantize_per_tensor_174" [id=328, type="dequantize_per_tensor"]; -"329 conv2d_34" [id=329, type=conv2d]; -"330 quantize_per_tensor_175" [id=330, type="quantize_per_tensor"]; -"331 dequantize_per_tensor_176" [id=331, type="dequantize_per_tensor"]; -"332 hardsigmoid_5" [id=332, type=hardsigmoid]; -"333 quantize_per_tensor_177" [id=333, type="quantize_per_tensor"]; -"334 dequantize_per_tensor_178" [id=334, type="dequantize_per_tensor"]; -"335 mul_5" [id=335, type=mul]; -"336 quantize_per_tensor_179" [id=336, type="quantize_per_tensor"]; -"337 dequantize_per_tensor_180" [id=337, type="dequantize_per_tensor"]; -"338 features_8_block_3_0_weight_bias" [id=338, type="get_attr"]; -"339 _frozen_param35" [id=339, type="get_attr"]; -"340 dequantize_per_tensor_181" [id=340, type="dequantize_per_tensor"]; -"341 conv2d_35" [id=341, type=conv2d]; -"342 
quantize_per_tensor_182" [id=342, type="quantize_per_tensor"]; -"343 dequantize_per_tensor_183" [id=343, type="dequantize_per_tensor"]; -"344 add__3" [id=344, type="add_"]; -"345 quantize_per_tensor_184" [id=345, type="quantize_per_tensor"]; -"346 dequantize_per_tensor_185" [id=346, type="dequantize_per_tensor"]; -"347 features_9_block_0_0_weight_bias" [id=347, type="get_attr"]; -"348 _frozen_param36" [id=348, type="get_attr"]; -"349 dequantize_per_tensor_186" [id=349, type="dequantize_per_tensor"]; -"350 conv2d_36" [id=350, type=conv2d]; -"351 quantize_per_tensor_187" [id=351, type="quantize_per_tensor"]; -"352 dequantize_per_tensor_188" [id=352, type="dequantize_per_tensor"]; -"353 hardswish__11" [id=353, type="hardswish_"]; -"354 quantize_per_tensor_189" [id=354, type="quantize_per_tensor"]; -"355 dequantize_per_tensor_190" [id=355, type="dequantize_per_tensor"]; -"356 features_9_block_1_0_weight_bias" [id=356, type="get_attr"]; -"357 _frozen_param37" [id=357, type="get_attr"]; -"358 dequantize_per_tensor_191" [id=358, type="dequantize_per_tensor"]; -"359 conv2d_37" [id=359, type=conv2d]; -"360 quantize_per_tensor_192" [id=360, type="quantize_per_tensor"]; -"361 dequantize_per_tensor_193" [id=361, type="dequantize_per_tensor"]; -"362 hardswish__12" [id=362, type="hardswish_"]; -"363 quantize_per_tensor_194" [id=363, type="quantize_per_tensor"]; -"364 dequantize_per_tensor_195" [id=364, type="dequantize_per_tensor"]; -"365 dequantize_per_tensor_196" [id=365, type="dequantize_per_tensor"]; -"366 adaptive_avg_pool2d_6" [id=366, type="adaptive_avg_pool2d"]; -"367 quantize_per_tensor_197" [id=367, type="quantize_per_tensor"]; -"368 dequantize_per_tensor_198" [id=368, type="dequantize_per_tensor"]; -"369 _frozen_param38" [id=369, type="get_attr"]; -"370 dequantize_per_tensor_199" [id=370, type="dequantize_per_tensor"]; -"371 conv2d_38" [id=371, type=conv2d]; -"372 relu_6" [id=372, type=relu]; -"373 quantize_per_tensor_200" [id=373, type="quantize_per_tensor"]; -"374 
dequantize_per_tensor_201" [id=374, type="dequantize_per_tensor"]; -"375 _frozen_param39" [id=375, type="get_attr"]; -"376 dequantize_per_tensor_202" [id=376, type="dequantize_per_tensor"]; -"377 conv2d_39" [id=377, type=conv2d]; -"378 quantize_per_tensor_203" [id=378, type="quantize_per_tensor"]; -"379 dequantize_per_tensor_204" [id=379, type="dequantize_per_tensor"]; -"380 hardsigmoid_6" [id=380, type=hardsigmoid]; -"381 quantize_per_tensor_205" [id=381, type="quantize_per_tensor"]; -"382 dequantize_per_tensor_206" [id=382, type="dequantize_per_tensor"]; -"383 mul_6" [id=383, type=mul]; -"384 quantize_per_tensor_207" [id=384, type="quantize_per_tensor"]; -"385 dequantize_per_tensor_208" [id=385, type="dequantize_per_tensor"]; -"386 features_9_block_3_0_weight_bias" [id=386, type="get_attr"]; -"387 _frozen_param40" [id=387, type="get_attr"]; -"388 dequantize_per_tensor_209" [id=388, type="dequantize_per_tensor"]; -"389 conv2d_40" [id=389, type=conv2d]; -"390 quantize_per_tensor_210" [id=390, type="quantize_per_tensor"]; -"391 dequantize_per_tensor_211" [id=391, type="dequantize_per_tensor"]; -"392 dequantize_per_tensor_212" [id=392, type="dequantize_per_tensor"]; -"393 features_10_block_0_0_weight_bias" [id=393, type="get_attr"]; -"394 _frozen_param41" [id=394, type="get_attr"]; -"395 dequantize_per_tensor_213" [id=395, type="dequantize_per_tensor"]; -"396 conv2d_41" [id=396, type=conv2d]; -"397 quantize_per_tensor_214" [id=397, type="quantize_per_tensor"]; -"398 dequantize_per_tensor_215" [id=398, type="dequantize_per_tensor"]; -"399 hardswish__13" [id=399, type="hardswish_"]; -"400 quantize_per_tensor_216" [id=400, type="quantize_per_tensor"]; -"401 dequantize_per_tensor_217" [id=401, type="dequantize_per_tensor"]; -"402 features_10_block_1_0_weight_bias" [id=402, type="get_attr"]; -"403 _frozen_param42" [id=403, type="get_attr"]; -"404 dequantize_per_tensor_218" [id=404, type="dequantize_per_tensor"]; -"405 conv2d_42" [id=405, type=conv2d]; -"406 
quantize_per_tensor_219" [id=406, type="quantize_per_tensor"]; -"407 dequantize_per_tensor_220" [id=407, type="dequantize_per_tensor"]; -"408 hardswish__14" [id=408, type="hardswish_"]; -"409 quantize_per_tensor_221" [id=409, type="quantize_per_tensor"]; -"410 dequantize_per_tensor_222" [id=410, type="dequantize_per_tensor"]; -"411 dequantize_per_tensor_223" [id=411, type="dequantize_per_tensor"]; -"412 adaptive_avg_pool2d_7" [id=412, type="adaptive_avg_pool2d"]; -"413 quantize_per_tensor_224" [id=413, type="quantize_per_tensor"]; -"414 dequantize_per_tensor_225" [id=414, type="dequantize_per_tensor"]; -"415 _frozen_param43" [id=415, type="get_attr"]; -"416 dequantize_per_tensor_226" [id=416, type="dequantize_per_tensor"]; -"417 conv2d_43" [id=417, type=conv2d]; -"418 relu_7" [id=418, type=relu]; -"419 quantize_per_tensor_227" [id=419, type="quantize_per_tensor"]; -"420 dequantize_per_tensor_228" [id=420, type="dequantize_per_tensor"]; -"421 _frozen_param44" [id=421, type="get_attr"]; -"422 dequantize_per_tensor_229" [id=422, type="dequantize_per_tensor"]; -"423 conv2d_44" [id=423, type=conv2d]; -"424 quantize_per_tensor_230" [id=424, type="quantize_per_tensor"]; -"425 dequantize_per_tensor_231" [id=425, type="dequantize_per_tensor"]; -"426 hardsigmoid_7" [id=426, type=hardsigmoid]; -"427 quantize_per_tensor_232" [id=427, type="quantize_per_tensor"]; -"428 dequantize_per_tensor_233" [id=428, type="dequantize_per_tensor"]; -"429 mul_7" [id=429, type=mul]; -"430 quantize_per_tensor_234" [id=430, type="quantize_per_tensor"]; -"431 dequantize_per_tensor_235" [id=431, type="dequantize_per_tensor"]; -"432 features_10_block_3_0_weight_bias" [id=432, type="get_attr"]; -"433 _frozen_param45" [id=433, type="get_attr"]; -"434 dequantize_per_tensor_236" [id=434, type="dequantize_per_tensor"]; -"435 conv2d_45" [id=435, type=conv2d]; -"436 quantize_per_tensor_237" [id=436, type="quantize_per_tensor"]; -"437 dequantize_per_tensor_238" [id=437, type="dequantize_per_tensor"]; -"438 
add__4" [id=438, type="add_"]; -"439 quantize_per_tensor_239" [id=439, type="quantize_per_tensor"]; -"440 dequantize_per_tensor_240" [id=440, type="dequantize_per_tensor"]; -"441 dequantize_per_tensor_241" [id=441, type="dequantize_per_tensor"]; -"442 features_11_block_0_0_weight_bias" [id=442, type="get_attr"]; -"443 _frozen_param46" [id=443, type="get_attr"]; -"444 dequantize_per_tensor_242" [id=444, type="dequantize_per_tensor"]; -"445 conv2d_46" [id=445, type=conv2d]; -"446 quantize_per_tensor_243" [id=446, type="quantize_per_tensor"]; -"447 dequantize_per_tensor_244" [id=447, type="dequantize_per_tensor"]; -"448 hardswish__15" [id=448, type="hardswish_"]; -"449 quantize_per_tensor_245" [id=449, type="quantize_per_tensor"]; -"450 dequantize_per_tensor_246" [id=450, type="dequantize_per_tensor"]; -"451 features_11_block_1_0_weight_bias" [id=451, type="get_attr"]; -"452 _frozen_param47" [id=452, type="get_attr"]; -"453 dequantize_per_tensor_247" [id=453, type="dequantize_per_tensor"]; -"454 conv2d_47" [id=454, type=conv2d]; -"455 quantize_per_tensor_248" [id=455, type="quantize_per_tensor"]; -"456 dequantize_per_tensor_249" [id=456, type="dequantize_per_tensor"]; -"457 hardswish__16" [id=457, type="hardswish_"]; -"458 quantize_per_tensor_250" [id=458, type="quantize_per_tensor"]; -"459 dequantize_per_tensor_251" [id=459, type="dequantize_per_tensor"]; -"460 dequantize_per_tensor_252" [id=460, type="dequantize_per_tensor"]; -"461 adaptive_avg_pool2d_8" [id=461, type="adaptive_avg_pool2d"]; -"462 quantize_per_tensor_253" [id=462, type="quantize_per_tensor"]; -"463 dequantize_per_tensor_254" [id=463, type="dequantize_per_tensor"]; -"464 _frozen_param48" [id=464, type="get_attr"]; -"465 dequantize_per_tensor_255" [id=465, type="dequantize_per_tensor"]; -"466 conv2d_48" [id=466, type=conv2d]; -"467 relu_8" [id=467, type=relu]; -"468 quantize_per_tensor_256" [id=468, type="quantize_per_tensor"]; -"469 dequantize_per_tensor_257" [id=469, type="dequantize_per_tensor"]; 
-"470 _frozen_param49" [id=470, type="get_attr"]; -"471 dequantize_per_tensor_258" [id=471, type="dequantize_per_tensor"]; -"472 conv2d_49" [id=472, type=conv2d]; -"473 quantize_per_tensor_259" [id=473, type="quantize_per_tensor"]; -"474 dequantize_per_tensor_260" [id=474, type="dequantize_per_tensor"]; -"475 hardsigmoid_8" [id=475, type=hardsigmoid]; -"476 quantize_per_tensor_261" [id=476, type="quantize_per_tensor"]; -"477 dequantize_per_tensor_262" [id=477, type="dequantize_per_tensor"]; -"478 mul_8" [id=478, type=mul]; -"479 quantize_per_tensor_263" [id=479, type="quantize_per_tensor"]; -"480 dequantize_per_tensor_264" [id=480, type="dequantize_per_tensor"]; -"481 features_11_block_3_0_weight_bias" [id=481, type="get_attr"]; -"482 _frozen_param50" [id=482, type="get_attr"]; -"483 dequantize_per_tensor_265" [id=483, type="dequantize_per_tensor"]; -"484 conv2d_50" [id=484, type=conv2d]; -"485 quantize_per_tensor_266" [id=485, type="quantize_per_tensor"]; -"486 dequantize_per_tensor_267" [id=486, type="dequantize_per_tensor"]; -"487 add__5" [id=487, type="add_"]; -"488 quantize_per_tensor_268" [id=488, type="quantize_per_tensor"]; -"489 dequantize_per_tensor_269" [id=489, type="dequantize_per_tensor"]; -"490 features_12_0_weight_bias" [id=490, type="get_attr"]; -"491 _frozen_param51" [id=491, type="get_attr"]; -"492 dequantize_per_tensor_270" [id=492, type="dequantize_per_tensor"]; -"493 conv2d_51" [id=493, type=conv2d]; -"494 quantize_per_tensor_271" [id=494, type="quantize_per_tensor"]; -"495 dequantize_per_tensor_272" [id=495, type="dequantize_per_tensor"]; -"496 hardswish__17" [id=496, type="hardswish_"]; -"497 quantize_per_tensor_273" [id=497, type="quantize_per_tensor"]; -"498 dequantize_per_tensor_274" [id=498, type="dequantize_per_tensor"]; -"499 adaptive_avg_pool2d_9" [id=499, type="adaptive_avg_pool2d"]; -"500 quantize_per_tensor_275" [id=500, type="quantize_per_tensor"]; -"501 dequantize_per_tensor_276" [id=501, type="dequantize_per_tensor"]; -"502 
flatten" [id=502, type=flatten]; -"503 quantize_per_tensor_277" [id=503, type="quantize_per_tensor"]; -"504 dequantize_per_tensor_278" [id=504, type="dequantize_per_tensor"]; -"505 _frozen_param52" [id=505, type="get_attr"]; -"506 dequantize_per_tensor_279" [id=506, type="dequantize_per_tensor"]; -"507 linear" [id=507, type=linear]; -"508 quantize_per_tensor_280" [id=508, type="quantize_per_tensor"]; -"509 dequantize_per_tensor_281" [id=509, type="dequantize_per_tensor"]; -"510 hardswish__18" [id=510, type="hardswish_"]; -"511 dropout_" [id=511, type="dropout_"]; -"512 quantize_per_tensor_282" [id=512, type="quantize_per_tensor"]; -"513 dequantize_per_tensor_283" [id=513, type="dequantize_per_tensor"]; -"514 _frozen_param53" [id=514, type="get_attr"]; -"515 dequantize_per_tensor_284" [id=515, type="dequantize_per_tensor"]; -"516 linear_1" [id=516, type=linear]; -"517 quantize_per_tensor_285" [id=517, type="quantize_per_tensor"]; -"518 dequantize_per_tensor_286" [id=518, type="dequantize_per_tensor"]; -"519 output" [id=519, type=output]; -"0 features_1_block_1_fc1_bias" -> "45 conv2d_2" [style=solid, label="(8,)"]; -"1 features_1_block_1_fc2_bias" -> "51 conv2d_3" [style=solid, label="(16,)"]; -"2 features_4_block_2_fc1_bias" -> "134 conv2d_13" [style=solid, label="(24,)"]; -"3 features_4_block_2_fc2_bias" -> "140 conv2d_14" [style=solid, label="(96,)"]; -"4 features_5_block_2_fc1_bias" -> "180 conv2d_18" [style=solid, label="(64,)"]; -"5 features_5_block_2_fc2_bias" -> "186 conv2d_19" [style=solid, label="(240,)"]; -"6 features_6_block_2_fc1_bias" -> "229 conv2d_23" [style=solid, label="(64,)"]; -"7 features_6_block_2_fc2_bias" -> "235 conv2d_24" [style=solid, label="(240,)"]; -"8 features_7_block_2_fc1_bias" -> "277 conv2d_28" [style=solid, label="(32,)"]; -"9 features_7_block_2_fc2_bias" -> "283 conv2d_29" [style=solid, label="(120,)"]; -"10 features_8_block_2_fc1_bias" -> "323 conv2d_33" [style=solid, label="(40,)"]; -"11 features_8_block_2_fc2_bias" -> "329 
conv2d_34" [style=solid, label="(144,)"]; -"12 features_9_block_2_fc1_bias" -> "371 conv2d_38" [style=solid, label="(72,)"]; -"13 features_9_block_2_fc2_bias" -> "377 conv2d_39" [style=solid, label="(288,)"]; -"14 features_10_block_2_fc1_bias" -> "417 conv2d_43" [style=solid, label="(144,)"]; -"15 features_10_block_2_fc2_bias" -> "423 conv2d_44" [style=solid, label="(576,)"]; -"16 features_11_block_2_fc1_bias" -> "466 conv2d_48" [style=solid, label="(144,)"]; -"17 features_11_block_2_fc2_bias" -> "472 conv2d_49" [style=solid, label="(576,)"]; -"18 classifier_0_bias" -> "507 linear" [style=solid, label="(1024,)"]; -"19 classifier_3_bias" -> "516 linear_1" [style=solid, label="(1000,)"]; -"20 x" -> "21 quantize_per_tensor_0" [style=solid, label="(1, 3, 224, 224)"]; -"21 quantize_per_tensor_0" -> "22 dequantize_per_tensor_1" [style=solid, label="(1, 3, 224, 224)"]; -"22 dequantize_per_tensor_1" -> "26 conv2d" [style=solid, label="(1, 3, 224, 224)"]; -"23 features_0_0_weight_bias" -> "26 conv2d" [style=solid, label="(16,)"]; -"24 _frozen_param0" -> "25 dequantize_per_tensor_2" [style=solid, label="(16, 3, 3, 3)"]; -"25 dequantize_per_tensor_2" -> "26 conv2d" [style=solid, label="(16, 3, 3, 3)"]; -"26 conv2d" -> "27 quantize_per_tensor_3" [style=solid, label="(1, 16, 112, 112)"]; -"27 quantize_per_tensor_3" -> "28 dequantize_per_tensor_4" [style=solid, label="(1, 16, 112, 112)"]; -"28 dequantize_per_tensor_4" -> "29 hardswish_" [style=solid, label="(1, 16, 112, 112)"]; -"29 hardswish_" -> "30 quantize_per_tensor_5" [style=solid, label="(1, 16, 112, 112)"]; -"30 quantize_per_tensor_5" -> "31 dequantize_per_tensor_6" [style=solid, label="(1, 16, 112, 112)"]; -"31 dequantize_per_tensor_6" -> "35 conv2d_1" [style=solid, label="(1, 16, 112, 112)"]; -"32 features_1_block_0_0_weight_bias" -> "35 conv2d_1" [style=solid, label="(16,)"]; -"33 _frozen_param1" -> "34 dequantize_per_tensor_7" [style=solid, label="(16, 1, 3, 3)"]; -"34 dequantize_per_tensor_7" -> "35 conv2d_1" 
[style=solid, label="(16, 1, 3, 3)"]; -"35 conv2d_1" -> "36 relu_" [style=solid, label="(1, 16, 56, 56)"]; -"36 relu_" -> "37 quantize_per_tensor_8" [style=solid, label="(1, 16, 56, 56)"]; -"37 quantize_per_tensor_8" -> "38 dequantize_per_tensor_9" [style=solid, label="(1, 16, 56, 56)"]; -"37 quantize_per_tensor_8" -> "39 dequantize_per_tensor_10" [style=solid, label="(1, 16, 56, 56)"]; -"38 dequantize_per_tensor_9" -> "57 mul" [style=solid, label="(1, 16, 56, 56)"]; -"39 dequantize_per_tensor_10" -> "40 adaptive_avg_pool2d" [style=solid, label="(1, 16, 56, 56)"]; -"40 adaptive_avg_pool2d" -> "41 quantize_per_tensor_11" [style=solid, label="(1, 16, 1, 1)"]; -"41 quantize_per_tensor_11" -> "42 dequantize_per_tensor_12" [style=solid, label="(1, 16, 1, 1)"]; -"42 dequantize_per_tensor_12" -> "45 conv2d_2" [style=solid, label="(1, 16, 1, 1)"]; -"43 _frozen_param2" -> "44 dequantize_per_tensor_13" [style=solid, label="(8, 16, 1, 1)"]; -"44 dequantize_per_tensor_13" -> "45 conv2d_2" [style=solid, label="(8, 16, 1, 1)"]; -"45 conv2d_2" -> "46 relu" [style=solid, label="(1, 8, 1, 1)"]; -"46 relu" -> "47 quantize_per_tensor_14" [style=solid, label="(1, 8, 1, 1)"]; -"47 quantize_per_tensor_14" -> "48 dequantize_per_tensor_15" [style=solid, label="(1, 8, 1, 1)"]; -"48 dequantize_per_tensor_15" -> "51 conv2d_3" [style=solid, label="(1, 8, 1, 1)"]; -"49 _frozen_param3" -> "50 dequantize_per_tensor_16" [style=solid, label="(16, 8, 1, 1)"]; -"50 dequantize_per_tensor_16" -> "51 conv2d_3" [style=solid, label="(16, 8, 1, 1)"]; -"51 conv2d_3" -> "52 quantize_per_tensor_17" [style=solid, label="(1, 16, 1, 1)"]; -"52 quantize_per_tensor_17" -> "53 dequantize_per_tensor_18" [style=solid, label="(1, 16, 1, 1)"]; -"53 dequantize_per_tensor_18" -> "54 hardsigmoid" [style=solid, label="(1, 16, 1, 1)"]; -"54 hardsigmoid" -> "55 quantize_per_tensor_19" [style=solid, label="(1, 16, 1, 1)"]; -"55 quantize_per_tensor_19" -> "56 dequantize_per_tensor_20" [style=solid, label="(1, 16, 1, 1)"]; 
-"56 dequantize_per_tensor_20" -> "57 mul" [style=solid, label="(1, 16, 1, 1)"]; -"57 mul" -> "58 quantize_per_tensor_21" [style=solid, label="(1, 16, 56, 56)"]; -"58 quantize_per_tensor_21" -> "59 dequantize_per_tensor_22" [style=solid, label="(1, 16, 56, 56)"]; -"59 dequantize_per_tensor_22" -> "63 conv2d_4" [style=solid, label="(1, 16, 56, 56)"]; -"60 features_1_block_2_0_weight_bias" -> "63 conv2d_4" [style=solid, label="(16,)"]; -"61 _frozen_param4" -> "62 dequantize_per_tensor_23" [style=solid, label="(16, 16, 1, 1)"]; -"62 dequantize_per_tensor_23" -> "63 conv2d_4" [style=solid, label="(16, 16, 1, 1)"]; -"63 conv2d_4" -> "64 quantize_per_tensor_24" [style=solid, label="(1, 16, 56, 56)"]; -"64 quantize_per_tensor_24" -> "65 dequantize_per_tensor_25" [style=solid, label="(1, 16, 56, 56)"]; -"65 dequantize_per_tensor_25" -> "69 conv2d_5" [style=solid, label="(1, 16, 56, 56)"]; -"66 features_2_block_0_0_weight_bias" -> "69 conv2d_5" [style=solid, label="(72,)"]; -"67 _frozen_param5" -> "68 dequantize_per_tensor_26" [style=solid, label="(72, 16, 1, 1)"]; -"68 dequantize_per_tensor_26" -> "69 conv2d_5" [style=solid, label="(72, 16, 1, 1)"]; -"69 conv2d_5" -> "70 relu__1" [style=solid, label="(1, 72, 56, 56)"]; -"70 relu__1" -> "71 quantize_per_tensor_27" [style=solid, label="(1, 72, 56, 56)"]; -"71 quantize_per_tensor_27" -> "72 dequantize_per_tensor_28" [style=solid, label="(1, 72, 56, 56)"]; -"72 dequantize_per_tensor_28" -> "76 conv2d_6" [style=solid, label="(1, 72, 56, 56)"]; -"73 features_2_block_1_0_weight_bias" -> "76 conv2d_6" [style=solid, label="(72,)"]; -"74 _frozen_param6" -> "75 dequantize_per_tensor_29" [style=solid, label="(72, 1, 3, 3)"]; -"75 dequantize_per_tensor_29" -> "76 conv2d_6" [style=solid, label="(72, 1, 3, 3)"]; -"76 conv2d_6" -> "77 relu__2" [style=solid, label="(1, 72, 28, 28)"]; -"77 relu__2" -> "78 quantize_per_tensor_30" [style=solid, label="(1, 72, 28, 28)"]; -"78 quantize_per_tensor_30" -> "79 dequantize_per_tensor_31" 
[style=solid, label="(1, 72, 28, 28)"]; -"79 dequantize_per_tensor_31" -> "83 conv2d_7" [style=solid, label="(1, 72, 28, 28)"]; -"80 features_2_block_2_0_weight_bias" -> "83 conv2d_7" [style=solid, label="(24,)"]; -"81 _frozen_param7" -> "82 dequantize_per_tensor_32" [style=solid, label="(24, 72, 1, 1)"]; -"82 dequantize_per_tensor_32" -> "83 conv2d_7" [style=solid, label="(24, 72, 1, 1)"]; -"83 conv2d_7" -> "84 quantize_per_tensor_33" [style=solid, label="(1, 24, 28, 28)"]; -"84 quantize_per_tensor_33" -> "85 dequantize_per_tensor_34" [style=solid, label="(1, 24, 28, 28)"]; -"84 quantize_per_tensor_33" -> "86 dequantize_per_tensor_35" [style=solid, label="(1, 24, 28, 28)"]; -"85 dequantize_per_tensor_34" -> "107 add_" [style=solid, label="(1, 24, 28, 28)"]; -"86 dequantize_per_tensor_35" -> "90 conv2d_8" [style=solid, label="(1, 24, 28, 28)"]; -"87 features_3_block_0_0_weight_bias" -> "90 conv2d_8" [style=solid, label="(88,)"]; -"88 _frozen_param8" -> "89 dequantize_per_tensor_36" [style=solid, label="(88, 24, 1, 1)"]; -"89 dequantize_per_tensor_36" -> "90 conv2d_8" [style=solid, label="(88, 24, 1, 1)"]; -"90 conv2d_8" -> "91 relu__3" [style=solid, label="(1, 88, 28, 28)"]; -"91 relu__3" -> "92 quantize_per_tensor_37" [style=solid, label="(1, 88, 28, 28)"]; -"92 quantize_per_tensor_37" -> "93 dequantize_per_tensor_38" [style=solid, label="(1, 88, 28, 28)"]; -"93 dequantize_per_tensor_38" -> "97 conv2d_9" [style=solid, label="(1, 88, 28, 28)"]; -"94 features_3_block_1_0_weight_bias" -> "97 conv2d_9" [style=solid, label="(88,)"]; -"95 _frozen_param9" -> "96 dequantize_per_tensor_39" [style=solid, label="(88, 1, 3, 3)"]; -"96 dequantize_per_tensor_39" -> "97 conv2d_9" [style=solid, label="(88, 1, 3, 3)"]; -"97 conv2d_9" -> "98 relu__4" [style=solid, label="(1, 88, 28, 28)"]; -"98 relu__4" -> "99 quantize_per_tensor_40" [style=solid, label="(1, 88, 28, 28)"]; -"99 quantize_per_tensor_40" -> "100 dequantize_per_tensor_41" [style=solid, label="(1, 88, 28, 28)"]; -"100 
dequantize_per_tensor_41" -> "104 conv2d_10" [style=solid, label="(1, 88, 28, 28)"]; -"101 features_3_block_2_0_weight_bias" -> "104 conv2d_10" [style=solid, label="(24,)"]; -"102 _frozen_param10" -> "103 dequantize_per_tensor_42" [style=solid, label="(24, 88, 1, 1)"]; -"103 dequantize_per_tensor_42" -> "104 conv2d_10" [style=solid, label="(24, 88, 1, 1)"]; -"104 conv2d_10" -> "105 quantize_per_tensor_43" [style=solid, label="(1, 24, 28, 28)"]; -"105 quantize_per_tensor_43" -> "106 dequantize_per_tensor_44" [style=solid, label="(1, 24, 28, 28)"]; -"106 dequantize_per_tensor_44" -> "107 add_" [style=solid, label="(1, 24, 28, 28)"]; -"107 add_" -> "108 quantize_per_tensor_45" [style=solid, label="(1, 24, 28, 28)"]; -"108 quantize_per_tensor_45" -> "109 dequantize_per_tensor_46" [style=solid, label="(1, 24, 28, 28)"]; -"109 dequantize_per_tensor_46" -> "113 conv2d_11" [style=solid, label="(1, 24, 28, 28)"]; -"110 features_4_block_0_0_weight_bias" -> "113 conv2d_11" [style=solid, label="(96,)"]; -"111 _frozen_param11" -> "112 dequantize_per_tensor_47" [style=solid, label="(96, 24, 1, 1)"]; -"112 dequantize_per_tensor_47" -> "113 conv2d_11" [style=solid, label="(96, 24, 1, 1)"]; -"113 conv2d_11" -> "114 quantize_per_tensor_48" [style=solid, label="(1, 96, 28, 28)"]; -"114 quantize_per_tensor_48" -> "115 dequantize_per_tensor_49" [style=solid, label="(1, 96, 28, 28)"]; -"115 dequantize_per_tensor_49" -> "116 hardswish__1" [style=solid, label="(1, 96, 28, 28)"]; -"116 hardswish__1" -> "117 quantize_per_tensor_50" [style=solid, label="(1, 96, 28, 28)"]; -"117 quantize_per_tensor_50" -> "118 dequantize_per_tensor_51" [style=solid, label="(1, 96, 28, 28)"]; -"118 dequantize_per_tensor_51" -> "122 conv2d_12" [style=solid, label="(1, 96, 28, 28)"]; -"119 features_4_block_1_0_weight_bias" -> "122 conv2d_12" [style=solid, label="(96,)"]; -"120 _frozen_param12" -> "121 dequantize_per_tensor_52" [style=solid, label="(96, 1, 5, 5)"]; -"121 dequantize_per_tensor_52" -> "122 
conv2d_12" [style=solid, label="(96, 1, 5, 5)"]; -"122 conv2d_12" -> "123 quantize_per_tensor_53" [style=solid, label="(1, 96, 14, 14)"]; -"123 quantize_per_tensor_53" -> "124 dequantize_per_tensor_54" [style=solid, label="(1, 96, 14, 14)"]; -"124 dequantize_per_tensor_54" -> "125 hardswish__2" [style=solid, label="(1, 96, 14, 14)"]; -"125 hardswish__2" -> "126 quantize_per_tensor_55" [style=solid, label="(1, 96, 14, 14)"]; -"126 quantize_per_tensor_55" -> "127 dequantize_per_tensor_56" [style=solid, label="(1, 96, 14, 14)"]; -"126 quantize_per_tensor_55" -> "128 dequantize_per_tensor_57" [style=solid, label="(1, 96, 14, 14)"]; -"127 dequantize_per_tensor_56" -> "146 mul_1" [style=solid, label="(1, 96, 14, 14)"]; -"128 dequantize_per_tensor_57" -> "129 adaptive_avg_pool2d_1" [style=solid, label="(1, 96, 14, 14)"]; -"129 adaptive_avg_pool2d_1" -> "130 quantize_per_tensor_58" [style=solid, label="(1, 96, 1, 1)"]; -"130 quantize_per_tensor_58" -> "131 dequantize_per_tensor_59" [style=solid, label="(1, 96, 1, 1)"]; -"131 dequantize_per_tensor_59" -> "134 conv2d_13" [style=solid, label="(1, 96, 1, 1)"]; -"132 _frozen_param13" -> "133 dequantize_per_tensor_60" [style=solid, label="(24, 96, 1, 1)"]; -"133 dequantize_per_tensor_60" -> "134 conv2d_13" [style=solid, label="(24, 96, 1, 1)"]; -"134 conv2d_13" -> "135 relu_1" [style=solid, label="(1, 24, 1, 1)"]; -"135 relu_1" -> "136 quantize_per_tensor_61" [style=solid, label="(1, 24, 1, 1)"]; -"136 quantize_per_tensor_61" -> "137 dequantize_per_tensor_62" [style=solid, label="(1, 24, 1, 1)"]; -"137 dequantize_per_tensor_62" -> "140 conv2d_14" [style=solid, label="(1, 24, 1, 1)"]; -"138 _frozen_param14" -> "139 dequantize_per_tensor_63" [style=solid, label="(96, 24, 1, 1)"]; -"139 dequantize_per_tensor_63" -> "140 conv2d_14" [style=solid, label="(96, 24, 1, 1)"]; -"140 conv2d_14" -> "141 quantize_per_tensor_64" [style=solid, label="(1, 96, 1, 1)"]; -"141 quantize_per_tensor_64" -> "142 dequantize_per_tensor_65" [style=solid, 
label="(1, 96, 1, 1)"]; -"142 dequantize_per_tensor_65" -> "143 hardsigmoid_1" [style=solid, label="(1, 96, 1, 1)"]; -"143 hardsigmoid_1" -> "144 quantize_per_tensor_66" [style=solid, label="(1, 96, 1, 1)"]; -"144 quantize_per_tensor_66" -> "145 dequantize_per_tensor_67" [style=solid, label="(1, 96, 1, 1)"]; -"145 dequantize_per_tensor_67" -> "146 mul_1" [style=solid, label="(1, 96, 1, 1)"]; -"146 mul_1" -> "147 quantize_per_tensor_68" [style=solid, label="(1, 96, 14, 14)"]; -"147 quantize_per_tensor_68" -> "148 dequantize_per_tensor_69" [style=solid, label="(1, 96, 14, 14)"]; -"148 dequantize_per_tensor_69" -> "152 conv2d_15" [style=solid, label="(1, 96, 14, 14)"]; -"149 features_4_block_3_0_weight_bias" -> "152 conv2d_15" [style=solid, label="(40,)"]; -"150 _frozen_param15" -> "151 dequantize_per_tensor_70" [style=solid, label="(40, 96, 1, 1)"]; -"151 dequantize_per_tensor_70" -> "152 conv2d_15" [style=solid, label="(40, 96, 1, 1)"]; -"152 conv2d_15" -> "153 quantize_per_tensor_71" [style=solid, label="(1, 40, 14, 14)"]; -"153 quantize_per_tensor_71" -> "154 dequantize_per_tensor_72" [style=solid, label="(1, 40, 14, 14)"]; -"153 quantize_per_tensor_71" -> "155 dequantize_per_tensor_73" [style=solid, label="(1, 40, 14, 14)"]; -"154 dequantize_per_tensor_72" -> "201 add__1" [style=solid, label="(1, 40, 14, 14)"]; -"155 dequantize_per_tensor_73" -> "159 conv2d_16" [style=solid, label="(1, 40, 14, 14)"]; -"156 features_5_block_0_0_weight_bias" -> "159 conv2d_16" [style=solid, label="(240,)"]; -"157 _frozen_param16" -> "158 dequantize_per_tensor_74" [style=solid, label="(240, 40, 1, 1)"]; -"158 dequantize_per_tensor_74" -> "159 conv2d_16" [style=solid, label="(240, 40, 1, 1)"]; -"159 conv2d_16" -> "160 quantize_per_tensor_75" [style=solid, label="(1, 240, 14, 14)"]; -"160 quantize_per_tensor_75" -> "161 dequantize_per_tensor_76" [style=solid, label="(1, 240, 14, 14)"]; -"161 dequantize_per_tensor_76" -> "162 hardswish__3" [style=solid, label="(1, 240, 14, 14)"]; -"162 
hardswish__3" -> "163 quantize_per_tensor_77" [style=solid, label="(1, 240, 14, 14)"]; -"163 quantize_per_tensor_77" -> "164 dequantize_per_tensor_78" [style=solid, label="(1, 240, 14, 14)"]; -"164 dequantize_per_tensor_78" -> "168 conv2d_17" [style=solid, label="(1, 240, 14, 14)"]; -"165 features_5_block_1_0_weight_bias" -> "168 conv2d_17" [style=solid, label="(240,)"]; -"166 _frozen_param17" -> "167 dequantize_per_tensor_79" [style=solid, label="(240, 1, 5, 5)"]; -"167 dequantize_per_tensor_79" -> "168 conv2d_17" [style=solid, label="(240, 1, 5, 5)"]; -"168 conv2d_17" -> "169 quantize_per_tensor_80" [style=solid, label="(1, 240, 14, 14)"]; -"169 quantize_per_tensor_80" -> "170 dequantize_per_tensor_81" [style=solid, label="(1, 240, 14, 14)"]; -"170 dequantize_per_tensor_81" -> "171 hardswish__4" [style=solid, label="(1, 240, 14, 14)"]; -"171 hardswish__4" -> "172 quantize_per_tensor_82" [style=solid, label="(1, 240, 14, 14)"]; -"172 quantize_per_tensor_82" -> "173 dequantize_per_tensor_83" [style=solid, label="(1, 240, 14, 14)"]; -"172 quantize_per_tensor_82" -> "174 dequantize_per_tensor_84" [style=solid, label="(1, 240, 14, 14)"]; -"173 dequantize_per_tensor_83" -> "192 mul_2" [style=solid, label="(1, 240, 14, 14)"]; -"174 dequantize_per_tensor_84" -> "175 adaptive_avg_pool2d_2" [style=solid, label="(1, 240, 14, 14)"]; -"175 adaptive_avg_pool2d_2" -> "176 quantize_per_tensor_85" [style=solid, label="(1, 240, 1, 1)"]; -"176 quantize_per_tensor_85" -> "177 dequantize_per_tensor_86" [style=solid, label="(1, 240, 1, 1)"]; -"177 dequantize_per_tensor_86" -> "180 conv2d_18" [style=solid, label="(1, 240, 1, 1)"]; -"178 _frozen_param18" -> "179 dequantize_per_tensor_87" [style=solid, label="(64, 240, 1, 1)"]; -"179 dequantize_per_tensor_87" -> "180 conv2d_18" [style=solid, label="(64, 240, 1, 1)"]; -"180 conv2d_18" -> "181 relu_2" [style=solid, label="(1, 64, 1, 1)"]; -"181 relu_2" -> "182 quantize_per_tensor_88" [style=solid, label="(1, 64, 1, 1)"]; -"182 
quantize_per_tensor_88" -> "183 dequantize_per_tensor_89" [style=solid, label="(1, 64, 1, 1)"]; -"183 dequantize_per_tensor_89" -> "186 conv2d_19" [style=solid, label="(1, 64, 1, 1)"]; -"184 _frozen_param19" -> "185 dequantize_per_tensor_90" [style=solid, label="(240, 64, 1, 1)"]; -"185 dequantize_per_tensor_90" -> "186 conv2d_19" [style=solid, label="(240, 64, 1, 1)"]; -"186 conv2d_19" -> "187 quantize_per_tensor_91" [style=solid, label="(1, 240, 1, 1)"]; -"187 quantize_per_tensor_91" -> "188 dequantize_per_tensor_92" [style=solid, label="(1, 240, 1, 1)"]; -"188 dequantize_per_tensor_92" -> "189 hardsigmoid_2" [style=solid, label="(1, 240, 1, 1)"]; -"189 hardsigmoid_2" -> "190 quantize_per_tensor_93" [style=solid, label="(1, 240, 1, 1)"]; -"190 quantize_per_tensor_93" -> "191 dequantize_per_tensor_94" [style=solid, label="(1, 240, 1, 1)"]; -"191 dequantize_per_tensor_94" -> "192 mul_2" [style=solid, label="(1, 240, 1, 1)"]; -"192 mul_2" -> "193 quantize_per_tensor_95" [style=solid, label="(1, 240, 14, 14)"]; -"193 quantize_per_tensor_95" -> "194 dequantize_per_tensor_96" [style=solid, label="(1, 240, 14, 14)"]; -"194 dequantize_per_tensor_96" -> "198 conv2d_20" [style=solid, label="(1, 240, 14, 14)"]; -"195 features_5_block_3_0_weight_bias" -> "198 conv2d_20" [style=solid, label="(40,)"]; -"196 _frozen_param20" -> "197 dequantize_per_tensor_97" [style=solid, label="(40, 240, 1, 1)"]; -"197 dequantize_per_tensor_97" -> "198 conv2d_20" [style=solid, label="(40, 240, 1, 1)"]; -"198 conv2d_20" -> "199 quantize_per_tensor_98" [style=solid, label="(1, 40, 14, 14)"]; -"199 quantize_per_tensor_98" -> "200 dequantize_per_tensor_99" [style=solid, label="(1, 40, 14, 14)"]; -"200 dequantize_per_tensor_99" -> "201 add__1" [style=solid, label="(1, 40, 14, 14)"]; -"201 add__1" -> "202 quantize_per_tensor_100" [style=solid, label="(1, 40, 14, 14)"]; -"202 quantize_per_tensor_100" -> "203 dequantize_per_tensor_101" [style=solid, label="(1, 40, 14, 14)"]; -"202 
quantize_per_tensor_100" -> "204 dequantize_per_tensor_102" [style=solid, label="(1, 40, 14, 14)"]; -"203 dequantize_per_tensor_101" -> "250 add__2" [style=solid, label="(1, 40, 14, 14)"]; -"204 dequantize_per_tensor_102" -> "208 conv2d_21" [style=solid, label="(1, 40, 14, 14)"]; -"205 features_6_block_0_0_weight_bias" -> "208 conv2d_21" [style=solid, label="(240,)"]; -"206 _frozen_param21" -> "207 dequantize_per_tensor_103" [style=solid, label="(240, 40, 1, 1)"]; -"207 dequantize_per_tensor_103" -> "208 conv2d_21" [style=solid, label="(240, 40, 1, 1)"]; -"208 conv2d_21" -> "209 quantize_per_tensor_104" [style=solid, label="(1, 240, 14, 14)"]; -"209 quantize_per_tensor_104" -> "210 dequantize_per_tensor_105" [style=solid, label="(1, 240, 14, 14)"]; -"210 dequantize_per_tensor_105" -> "211 hardswish__5" [style=solid, label="(1, 240, 14, 14)"]; -"211 hardswish__5" -> "212 quantize_per_tensor_106" [style=solid, label="(1, 240, 14, 14)"]; -"212 quantize_per_tensor_106" -> "213 dequantize_per_tensor_107" [style=solid, label="(1, 240, 14, 14)"]; -"213 dequantize_per_tensor_107" -> "217 conv2d_22" [style=solid, label="(1, 240, 14, 14)"]; -"214 features_6_block_1_0_weight_bias" -> "217 conv2d_22" [style=solid, label="(240,)"]; -"215 _frozen_param22" -> "216 dequantize_per_tensor_108" [style=solid, label="(240, 1, 5, 5)"]; -"216 dequantize_per_tensor_108" -> "217 conv2d_22" [style=solid, label="(240, 1, 5, 5)"]; -"217 conv2d_22" -> "218 quantize_per_tensor_109" [style=solid, label="(1, 240, 14, 14)"]; -"218 quantize_per_tensor_109" -> "219 dequantize_per_tensor_110" [style=solid, label="(1, 240, 14, 14)"]; -"219 dequantize_per_tensor_110" -> "220 hardswish__6" [style=solid, label="(1, 240, 14, 14)"]; -"220 hardswish__6" -> "221 quantize_per_tensor_111" [style=solid, label="(1, 240, 14, 14)"]; -"221 quantize_per_tensor_111" -> "222 dequantize_per_tensor_112" [style=solid, label="(1, 240, 14, 14)"]; -"221 quantize_per_tensor_111" -> "223 dequantize_per_tensor_113" 
[style=solid, label="(1, 240, 14, 14)"]; -"222 dequantize_per_tensor_112" -> "241 mul_3" [style=solid, label="(1, 240, 14, 14)"]; -"223 dequantize_per_tensor_113" -> "224 adaptive_avg_pool2d_3" [style=solid, label="(1, 240, 14, 14)"]; -"224 adaptive_avg_pool2d_3" -> "225 quantize_per_tensor_114" [style=solid, label="(1, 240, 1, 1)"]; -"225 quantize_per_tensor_114" -> "226 dequantize_per_tensor_115" [style=solid, label="(1, 240, 1, 1)"]; -"226 dequantize_per_tensor_115" -> "229 conv2d_23" [style=solid, label="(1, 240, 1, 1)"]; -"227 _frozen_param23" -> "228 dequantize_per_tensor_116" [style=solid, label="(64, 240, 1, 1)"]; -"228 dequantize_per_tensor_116" -> "229 conv2d_23" [style=solid, label="(64, 240, 1, 1)"]; -"229 conv2d_23" -> "230 relu_3" [style=solid, label="(1, 64, 1, 1)"]; -"230 relu_3" -> "231 quantize_per_tensor_117" [style=solid, label="(1, 64, 1, 1)"]; -"231 quantize_per_tensor_117" -> "232 dequantize_per_tensor_118" [style=solid, label="(1, 64, 1, 1)"]; -"232 dequantize_per_tensor_118" -> "235 conv2d_24" [style=solid, label="(1, 64, 1, 1)"]; -"233 _frozen_param24" -> "234 dequantize_per_tensor_119" [style=solid, label="(240, 64, 1, 1)"]; -"234 dequantize_per_tensor_119" -> "235 conv2d_24" [style=solid, label="(240, 64, 1, 1)"]; -"235 conv2d_24" -> "236 quantize_per_tensor_120" [style=solid, label="(1, 240, 1, 1)"]; -"236 quantize_per_tensor_120" -> "237 dequantize_per_tensor_121" [style=solid, label="(1, 240, 1, 1)"]; -"237 dequantize_per_tensor_121" -> "238 hardsigmoid_3" [style=solid, label="(1, 240, 1, 1)"]; -"238 hardsigmoid_3" -> "239 quantize_per_tensor_122" [style=solid, label="(1, 240, 1, 1)"]; -"239 quantize_per_tensor_122" -> "240 dequantize_per_tensor_123" [style=solid, label="(1, 240, 1, 1)"]; -"240 dequantize_per_tensor_123" -> "241 mul_3" [style=solid, label="(1, 240, 1, 1)"]; -"241 mul_3" -> "242 quantize_per_tensor_124" [style=solid, label="(1, 240, 14, 14)"]; -"242 quantize_per_tensor_124" -> "243 dequantize_per_tensor_125" 
[style=solid, label="(1, 240, 14, 14)"]; -"243 dequantize_per_tensor_125" -> "247 conv2d_25" [style=solid, label="(1, 240, 14, 14)"]; -"244 features_6_block_3_0_weight_bias" -> "247 conv2d_25" [style=solid, label="(40,)"]; -"245 _frozen_param25" -> "246 dequantize_per_tensor_126" [style=solid, label="(40, 240, 1, 1)"]; -"246 dequantize_per_tensor_126" -> "247 conv2d_25" [style=solid, label="(40, 240, 1, 1)"]; -"247 conv2d_25" -> "248 quantize_per_tensor_127" [style=solid, label="(1, 40, 14, 14)"]; -"248 quantize_per_tensor_127" -> "249 dequantize_per_tensor_128" [style=solid, label="(1, 40, 14, 14)"]; -"249 dequantize_per_tensor_128" -> "250 add__2" [style=solid, label="(1, 40, 14, 14)"]; -"250 add__2" -> "251 quantize_per_tensor_129" [style=solid, label="(1, 40, 14, 14)"]; -"251 quantize_per_tensor_129" -> "252 dequantize_per_tensor_130" [style=solid, label="(1, 40, 14, 14)"]; -"252 dequantize_per_tensor_130" -> "256 conv2d_26" [style=solid, label="(1, 40, 14, 14)"]; -"253 features_7_block_0_0_weight_bias" -> "256 conv2d_26" [style=solid, label="(120,)"]; -"254 _frozen_param26" -> "255 dequantize_per_tensor_131" [style=solid, label="(120, 40, 1, 1)"]; -"255 dequantize_per_tensor_131" -> "256 conv2d_26" [style=solid, label="(120, 40, 1, 1)"]; -"256 conv2d_26" -> "257 quantize_per_tensor_132" [style=solid, label="(1, 120, 14, 14)"]; -"257 quantize_per_tensor_132" -> "258 dequantize_per_tensor_133" [style=solid, label="(1, 120, 14, 14)"]; -"258 dequantize_per_tensor_133" -> "259 hardswish__7" [style=solid, label="(1, 120, 14, 14)"]; -"259 hardswish__7" -> "260 quantize_per_tensor_134" [style=solid, label="(1, 120, 14, 14)"]; -"260 quantize_per_tensor_134" -> "261 dequantize_per_tensor_135" [style=solid, label="(1, 120, 14, 14)"]; -"261 dequantize_per_tensor_135" -> "265 conv2d_27" [style=solid, label="(1, 120, 14, 14)"]; -"262 features_7_block_1_0_weight_bias" -> "265 conv2d_27" [style=solid, label="(120,)"]; -"263 _frozen_param27" -> "264 dequantize_per_tensor_136" 
[style=solid, label="(120, 1, 5, 5)"]; -"264 dequantize_per_tensor_136" -> "265 conv2d_27" [style=solid, label="(120, 1, 5, 5)"]; -"265 conv2d_27" -> "266 quantize_per_tensor_137" [style=solid, label="(1, 120, 14, 14)"]; -"266 quantize_per_tensor_137" -> "267 dequantize_per_tensor_138" [style=solid, label="(1, 120, 14, 14)"]; -"267 dequantize_per_tensor_138" -> "268 hardswish__8" [style=solid, label="(1, 120, 14, 14)"]; -"268 hardswish__8" -> "269 quantize_per_tensor_139" [style=solid, label="(1, 120, 14, 14)"]; -"269 quantize_per_tensor_139" -> "270 dequantize_per_tensor_140" [style=solid, label="(1, 120, 14, 14)"]; -"269 quantize_per_tensor_139" -> "271 dequantize_per_tensor_141" [style=solid, label="(1, 120, 14, 14)"]; -"270 dequantize_per_tensor_140" -> "289 mul_4" [style=solid, label="(1, 120, 14, 14)"]; -"271 dequantize_per_tensor_141" -> "272 adaptive_avg_pool2d_4" [style=solid, label="(1, 120, 14, 14)"]; -"272 adaptive_avg_pool2d_4" -> "273 quantize_per_tensor_142" [style=solid, label="(1, 120, 1, 1)"]; -"273 quantize_per_tensor_142" -> "274 dequantize_per_tensor_143" [style=solid, label="(1, 120, 1, 1)"]; -"274 dequantize_per_tensor_143" -> "277 conv2d_28" [style=solid, label="(1, 120, 1, 1)"]; -"275 _frozen_param28" -> "276 dequantize_per_tensor_144" [style=solid, label="(32, 120, 1, 1)"]; -"276 dequantize_per_tensor_144" -> "277 conv2d_28" [style=solid, label="(32, 120, 1, 1)"]; -"277 conv2d_28" -> "278 relu_4" [style=solid, label="(1, 32, 1, 1)"]; -"278 relu_4" -> "279 quantize_per_tensor_145" [style=solid, label="(1, 32, 1, 1)"]; -"279 quantize_per_tensor_145" -> "280 dequantize_per_tensor_146" [style=solid, label="(1, 32, 1, 1)"]; -"280 dequantize_per_tensor_146" -> "283 conv2d_29" [style=solid, label="(1, 32, 1, 1)"]; -"281 _frozen_param29" -> "282 dequantize_per_tensor_147" [style=solid, label="(120, 32, 1, 1)"]; -"282 dequantize_per_tensor_147" -> "283 conv2d_29" [style=solid, label="(120, 32, 1, 1)"]; -"283 conv2d_29" -> "284 
quantize_per_tensor_148" [style=solid, label="(1, 120, 1, 1)"]; -"284 quantize_per_tensor_148" -> "285 dequantize_per_tensor_149" [style=solid, label="(1, 120, 1, 1)"]; -"285 dequantize_per_tensor_149" -> "286 hardsigmoid_4" [style=solid, label="(1, 120, 1, 1)"]; -"286 hardsigmoid_4" -> "287 quantize_per_tensor_150" [style=solid, label="(1, 120, 1, 1)"]; -"287 quantize_per_tensor_150" -> "288 dequantize_per_tensor_151" [style=solid, label="(1, 120, 1, 1)"]; -"288 dequantize_per_tensor_151" -> "289 mul_4" [style=solid, label="(1, 120, 1, 1)"]; -"289 mul_4" -> "290 quantize_per_tensor_152" [style=solid, label="(1, 120, 14, 14)"]; -"290 quantize_per_tensor_152" -> "291 dequantize_per_tensor_153" [style=solid, label="(1, 120, 14, 14)"]; -"291 dequantize_per_tensor_153" -> "295 conv2d_30" [style=solid, label="(1, 120, 14, 14)"]; -"292 features_7_block_3_0_weight_bias" -> "295 conv2d_30" [style=solid, label="(48,)"]; -"293 _frozen_param30" -> "294 dequantize_per_tensor_154" [style=solid, label="(48, 120, 1, 1)"]; -"294 dequantize_per_tensor_154" -> "295 conv2d_30" [style=solid, label="(48, 120, 1, 1)"]; -"295 conv2d_30" -> "296 quantize_per_tensor_155" [style=solid, label="(1, 48, 14, 14)"]; -"296 quantize_per_tensor_155" -> "297 dequantize_per_tensor_156" [style=solid, label="(1, 48, 14, 14)"]; -"296 quantize_per_tensor_155" -> "298 dequantize_per_tensor_157" [style=solid, label="(1, 48, 14, 14)"]; -"297 dequantize_per_tensor_156" -> "344 add__3" [style=solid, label="(1, 48, 14, 14)"]; -"298 dequantize_per_tensor_157" -> "302 conv2d_31" [style=solid, label="(1, 48, 14, 14)"]; -"299 features_8_block_0_0_weight_bias" -> "302 conv2d_31" [style=solid, label="(144,)"]; -"300 _frozen_param31" -> "301 dequantize_per_tensor_158" [style=solid, label="(144, 48, 1, 1)"]; -"301 dequantize_per_tensor_158" -> "302 conv2d_31" [style=solid, label="(144, 48, 1, 1)"]; -"302 conv2d_31" -> "303 quantize_per_tensor_159" [style=solid, label="(1, 144, 14, 14)"]; -"303 quantize_per_tensor_159" 
-> "304 dequantize_per_tensor_160" [style=solid, label="(1, 144, 14, 14)"]; -"304 dequantize_per_tensor_160" -> "305 hardswish__9" [style=solid, label="(1, 144, 14, 14)"]; -"305 hardswish__9" -> "306 quantize_per_tensor_161" [style=solid, label="(1, 144, 14, 14)"]; -"306 quantize_per_tensor_161" -> "307 dequantize_per_tensor_162" [style=solid, label="(1, 144, 14, 14)"]; -"307 dequantize_per_tensor_162" -> "311 conv2d_32" [style=solid, label="(1, 144, 14, 14)"]; -"308 features_8_block_1_0_weight_bias" -> "311 conv2d_32" [style=solid, label="(144,)"]; -"309 _frozen_param32" -> "310 dequantize_per_tensor_163" [style=solid, label="(144, 1, 5, 5)"]; -"310 dequantize_per_tensor_163" -> "311 conv2d_32" [style=solid, label="(144, 1, 5, 5)"]; -"311 conv2d_32" -> "312 quantize_per_tensor_164" [style=solid, label="(1, 144, 14, 14)"]; -"312 quantize_per_tensor_164" -> "313 dequantize_per_tensor_165" [style=solid, label="(1, 144, 14, 14)"]; -"313 dequantize_per_tensor_165" -> "314 hardswish__10" [style=solid, label="(1, 144, 14, 14)"]; -"314 hardswish__10" -> "315 quantize_per_tensor_166" [style=solid, label="(1, 144, 14, 14)"]; -"315 quantize_per_tensor_166" -> "316 dequantize_per_tensor_167" [style=solid, label="(1, 144, 14, 14)"]; -"315 quantize_per_tensor_166" -> "317 dequantize_per_tensor_168" [style=solid, label="(1, 144, 14, 14)"]; -"316 dequantize_per_tensor_167" -> "335 mul_5" [style=solid, label="(1, 144, 14, 14)"]; -"317 dequantize_per_tensor_168" -> "318 adaptive_avg_pool2d_5" [style=solid, label="(1, 144, 14, 14)"]; -"318 adaptive_avg_pool2d_5" -> "319 quantize_per_tensor_169" [style=solid, label="(1, 144, 1, 1)"]; -"319 quantize_per_tensor_169" -> "320 dequantize_per_tensor_170" [style=solid, label="(1, 144, 1, 1)"]; -"320 dequantize_per_tensor_170" -> "323 conv2d_33" [style=solid, label="(1, 144, 1, 1)"]; -"321 _frozen_param33" -> "322 dequantize_per_tensor_171" [style=solid, label="(40, 144, 1, 1)"]; -"322 dequantize_per_tensor_171" -> "323 conv2d_33" 
[style=solid, label="(40, 144, 1, 1)"]; -"323 conv2d_33" -> "324 relu_5" [style=solid, label="(1, 40, 1, 1)"]; -"324 relu_5" -> "325 quantize_per_tensor_172" [style=solid, label="(1, 40, 1, 1)"]; -"325 quantize_per_tensor_172" -> "326 dequantize_per_tensor_173" [style=solid, label="(1, 40, 1, 1)"]; -"326 dequantize_per_tensor_173" -> "329 conv2d_34" [style=solid, label="(1, 40, 1, 1)"]; -"327 _frozen_param34" -> "328 dequantize_per_tensor_174" [style=solid, label="(144, 40, 1, 1)"]; -"328 dequantize_per_tensor_174" -> "329 conv2d_34" [style=solid, label="(144, 40, 1, 1)"]; -"329 conv2d_34" -> "330 quantize_per_tensor_175" [style=solid, label="(1, 144, 1, 1)"]; -"330 quantize_per_tensor_175" -> "331 dequantize_per_tensor_176" [style=solid, label="(1, 144, 1, 1)"]; -"331 dequantize_per_tensor_176" -> "332 hardsigmoid_5" [style=solid, label="(1, 144, 1, 1)"]; -"332 hardsigmoid_5" -> "333 quantize_per_tensor_177" [style=solid, label="(1, 144, 1, 1)"]; -"333 quantize_per_tensor_177" -> "334 dequantize_per_tensor_178" [style=solid, label="(1, 144, 1, 1)"]; -"334 dequantize_per_tensor_178" -> "335 mul_5" [style=solid, label="(1, 144, 1, 1)"]; -"335 mul_5" -> "336 quantize_per_tensor_179" [style=solid, label="(1, 144, 14, 14)"]; -"336 quantize_per_tensor_179" -> "337 dequantize_per_tensor_180" [style=solid, label="(1, 144, 14, 14)"]; -"337 dequantize_per_tensor_180" -> "341 conv2d_35" [style=solid, label="(1, 144, 14, 14)"]; -"338 features_8_block_3_0_weight_bias" -> "341 conv2d_35" [style=solid, label="(48,)"]; -"339 _frozen_param35" -> "340 dequantize_per_tensor_181" [style=solid, label="(48, 144, 1, 1)"]; -"340 dequantize_per_tensor_181" -> "341 conv2d_35" [style=solid, label="(48, 144, 1, 1)"]; -"341 conv2d_35" -> "342 quantize_per_tensor_182" [style=solid, label="(1, 48, 14, 14)"]; -"342 quantize_per_tensor_182" -> "343 dequantize_per_tensor_183" [style=solid, label="(1, 48, 14, 14)"]; -"343 dequantize_per_tensor_183" -> "344 add__3" [style=solid, label="(1, 48, 14, 
14)"]; -"344 add__3" -> "345 quantize_per_tensor_184" [style=solid, label="(1, 48, 14, 14)"]; -"345 quantize_per_tensor_184" -> "346 dequantize_per_tensor_185" [style=solid, label="(1, 48, 14, 14)"]; -"346 dequantize_per_tensor_185" -> "350 conv2d_36" [style=solid, label="(1, 48, 14, 14)"]; -"347 features_9_block_0_0_weight_bias" -> "350 conv2d_36" [style=solid, label="(288,)"]; -"348 _frozen_param36" -> "349 dequantize_per_tensor_186" [style=solid, label="(288, 48, 1, 1)"]; -"349 dequantize_per_tensor_186" -> "350 conv2d_36" [style=solid, label="(288, 48, 1, 1)"]; -"350 conv2d_36" -> "351 quantize_per_tensor_187" [style=solid, label="(1, 288, 14, 14)"]; -"351 quantize_per_tensor_187" -> "352 dequantize_per_tensor_188" [style=solid, label="(1, 288, 14, 14)"]; -"352 dequantize_per_tensor_188" -> "353 hardswish__11" [style=solid, label="(1, 288, 14, 14)"]; -"353 hardswish__11" -> "354 quantize_per_tensor_189" [style=solid, label="(1, 288, 14, 14)"]; -"354 quantize_per_tensor_189" -> "355 dequantize_per_tensor_190" [style=solid, label="(1, 288, 14, 14)"]; -"355 dequantize_per_tensor_190" -> "359 conv2d_37" [style=solid, label="(1, 288, 14, 14)"]; -"356 features_9_block_1_0_weight_bias" -> "359 conv2d_37" [style=solid, label="(288,)"]; -"357 _frozen_param37" -> "358 dequantize_per_tensor_191" [style=solid, label="(288, 1, 5, 5)"]; -"358 dequantize_per_tensor_191" -> "359 conv2d_37" [style=solid, label="(288, 1, 5, 5)"]; -"359 conv2d_37" -> "360 quantize_per_tensor_192" [style=solid, label="(1, 288, 7, 7)"]; -"360 quantize_per_tensor_192" -> "361 dequantize_per_tensor_193" [style=solid, label="(1, 288, 7, 7)"]; -"361 dequantize_per_tensor_193" -> "362 hardswish__12" [style=solid, label="(1, 288, 7, 7)"]; -"362 hardswish__12" -> "363 quantize_per_tensor_194" [style=solid, label="(1, 288, 7, 7)"]; -"363 quantize_per_tensor_194" -> "364 dequantize_per_tensor_195" [style=solid, label="(1, 288, 7, 7)"]; -"363 quantize_per_tensor_194" -> "365 dequantize_per_tensor_196" 
[style=solid, label="(1, 288, 7, 7)"]; -"364 dequantize_per_tensor_195" -> "383 mul_6" [style=solid, label="(1, 288, 7, 7)"]; -"365 dequantize_per_tensor_196" -> "366 adaptive_avg_pool2d_6" [style=solid, label="(1, 288, 7, 7)"]; -"366 adaptive_avg_pool2d_6" -> "367 quantize_per_tensor_197" [style=solid, label="(1, 288, 1, 1)"]; -"367 quantize_per_tensor_197" -> "368 dequantize_per_tensor_198" [style=solid, label="(1, 288, 1, 1)"]; -"368 dequantize_per_tensor_198" -> "371 conv2d_38" [style=solid, label="(1, 288, 1, 1)"]; -"369 _frozen_param38" -> "370 dequantize_per_tensor_199" [style=solid, label="(72, 288, 1, 1)"]; -"370 dequantize_per_tensor_199" -> "371 conv2d_38" [style=solid, label="(72, 288, 1, 1)"]; -"371 conv2d_38" -> "372 relu_6" [style=solid, label="(1, 72, 1, 1)"]; -"372 relu_6" -> "373 quantize_per_tensor_200" [style=solid, label="(1, 72, 1, 1)"]; -"373 quantize_per_tensor_200" -> "374 dequantize_per_tensor_201" [style=solid, label="(1, 72, 1, 1)"]; -"374 dequantize_per_tensor_201" -> "377 conv2d_39" [style=solid, label="(1, 72, 1, 1)"]; -"375 _frozen_param39" -> "376 dequantize_per_tensor_202" [style=solid, label="(288, 72, 1, 1)"]; -"376 dequantize_per_tensor_202" -> "377 conv2d_39" [style=solid, label="(288, 72, 1, 1)"]; -"377 conv2d_39" -> "378 quantize_per_tensor_203" [style=solid, label="(1, 288, 1, 1)"]; -"378 quantize_per_tensor_203" -> "379 dequantize_per_tensor_204" [style=solid, label="(1, 288, 1, 1)"]; -"379 dequantize_per_tensor_204" -> "380 hardsigmoid_6" [style=solid, label="(1, 288, 1, 1)"]; -"380 hardsigmoid_6" -> "381 quantize_per_tensor_205" [style=solid, label="(1, 288, 1, 1)"]; -"381 quantize_per_tensor_205" -> "382 dequantize_per_tensor_206" [style=solid, label="(1, 288, 1, 1)"]; -"382 dequantize_per_tensor_206" -> "383 mul_6" [style=solid, label="(1, 288, 1, 1)"]; -"383 mul_6" -> "384 quantize_per_tensor_207" [style=solid, label="(1, 288, 7, 7)"]; -"384 quantize_per_tensor_207" -> "385 dequantize_per_tensor_208" [style=solid, 
label="(1, 288, 7, 7)"]; -"385 dequantize_per_tensor_208" -> "389 conv2d_40" [style=solid, label="(1, 288, 7, 7)"]; -"386 features_9_block_3_0_weight_bias" -> "389 conv2d_40" [style=solid, label="(96,)"]; -"387 _frozen_param40" -> "388 dequantize_per_tensor_209" [style=solid, label="(96, 288, 1, 1)"]; -"388 dequantize_per_tensor_209" -> "389 conv2d_40" [style=solid, label="(96, 288, 1, 1)"]; -"389 conv2d_40" -> "390 quantize_per_tensor_210" [style=solid, label="(1, 96, 7, 7)"]; -"390 quantize_per_tensor_210" -> "391 dequantize_per_tensor_211" [style=solid, label="(1, 96, 7, 7)"]; -"390 quantize_per_tensor_210" -> "392 dequantize_per_tensor_212" [style=solid, label="(1, 96, 7, 7)"]; -"391 dequantize_per_tensor_211" -> "438 add__4" [style=solid, label="(1, 96, 7, 7)"]; -"392 dequantize_per_tensor_212" -> "396 conv2d_41" [style=solid, label="(1, 96, 7, 7)"]; -"393 features_10_block_0_0_weight_bias" -> "396 conv2d_41" [style=solid, label="(576,)"]; -"394 _frozen_param41" -> "395 dequantize_per_tensor_213" [style=solid, label="(576, 96, 1, 1)"]; -"395 dequantize_per_tensor_213" -> "396 conv2d_41" [style=solid, label="(576, 96, 1, 1)"]; -"396 conv2d_41" -> "397 quantize_per_tensor_214" [style=solid, label="(1, 576, 7, 7)"]; -"397 quantize_per_tensor_214" -> "398 dequantize_per_tensor_215" [style=solid, label="(1, 576, 7, 7)"]; -"398 dequantize_per_tensor_215" -> "399 hardswish__13" [style=solid, label="(1, 576, 7, 7)"]; -"399 hardswish__13" -> "400 quantize_per_tensor_216" [style=solid, label="(1, 576, 7, 7)"]; -"400 quantize_per_tensor_216" -> "401 dequantize_per_tensor_217" [style=solid, label="(1, 576, 7, 7)"]; -"401 dequantize_per_tensor_217" -> "405 conv2d_42" [style=solid, label="(1, 576, 7, 7)"]; -"402 features_10_block_1_0_weight_bias" -> "405 conv2d_42" [style=solid, label="(576,)"]; -"403 _frozen_param42" -> "404 dequantize_per_tensor_218" [style=solid, label="(576, 1, 5, 5)"]; -"404 dequantize_per_tensor_218" -> "405 conv2d_42" [style=solid, label="(576, 1, 5, 
5)"]; -"405 conv2d_42" -> "406 quantize_per_tensor_219" [style=solid, label="(1, 576, 7, 7)"]; -"406 quantize_per_tensor_219" -> "407 dequantize_per_tensor_220" [style=solid, label="(1, 576, 7, 7)"]; -"407 dequantize_per_tensor_220" -> "408 hardswish__14" [style=solid, label="(1, 576, 7, 7)"]; -"408 hardswish__14" -> "409 quantize_per_tensor_221" [style=solid, label="(1, 576, 7, 7)"]; -"409 quantize_per_tensor_221" -> "410 dequantize_per_tensor_222" [style=solid, label="(1, 576, 7, 7)"]; -"409 quantize_per_tensor_221" -> "411 dequantize_per_tensor_223" [style=solid, label="(1, 576, 7, 7)"]; -"410 dequantize_per_tensor_222" -> "429 mul_7" [style=solid, label="(1, 576, 7, 7)"]; -"411 dequantize_per_tensor_223" -> "412 adaptive_avg_pool2d_7" [style=solid, label="(1, 576, 7, 7)"]; -"412 adaptive_avg_pool2d_7" -> "413 quantize_per_tensor_224" [style=solid, label="(1, 576, 1, 1)"]; -"413 quantize_per_tensor_224" -> "414 dequantize_per_tensor_225" [style=solid, label="(1, 576, 1, 1)"]; -"414 dequantize_per_tensor_225" -> "417 conv2d_43" [style=solid, label="(1, 576, 1, 1)"]; -"415 _frozen_param43" -> "416 dequantize_per_tensor_226" [style=solid, label="(144, 576, 1, 1)"]; -"416 dequantize_per_tensor_226" -> "417 conv2d_43" [style=solid, label="(144, 576, 1, 1)"]; -"417 conv2d_43" -> "418 relu_7" [style=solid, label="(1, 144, 1, 1)"]; -"418 relu_7" -> "419 quantize_per_tensor_227" [style=solid, label="(1, 144, 1, 1)"]; -"419 quantize_per_tensor_227" -> "420 dequantize_per_tensor_228" [style=solid, label="(1, 144, 1, 1)"]; -"420 dequantize_per_tensor_228" -> "423 conv2d_44" [style=solid, label="(1, 144, 1, 1)"]; -"421 _frozen_param44" -> "422 dequantize_per_tensor_229" [style=solid, label="(576, 144, 1, 1)"]; -"422 dequantize_per_tensor_229" -> "423 conv2d_44" [style=solid, label="(576, 144, 1, 1)"]; -"423 conv2d_44" -> "424 quantize_per_tensor_230" [style=solid, label="(1, 576, 1, 1)"]; -"424 quantize_per_tensor_230" -> "425 dequantize_per_tensor_231" [style=solid, 
label="(1, 576, 1, 1)"]; -"425 dequantize_per_tensor_231" -> "426 hardsigmoid_7" [style=solid, label="(1, 576, 1, 1)"]; -"426 hardsigmoid_7" -> "427 quantize_per_tensor_232" [style=solid, label="(1, 576, 1, 1)"]; -"427 quantize_per_tensor_232" -> "428 dequantize_per_tensor_233" [style=solid, label="(1, 576, 1, 1)"]; -"428 dequantize_per_tensor_233" -> "429 mul_7" [style=solid, label="(1, 576, 1, 1)"]; -"429 mul_7" -> "430 quantize_per_tensor_234" [style=solid, label="(1, 576, 7, 7)"]; -"430 quantize_per_tensor_234" -> "431 dequantize_per_tensor_235" [style=solid, label="(1, 576, 7, 7)"]; -"431 dequantize_per_tensor_235" -> "435 conv2d_45" [style=solid, label="(1, 576, 7, 7)"]; -"432 features_10_block_3_0_weight_bias" -> "435 conv2d_45" [style=solid, label="(96,)"]; -"433 _frozen_param45" -> "434 dequantize_per_tensor_236" [style=solid, label="(96, 576, 1, 1)"]; -"434 dequantize_per_tensor_236" -> "435 conv2d_45" [style=solid, label="(96, 576, 1, 1)"]; -"435 conv2d_45" -> "436 quantize_per_tensor_237" [style=solid, label="(1, 96, 7, 7)"]; -"436 quantize_per_tensor_237" -> "437 dequantize_per_tensor_238" [style=solid, label="(1, 96, 7, 7)"]; -"437 dequantize_per_tensor_238" -> "438 add__4" [style=solid, label="(1, 96, 7, 7)"]; -"438 add__4" -> "439 quantize_per_tensor_239" [style=solid, label="(1, 96, 7, 7)"]; -"439 quantize_per_tensor_239" -> "440 dequantize_per_tensor_240" [style=solid, label="(1, 96, 7, 7)"]; -"439 quantize_per_tensor_239" -> "441 dequantize_per_tensor_241" [style=solid, label="(1, 96, 7, 7)"]; -"440 dequantize_per_tensor_240" -> "487 add__5" [style=solid, label="(1, 96, 7, 7)"]; -"441 dequantize_per_tensor_241" -> "445 conv2d_46" [style=solid, label="(1, 96, 7, 7)"]; -"442 features_11_block_0_0_weight_bias" -> "445 conv2d_46" [style=solid, label="(576,)"]; -"443 _frozen_param46" -> "444 dequantize_per_tensor_242" [style=solid, label="(576, 96, 1, 1)"]; -"444 dequantize_per_tensor_242" -> "445 conv2d_46" [style=solid, label="(576, 96, 1, 1)"]; 
-"445 conv2d_46" -> "446 quantize_per_tensor_243" [style=solid, label="(1, 576, 7, 7)"]; -"446 quantize_per_tensor_243" -> "447 dequantize_per_tensor_244" [style=solid, label="(1, 576, 7, 7)"]; -"447 dequantize_per_tensor_244" -> "448 hardswish__15" [style=solid, label="(1, 576, 7, 7)"]; -"448 hardswish__15" -> "449 quantize_per_tensor_245" [style=solid, label="(1, 576, 7, 7)"]; -"449 quantize_per_tensor_245" -> "450 dequantize_per_tensor_246" [style=solid, label="(1, 576, 7, 7)"]; -"450 dequantize_per_tensor_246" -> "454 conv2d_47" [style=solid, label="(1, 576, 7, 7)"]; -"451 features_11_block_1_0_weight_bias" -> "454 conv2d_47" [style=solid, label="(576,)"]; -"452 _frozen_param47" -> "453 dequantize_per_tensor_247" [style=solid, label="(576, 1, 5, 5)"]; -"453 dequantize_per_tensor_247" -> "454 conv2d_47" [style=solid, label="(576, 1, 5, 5)"]; -"454 conv2d_47" -> "455 quantize_per_tensor_248" [style=solid, label="(1, 576, 7, 7)"]; -"455 quantize_per_tensor_248" -> "456 dequantize_per_tensor_249" [style=solid, label="(1, 576, 7, 7)"]; -"456 dequantize_per_tensor_249" -> "457 hardswish__16" [style=solid, label="(1, 576, 7, 7)"]; -"457 hardswish__16" -> "458 quantize_per_tensor_250" [style=solid, label="(1, 576, 7, 7)"]; -"458 quantize_per_tensor_250" -> "459 dequantize_per_tensor_251" [style=solid, label="(1, 576, 7, 7)"]; -"458 quantize_per_tensor_250" -> "460 dequantize_per_tensor_252" [style=solid, label="(1, 576, 7, 7)"]; -"459 dequantize_per_tensor_251" -> "478 mul_8" [style=solid, label="(1, 576, 7, 7)"]; -"460 dequantize_per_tensor_252" -> "461 adaptive_avg_pool2d_8" [style=solid, label="(1, 576, 7, 7)"]; -"461 adaptive_avg_pool2d_8" -> "462 quantize_per_tensor_253" [style=solid, label="(1, 576, 1, 1)"]; -"462 quantize_per_tensor_253" -> "463 dequantize_per_tensor_254" [style=solid, label="(1, 576, 1, 1)"]; -"463 dequantize_per_tensor_254" -> "466 conv2d_48" [style=solid, label="(1, 576, 1, 1)"]; -"464 _frozen_param48" -> "465 dequantize_per_tensor_255" 
[style=solid, label="(144, 576, 1, 1)"]; -"465 dequantize_per_tensor_255" -> "466 conv2d_48" [style=solid, label="(144, 576, 1, 1)"]; -"466 conv2d_48" -> "467 relu_8" [style=solid, label="(1, 144, 1, 1)"]; -"467 relu_8" -> "468 quantize_per_tensor_256" [style=solid, label="(1, 144, 1, 1)"]; -"468 quantize_per_tensor_256" -> "469 dequantize_per_tensor_257" [style=solid, label="(1, 144, 1, 1)"]; -"469 dequantize_per_tensor_257" -> "472 conv2d_49" [style=solid, label="(1, 144, 1, 1)"]; -"470 _frozen_param49" -> "471 dequantize_per_tensor_258" [style=solid, label="(576, 144, 1, 1)"]; -"471 dequantize_per_tensor_258" -> "472 conv2d_49" [style=solid, label="(576, 144, 1, 1)"]; -"472 conv2d_49" -> "473 quantize_per_tensor_259" [style=solid, label="(1, 576, 1, 1)"]; -"473 quantize_per_tensor_259" -> "474 dequantize_per_tensor_260" [style=solid, label="(1, 576, 1, 1)"]; -"474 dequantize_per_tensor_260" -> "475 hardsigmoid_8" [style=solid, label="(1, 576, 1, 1)"]; -"475 hardsigmoid_8" -> "476 quantize_per_tensor_261" [style=solid, label="(1, 576, 1, 1)"]; -"476 quantize_per_tensor_261" -> "477 dequantize_per_tensor_262" [style=solid, label="(1, 576, 1, 1)"]; -"477 dequantize_per_tensor_262" -> "478 mul_8" [style=solid, label="(1, 576, 1, 1)"]; -"478 mul_8" -> "479 quantize_per_tensor_263" [style=solid, label="(1, 576, 7, 7)"]; -"479 quantize_per_tensor_263" -> "480 dequantize_per_tensor_264" [style=solid, label="(1, 576, 7, 7)"]; -"480 dequantize_per_tensor_264" -> "484 conv2d_50" [style=solid, label="(1, 576, 7, 7)"]; -"481 features_11_block_3_0_weight_bias" -> "484 conv2d_50" [style=solid, label="(96,)"]; -"482 _frozen_param50" -> "483 dequantize_per_tensor_265" [style=solid, label="(96, 576, 1, 1)"]; -"483 dequantize_per_tensor_265" -> "484 conv2d_50" [style=solid, label="(96, 576, 1, 1)"]; -"484 conv2d_50" -> "485 quantize_per_tensor_266" [style=solid, label="(1, 96, 7, 7)"]; -"485 quantize_per_tensor_266" -> "486 dequantize_per_tensor_267" [style=solid, label="(1, 96, 
7, 7)"]; -"486 dequantize_per_tensor_267" -> "487 add__5" [style=solid, label="(1, 96, 7, 7)"]; -"487 add__5" -> "488 quantize_per_tensor_268" [style=solid, label="(1, 96, 7, 7)"]; -"488 quantize_per_tensor_268" -> "489 dequantize_per_tensor_269" [style=solid, label="(1, 96, 7, 7)"]; -"489 dequantize_per_tensor_269" -> "493 conv2d_51" [style=solid, label="(1, 96, 7, 7)"]; -"490 features_12_0_weight_bias" -> "493 conv2d_51" [style=solid, label="(576,)"]; -"491 _frozen_param51" -> "492 dequantize_per_tensor_270" [style=solid, label="(576, 96, 1, 1)"]; -"492 dequantize_per_tensor_270" -> "493 conv2d_51" [style=solid, label="(576, 96, 1, 1)"]; -"493 conv2d_51" -> "494 quantize_per_tensor_271" [style=solid, label="(1, 576, 7, 7)"]; -"494 quantize_per_tensor_271" -> "495 dequantize_per_tensor_272" [style=solid, label="(1, 576, 7, 7)"]; -"495 dequantize_per_tensor_272" -> "496 hardswish__17" [style=solid, label="(1, 576, 7, 7)"]; -"496 hardswish__17" -> "497 quantize_per_tensor_273" [style=solid, label="(1, 576, 7, 7)"]; -"497 quantize_per_tensor_273" -> "498 dequantize_per_tensor_274" [style=solid, label="(1, 576, 7, 7)"]; -"498 dequantize_per_tensor_274" -> "499 adaptive_avg_pool2d_9" [style=solid, label="(1, 576, 7, 7)"]; -"499 adaptive_avg_pool2d_9" -> "500 quantize_per_tensor_275" [style=solid, label="(1, 576, 1, 1)"]; -"500 quantize_per_tensor_275" -> "501 dequantize_per_tensor_276" [style=solid, label="(1, 576, 1, 1)"]; -"501 dequantize_per_tensor_276" -> "502 flatten" [style=solid, label="(1, 576, 1, 1)"]; -"502 flatten" -> "503 quantize_per_tensor_277" [style=solid, label="(1, 576)"]; -"503 quantize_per_tensor_277" -> "504 dequantize_per_tensor_278" [style=solid, label="(1, 576)"]; -"504 dequantize_per_tensor_278" -> "507 linear" [style=solid, label="(1, 576)"]; -"505 _frozen_param52" -> "506 dequantize_per_tensor_279" [style=solid, label="(1024, 576)"]; -"506 dequantize_per_tensor_279" -> "507 linear" [style=solid, label="(1024, 576)"]; -"507 linear" -> "508 
quantize_per_tensor_280" [style=solid, label="(1, 1024)"]; -"508 quantize_per_tensor_280" -> "509 dequantize_per_tensor_281" [style=solid, label="(1, 1024)"]; -"509 dequantize_per_tensor_281" -> "510 hardswish__18" [style=solid, label="(1, 1024)"]; -"510 hardswish__18" -> "511 dropout_" [style=solid, label="(1, 1024)"]; -"511 dropout_" -> "512 quantize_per_tensor_282" [style=solid, label="(1, 1024)"]; -"512 quantize_per_tensor_282" -> "513 dequantize_per_tensor_283" [style=solid, label="(1, 1024)"]; -"513 dequantize_per_tensor_283" -> "516 linear_1" [style=solid, label="(1, 1024)"]; -"514 _frozen_param53" -> "515 dequantize_per_tensor_284" [style=solid, label="(1000, 1024)"]; -"515 dequantize_per_tensor_284" -> "516 linear_1" [style=solid, label="(1000, 1024)"]; -"516 linear_1" -> "517 quantize_per_tensor_285" [style=solid, label="(1, 1000)"]; -"517 quantize_per_tensor_285" -> "518 dequantize_per_tensor_286" [style=solid, label="(1, 1000)"]; -"518 dequantize_per_tensor_286" -> "519 output" [style=solid, label="(1, 1000)"]; -} diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/mobilenet_v3_small_ref_qconfig.json b/tests/torch2/data/fx/XNNPACKQuantizer/mobilenet_v3_small_ref_qconfig.json deleted file mode 100644 index 49e5f5f6b58..00000000000 --- a/tests/torch2/data/fx/XNNPACKQuantizer/mobilenet_v3_small_ref_qconfig.json +++ /dev/null @@ -1,1352 +0,0 @@ -{ - "quantization_points": { - "('conv2d',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish_',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - 
"dest_dtype": "INT8" - }, - "('conv2d_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_1',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('adaptive_avg_pool2d', 'mul')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_2',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_3',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardsigmoid',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_4',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_5',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_6',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_7',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add_', 'conv2d_8')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_8',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - 
"('conv2d_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_9',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_10',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add_',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_11',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_12',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_12',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - 
"per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_13',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('adaptive_avg_pool2d_1', 'mul_1')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_13',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_14',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_14',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardsigmoid_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_15',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('conv2d_15',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__1', 'conv2d_16')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_16',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_17',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_17',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_18',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('adaptive_avg_pool2d_2', 'mul_2')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_18',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_19',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_19',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardsigmoid_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_20',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_20',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add__2', 'conv2d_21')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_21',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - 
"('hardswish__5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_22',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_22',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_23',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('adaptive_avg_pool2d_3', 'mul_3')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_23',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_24',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_24',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardsigmoid_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_25',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_25',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_26',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_26',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_27',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_27',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - 
"('hardswish__8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('adaptive_avg_pool2d_4', 'mul_4')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_28',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_28',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_29',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_29',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardsigmoid_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_30',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_30',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__3', 'conv2d_31')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_31',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_32',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_32',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('adaptive_avg_pool2d_5', 'mul_5')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_33',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_33',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" 
- }, - "('conv2d_34',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_34',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardsigmoid_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_35',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_35',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_36',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_36',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": 
false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_37',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_37',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__12',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_38',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('adaptive_avg_pool2d_6', 'mul_6')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_38',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_39',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_39',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardsigmoid_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('mul_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_40',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_40',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__4', 'conv2d_41')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_41',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__13',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_42',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_42',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__14',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('adaptive_avg_pool2d_7', 'mul_7')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_43',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_43',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_44',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_44',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardsigmoid_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_45',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_45',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add__5', 
'conv2d_46')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_46',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__15',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_47',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_47',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__16',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('adaptive_avg_pool2d_8', 'mul_8')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_48',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_48',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_49',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_49',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardsigmoid_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_50',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_50',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_51',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_51',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__17',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('adaptive_avg_pool2d_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('flatten',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('hardswish__18',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_1',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('output',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - } - }, - "unified_scale_groups": { - "0": [ - 5, - 6 - ], - "1": [ - 33, - 34 - ], - "2": [ - 48, - 49 - ], - "3": [ - 64, - 65 - ], - "4": [ - 80, - 81 - ], - "5": [ - 95, - 96 - ], - "6": [ - 111, - 112 - ], - "7": [ - 126, - 127 - ], - "8": [ - 142, - 143 - ], - "9": [ - 155, - 156, - 157 - ] - }, - "shared_input_operation_set_groups": 
{} -} \ No newline at end of file diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/resnet18.dot b/tests/torch2/data/fx/XNNPACKQuantizer/resnet18.dot deleted file mode 100644 index ac8cf95c2c1..00000000000 --- a/tests/torch2/data/fx/XNNPACKQuantizer/resnet18.dot +++ /dev/null @@ -1,385 +0,0 @@ -strict digraph { -"0 fc_bias" [id=0, type="get_attr"]; -"1 x" [id=1, type=input]; -"2 quantize_per_tensor_0" [id=2, type="quantize_per_tensor"]; -"3 dequantize_per_tensor_1" [id=3, type="dequantize_per_tensor"]; -"4 conv1_weight_bias" [id=4, type="get_attr"]; -"5 _frozen_param0" [id=5, type="get_attr"]; -"6 dequantize_per_tensor_2" [id=6, type="dequantize_per_tensor"]; -"7 conv2d" [id=7, type=conv2d]; -"8 relu_" [id=8, type="relu_"]; -"9 quantize_per_tensor_3" [id=9, type="quantize_per_tensor"]; -"10 dequantize_per_tensor_4" [id=10, type="dequantize_per_tensor"]; -"11 max_pool2d" [id=11, type="max_pool2d"]; -"12 quantize_per_tensor_5" [id=12, type="quantize_per_tensor"]; -"13 dequantize_per_tensor_6" [id=13, type="dequantize_per_tensor"]; -"14 dequantize_per_tensor_7" [id=14, type="dequantize_per_tensor"]; -"15 layer1_0_conv1_weight_bias" [id=15, type="get_attr"]; -"16 _frozen_param1" [id=16, type="get_attr"]; -"17 dequantize_per_tensor_8" [id=17, type="dequantize_per_tensor"]; -"18 conv2d_1" [id=18, type=conv2d]; -"19 relu__1" [id=19, type="relu_"]; -"20 quantize_per_tensor_9" [id=20, type="quantize_per_tensor"]; -"21 dequantize_per_tensor_10" [id=21, type="dequantize_per_tensor"]; -"22 layer1_0_conv2_weight_bias" [id=22, type="get_attr"]; -"23 _frozen_param2" [id=23, type="get_attr"]; -"24 dequantize_per_tensor_11" [id=24, type="dequantize_per_tensor"]; -"25 conv2d_2" [id=25, type=conv2d]; -"26 quantize_per_tensor_12" [id=26, type="quantize_per_tensor"]; -"27 dequantize_per_tensor_13" [id=27, type="dequantize_per_tensor"]; -"28 add_" [id=28, type="add_"]; -"29 relu__2" [id=29, type="relu_"]; -"30 quantize_per_tensor_14" [id=30, type="quantize_per_tensor"]; -"31 
dequantize_per_tensor_15" [id=31, type="dequantize_per_tensor"]; -"32 dequantize_per_tensor_16" [id=32, type="dequantize_per_tensor"]; -"33 layer1_1_conv1_weight_bias" [id=33, type="get_attr"]; -"34 _frozen_param3" [id=34, type="get_attr"]; -"35 dequantize_per_tensor_17" [id=35, type="dequantize_per_tensor"]; -"36 conv2d_3" [id=36, type=conv2d]; -"37 relu__3" [id=37, type="relu_"]; -"38 quantize_per_tensor_18" [id=38, type="quantize_per_tensor"]; -"39 dequantize_per_tensor_19" [id=39, type="dequantize_per_tensor"]; -"40 layer1_1_conv2_weight_bias" [id=40, type="get_attr"]; -"41 _frozen_param4" [id=41, type="get_attr"]; -"42 dequantize_per_tensor_20" [id=42, type="dequantize_per_tensor"]; -"43 conv2d_4" [id=43, type=conv2d]; -"44 quantize_per_tensor_21" [id=44, type="quantize_per_tensor"]; -"45 dequantize_per_tensor_22" [id=45, type="dequantize_per_tensor"]; -"46 add__1" [id=46, type="add_"]; -"47 relu__4" [id=47, type="relu_"]; -"48 quantize_per_tensor_23" [id=48, type="quantize_per_tensor"]; -"49 dequantize_per_tensor_24" [id=49, type="dequantize_per_tensor"]; -"50 dequantize_per_tensor_25" [id=50, type="dequantize_per_tensor"]; -"51 layer2_0_conv1_weight_bias" [id=51, type="get_attr"]; -"52 _frozen_param5" [id=52, type="get_attr"]; -"53 dequantize_per_tensor_26" [id=53, type="dequantize_per_tensor"]; -"54 conv2d_5" [id=54, type=conv2d]; -"55 relu__5" [id=55, type="relu_"]; -"56 quantize_per_tensor_27" [id=56, type="quantize_per_tensor"]; -"57 dequantize_per_tensor_28" [id=57, type="dequantize_per_tensor"]; -"58 layer2_0_conv2_weight_bias" [id=58, type="get_attr"]; -"59 _frozen_param6" [id=59, type="get_attr"]; -"60 dequantize_per_tensor_29" [id=60, type="dequantize_per_tensor"]; -"61 conv2d_6" [id=61, type=conv2d]; -"62 quantize_per_tensor_30" [id=62, type="quantize_per_tensor"]; -"63 dequantize_per_tensor_31" [id=63, type="dequantize_per_tensor"]; -"64 layer2_0_downsample_0_weight_bias" [id=64, type="get_attr"]; -"65 _frozen_param7" [id=65, type="get_attr"]; 
-"66 dequantize_per_tensor_32" [id=66, type="dequantize_per_tensor"]; -"67 conv2d_7" [id=67, type=conv2d]; -"68 quantize_per_tensor_33" [id=68, type="quantize_per_tensor"]; -"69 dequantize_per_tensor_34" [id=69, type="dequantize_per_tensor"]; -"70 add__2" [id=70, type="add_"]; -"71 relu__6" [id=71, type="relu_"]; -"72 quantize_per_tensor_35" [id=72, type="quantize_per_tensor"]; -"73 dequantize_per_tensor_36" [id=73, type="dequantize_per_tensor"]; -"74 dequantize_per_tensor_37" [id=74, type="dequantize_per_tensor"]; -"75 layer2_1_conv1_weight_bias" [id=75, type="get_attr"]; -"76 _frozen_param8" [id=76, type="get_attr"]; -"77 dequantize_per_tensor_38" [id=77, type="dequantize_per_tensor"]; -"78 conv2d_8" [id=78, type=conv2d]; -"79 relu__7" [id=79, type="relu_"]; -"80 quantize_per_tensor_39" [id=80, type="quantize_per_tensor"]; -"81 dequantize_per_tensor_40" [id=81, type="dequantize_per_tensor"]; -"82 layer2_1_conv2_weight_bias" [id=82, type="get_attr"]; -"83 _frozen_param9" [id=83, type="get_attr"]; -"84 dequantize_per_tensor_41" [id=84, type="dequantize_per_tensor"]; -"85 conv2d_9" [id=85, type=conv2d]; -"86 quantize_per_tensor_42" [id=86, type="quantize_per_tensor"]; -"87 dequantize_per_tensor_43" [id=87, type="dequantize_per_tensor"]; -"88 add__3" [id=88, type="add_"]; -"89 relu__8" [id=89, type="relu_"]; -"90 quantize_per_tensor_44" [id=90, type="quantize_per_tensor"]; -"91 dequantize_per_tensor_45" [id=91, type="dequantize_per_tensor"]; -"92 dequantize_per_tensor_46" [id=92, type="dequantize_per_tensor"]; -"93 layer3_0_conv1_weight_bias" [id=93, type="get_attr"]; -"94 _frozen_param10" [id=94, type="get_attr"]; -"95 dequantize_per_tensor_47" [id=95, type="dequantize_per_tensor"]; -"96 conv2d_10" [id=96, type=conv2d]; -"97 relu__9" [id=97, type="relu_"]; -"98 quantize_per_tensor_48" [id=98, type="quantize_per_tensor"]; -"99 dequantize_per_tensor_49" [id=99, type="dequantize_per_tensor"]; -"100 layer3_0_conv2_weight_bias" [id=100, type="get_attr"]; -"101 
_frozen_param11" [id=101, type="get_attr"]; -"102 dequantize_per_tensor_50" [id=102, type="dequantize_per_tensor"]; -"103 conv2d_11" [id=103, type=conv2d]; -"104 quantize_per_tensor_51" [id=104, type="quantize_per_tensor"]; -"105 dequantize_per_tensor_52" [id=105, type="dequantize_per_tensor"]; -"106 layer3_0_downsample_0_weight_bias" [id=106, type="get_attr"]; -"107 _frozen_param12" [id=107, type="get_attr"]; -"108 dequantize_per_tensor_53" [id=108, type="dequantize_per_tensor"]; -"109 conv2d_12" [id=109, type=conv2d]; -"110 quantize_per_tensor_54" [id=110, type="quantize_per_tensor"]; -"111 dequantize_per_tensor_55" [id=111, type="dequantize_per_tensor"]; -"112 add__4" [id=112, type="add_"]; -"113 relu__10" [id=113, type="relu_"]; -"114 quantize_per_tensor_56" [id=114, type="quantize_per_tensor"]; -"115 dequantize_per_tensor_57" [id=115, type="dequantize_per_tensor"]; -"116 dequantize_per_tensor_58" [id=116, type="dequantize_per_tensor"]; -"117 layer3_1_conv1_weight_bias" [id=117, type="get_attr"]; -"118 _frozen_param13" [id=118, type="get_attr"]; -"119 dequantize_per_tensor_59" [id=119, type="dequantize_per_tensor"]; -"120 conv2d_13" [id=120, type=conv2d]; -"121 relu__11" [id=121, type="relu_"]; -"122 quantize_per_tensor_60" [id=122, type="quantize_per_tensor"]; -"123 dequantize_per_tensor_61" [id=123, type="dequantize_per_tensor"]; -"124 layer3_1_conv2_weight_bias" [id=124, type="get_attr"]; -"125 _frozen_param14" [id=125, type="get_attr"]; -"126 dequantize_per_tensor_62" [id=126, type="dequantize_per_tensor"]; -"127 conv2d_14" [id=127, type=conv2d]; -"128 quantize_per_tensor_63" [id=128, type="quantize_per_tensor"]; -"129 dequantize_per_tensor_64" [id=129, type="dequantize_per_tensor"]; -"130 add__5" [id=130, type="add_"]; -"131 relu__12" [id=131, type="relu_"]; -"132 quantize_per_tensor_65" [id=132, type="quantize_per_tensor"]; -"133 dequantize_per_tensor_66" [id=133, type="dequantize_per_tensor"]; -"134 dequantize_per_tensor_67" [id=134, 
type="dequantize_per_tensor"]; -"135 layer4_0_conv1_weight_bias" [id=135, type="get_attr"]; -"136 _frozen_param15" [id=136, type="get_attr"]; -"137 dequantize_per_tensor_68" [id=137, type="dequantize_per_tensor"]; -"138 conv2d_15" [id=138, type=conv2d]; -"139 relu__13" [id=139, type="relu_"]; -"140 quantize_per_tensor_69" [id=140, type="quantize_per_tensor"]; -"141 dequantize_per_tensor_70" [id=141, type="dequantize_per_tensor"]; -"142 layer4_0_conv2_weight_bias" [id=142, type="get_attr"]; -"143 _frozen_param16" [id=143, type="get_attr"]; -"144 dequantize_per_tensor_71" [id=144, type="dequantize_per_tensor"]; -"145 conv2d_16" [id=145, type=conv2d]; -"146 quantize_per_tensor_72" [id=146, type="quantize_per_tensor"]; -"147 dequantize_per_tensor_73" [id=147, type="dequantize_per_tensor"]; -"148 layer4_0_downsample_0_weight_bias" [id=148, type="get_attr"]; -"149 _frozen_param17" [id=149, type="get_attr"]; -"150 dequantize_per_tensor_74" [id=150, type="dequantize_per_tensor"]; -"151 conv2d_17" [id=151, type=conv2d]; -"152 quantize_per_tensor_75" [id=152, type="quantize_per_tensor"]; -"153 dequantize_per_tensor_76" [id=153, type="dequantize_per_tensor"]; -"154 add__6" [id=154, type="add_"]; -"155 relu__14" [id=155, type="relu_"]; -"156 quantize_per_tensor_77" [id=156, type="quantize_per_tensor"]; -"157 dequantize_per_tensor_78" [id=157, type="dequantize_per_tensor"]; -"158 dequantize_per_tensor_79" [id=158, type="dequantize_per_tensor"]; -"159 layer4_1_conv1_weight_bias" [id=159, type="get_attr"]; -"160 _frozen_param18" [id=160, type="get_attr"]; -"161 dequantize_per_tensor_80" [id=161, type="dequantize_per_tensor"]; -"162 conv2d_18" [id=162, type=conv2d]; -"163 relu__15" [id=163, type="relu_"]; -"164 quantize_per_tensor_81" [id=164, type="quantize_per_tensor"]; -"165 dequantize_per_tensor_82" [id=165, type="dequantize_per_tensor"]; -"166 layer4_1_conv2_weight_bias" [id=166, type="get_attr"]; -"167 _frozen_param19" [id=167, type="get_attr"]; -"168 
dequantize_per_tensor_83" [id=168, type="dequantize_per_tensor"]; -"169 conv2d_19" [id=169, type=conv2d]; -"170 quantize_per_tensor_84" [id=170, type="quantize_per_tensor"]; -"171 dequantize_per_tensor_85" [id=171, type="dequantize_per_tensor"]; -"172 add__7" [id=172, type="add_"]; -"173 relu__16" [id=173, type="relu_"]; -"174 quantize_per_tensor_86" [id=174, type="quantize_per_tensor"]; -"175 dequantize_per_tensor_87" [id=175, type="dequantize_per_tensor"]; -"176 adaptive_avg_pool2d" [id=176, type="adaptive_avg_pool2d"]; -"177 quantize_per_tensor_88" [id=177, type="quantize_per_tensor"]; -"178 dequantize_per_tensor_89" [id=178, type="dequantize_per_tensor"]; -"179 flatten" [id=179, type=flatten]; -"180 quantize_per_tensor_90" [id=180, type="quantize_per_tensor"]; -"181 dequantize_per_tensor_91" [id=181, type="dequantize_per_tensor"]; -"182 _frozen_param20" [id=182, type="get_attr"]; -"183 dequantize_per_tensor_92" [id=183, type="dequantize_per_tensor"]; -"184 linear" [id=184, type=linear]; -"185 quantize_per_tensor_93" [id=185, type="quantize_per_tensor"]; -"186 dequantize_per_tensor_94" [id=186, type="dequantize_per_tensor"]; -"187 output" [id=187, type=output]; -"0 fc_bias" -> "184 linear" [style=solid, label="(1000,)"]; -"1 x" -> "2 quantize_per_tensor_0" [style=solid, label="(1, 3, 224, 224)"]; -"2 quantize_per_tensor_0" -> "3 dequantize_per_tensor_1" [style=solid, label="(1, 3, 224, 224)"]; -"3 dequantize_per_tensor_1" -> "7 conv2d" [style=solid, label="(1, 3, 224, 224)"]; -"4 conv1_weight_bias" -> "7 conv2d" [style=solid, label="(64,)"]; -"5 _frozen_param0" -> "6 dequantize_per_tensor_2" [style=solid, label="(64, 3, 7, 7)"]; -"6 dequantize_per_tensor_2" -> "7 conv2d" [style=solid, label="(64, 3, 7, 7)"]; -"7 conv2d" -> "8 relu_" [style=solid, label="(1, 64, 112, 112)"]; -"8 relu_" -> "9 quantize_per_tensor_3" [style=solid, label="(1, 64, 112, 112)"]; -"9 quantize_per_tensor_3" -> "10 dequantize_per_tensor_4" [style=solid, label="(1, 64, 112, 112)"]; -"10 
dequantize_per_tensor_4" -> "11 max_pool2d" [style=solid, label="(1, 64, 112, 112)"]; -"11 max_pool2d" -> "12 quantize_per_tensor_5" [style=solid, label="(1, 64, 56, 56)"]; -"12 quantize_per_tensor_5" -> "13 dequantize_per_tensor_6" [style=solid, label="(1, 64, 56, 56)"]; -"12 quantize_per_tensor_5" -> "14 dequantize_per_tensor_7" [style=solid, label="(1, 64, 56, 56)"]; -"13 dequantize_per_tensor_6" -> "28 add_" [style=solid, label="(1, 64, 56, 56)"]; -"14 dequantize_per_tensor_7" -> "18 conv2d_1" [style=solid, label="(1, 64, 56, 56)"]; -"15 layer1_0_conv1_weight_bias" -> "18 conv2d_1" [style=solid, label="(64,)"]; -"16 _frozen_param1" -> "17 dequantize_per_tensor_8" [style=solid, label="(64, 64, 3, 3)"]; -"17 dequantize_per_tensor_8" -> "18 conv2d_1" [style=solid, label="(64, 64, 3, 3)"]; -"18 conv2d_1" -> "19 relu__1" [style=solid, label="(1, 64, 56, 56)"]; -"19 relu__1" -> "20 quantize_per_tensor_9" [style=solid, label="(1, 64, 56, 56)"]; -"20 quantize_per_tensor_9" -> "21 dequantize_per_tensor_10" [style=solid, label="(1, 64, 56, 56)"]; -"21 dequantize_per_tensor_10" -> "25 conv2d_2" [style=solid, label="(1, 64, 56, 56)"]; -"22 layer1_0_conv2_weight_bias" -> "25 conv2d_2" [style=solid, label="(64,)"]; -"23 _frozen_param2" -> "24 dequantize_per_tensor_11" [style=solid, label="(64, 64, 3, 3)"]; -"24 dequantize_per_tensor_11" -> "25 conv2d_2" [style=solid, label="(64, 64, 3, 3)"]; -"25 conv2d_2" -> "26 quantize_per_tensor_12" [style=solid, label="(1, 64, 56, 56)"]; -"26 quantize_per_tensor_12" -> "27 dequantize_per_tensor_13" [style=solid, label="(1, 64, 56, 56)"]; -"27 dequantize_per_tensor_13" -> "28 add_" [style=solid, label="(1, 64, 56, 56)"]; -"28 add_" -> "29 relu__2" [style=solid, label="(1, 64, 56, 56)"]; -"29 relu__2" -> "30 quantize_per_tensor_14" [style=solid, label="(1, 64, 56, 56)"]; -"30 quantize_per_tensor_14" -> "31 dequantize_per_tensor_15" [style=solid, label="(1, 64, 56, 56)"]; -"30 quantize_per_tensor_14" -> "32 dequantize_per_tensor_16" 
[style=solid, label="(1, 64, 56, 56)"]; -"31 dequantize_per_tensor_15" -> "46 add__1" [style=solid, label="(1, 64, 56, 56)"]; -"32 dequantize_per_tensor_16" -> "36 conv2d_3" [style=solid, label="(1, 64, 56, 56)"]; -"33 layer1_1_conv1_weight_bias" -> "36 conv2d_3" [style=solid, label="(64,)"]; -"34 _frozen_param3" -> "35 dequantize_per_tensor_17" [style=solid, label="(64, 64, 3, 3)"]; -"35 dequantize_per_tensor_17" -> "36 conv2d_3" [style=solid, label="(64, 64, 3, 3)"]; -"36 conv2d_3" -> "37 relu__3" [style=solid, label="(1, 64, 56, 56)"]; -"37 relu__3" -> "38 quantize_per_tensor_18" [style=solid, label="(1, 64, 56, 56)"]; -"38 quantize_per_tensor_18" -> "39 dequantize_per_tensor_19" [style=solid, label="(1, 64, 56, 56)"]; -"39 dequantize_per_tensor_19" -> "43 conv2d_4" [style=solid, label="(1, 64, 56, 56)"]; -"40 layer1_1_conv2_weight_bias" -> "43 conv2d_4" [style=solid, label="(64,)"]; -"41 _frozen_param4" -> "42 dequantize_per_tensor_20" [style=solid, label="(64, 64, 3, 3)"]; -"42 dequantize_per_tensor_20" -> "43 conv2d_4" [style=solid, label="(64, 64, 3, 3)"]; -"43 conv2d_4" -> "44 quantize_per_tensor_21" [style=solid, label="(1, 64, 56, 56)"]; -"44 quantize_per_tensor_21" -> "45 dequantize_per_tensor_22" [style=solid, label="(1, 64, 56, 56)"]; -"45 dequantize_per_tensor_22" -> "46 add__1" [style=solid, label="(1, 64, 56, 56)"]; -"46 add__1" -> "47 relu__4" [style=solid, label="(1, 64, 56, 56)"]; -"47 relu__4" -> "48 quantize_per_tensor_23" [style=solid, label="(1, 64, 56, 56)"]; -"48 quantize_per_tensor_23" -> "49 dequantize_per_tensor_24" [style=solid, label="(1, 64, 56, 56)"]; -"48 quantize_per_tensor_23" -> "50 dequantize_per_tensor_25" [style=solid, label="(1, 64, 56, 56)"]; -"49 dequantize_per_tensor_24" -> "67 conv2d_7" [style=solid, label="(1, 64, 56, 56)"]; -"50 dequantize_per_tensor_25" -> "54 conv2d_5" [style=solid, label="(1, 64, 56, 56)"]; -"51 layer2_0_conv1_weight_bias" -> "54 conv2d_5" [style=solid, label="(128,)"]; -"52 _frozen_param5" -> "53 
dequantize_per_tensor_26" [style=solid, label="(128, 64, 3, 3)"]; -"53 dequantize_per_tensor_26" -> "54 conv2d_5" [style=solid, label="(128, 64, 3, 3)"]; -"54 conv2d_5" -> "55 relu__5" [style=solid, label="(1, 128, 28, 28)"]; -"55 relu__5" -> "56 quantize_per_tensor_27" [style=solid, label="(1, 128, 28, 28)"]; -"56 quantize_per_tensor_27" -> "57 dequantize_per_tensor_28" [style=solid, label="(1, 128, 28, 28)"]; -"57 dequantize_per_tensor_28" -> "61 conv2d_6" [style=solid, label="(1, 128, 28, 28)"]; -"58 layer2_0_conv2_weight_bias" -> "61 conv2d_6" [style=solid, label="(128,)"]; -"59 _frozen_param6" -> "60 dequantize_per_tensor_29" [style=solid, label="(128, 128, 3, 3)"]; -"60 dequantize_per_tensor_29" -> "61 conv2d_6" [style=solid, label="(128, 128, 3, 3)"]; -"61 conv2d_6" -> "62 quantize_per_tensor_30" [style=solid, label="(1, 128, 28, 28)"]; -"62 quantize_per_tensor_30" -> "63 dequantize_per_tensor_31" [style=solid, label="(1, 128, 28, 28)"]; -"63 dequantize_per_tensor_31" -> "70 add__2" [style=solid, label="(1, 128, 28, 28)"]; -"64 layer2_0_downsample_0_weight_bias" -> "67 conv2d_7" [style=solid, label="(128,)"]; -"65 _frozen_param7" -> "66 dequantize_per_tensor_32" [style=solid, label="(128, 64, 1, 1)"]; -"66 dequantize_per_tensor_32" -> "67 conv2d_7" [style=solid, label="(128, 64, 1, 1)"]; -"67 conv2d_7" -> "68 quantize_per_tensor_33" [style=solid, label="(1, 128, 28, 28)"]; -"68 quantize_per_tensor_33" -> "69 dequantize_per_tensor_34" [style=solid, label="(1, 128, 28, 28)"]; -"69 dequantize_per_tensor_34" -> "70 add__2" [style=solid, label="(1, 128, 28, 28)"]; -"70 add__2" -> "71 relu__6" [style=solid, label="(1, 128, 28, 28)"]; -"71 relu__6" -> "72 quantize_per_tensor_35" [style=solid, label="(1, 128, 28, 28)"]; -"72 quantize_per_tensor_35" -> "73 dequantize_per_tensor_36" [style=solid, label="(1, 128, 28, 28)"]; -"72 quantize_per_tensor_35" -> "74 dequantize_per_tensor_37" [style=solid, label="(1, 128, 28, 28)"]; -"73 dequantize_per_tensor_36" -> "88 
add__3" [style=solid, label="(1, 128, 28, 28)"]; -"74 dequantize_per_tensor_37" -> "78 conv2d_8" [style=solid, label="(1, 128, 28, 28)"]; -"75 layer2_1_conv1_weight_bias" -> "78 conv2d_8" [style=solid, label="(128,)"]; -"76 _frozen_param8" -> "77 dequantize_per_tensor_38" [style=solid, label="(128, 128, 3, 3)"]; -"77 dequantize_per_tensor_38" -> "78 conv2d_8" [style=solid, label="(128, 128, 3, 3)"]; -"78 conv2d_8" -> "79 relu__7" [style=solid, label="(1, 128, 28, 28)"]; -"79 relu__7" -> "80 quantize_per_tensor_39" [style=solid, label="(1, 128, 28, 28)"]; -"80 quantize_per_tensor_39" -> "81 dequantize_per_tensor_40" [style=solid, label="(1, 128, 28, 28)"]; -"81 dequantize_per_tensor_40" -> "85 conv2d_9" [style=solid, label="(1, 128, 28, 28)"]; -"82 layer2_1_conv2_weight_bias" -> "85 conv2d_9" [style=solid, label="(128,)"]; -"83 _frozen_param9" -> "84 dequantize_per_tensor_41" [style=solid, label="(128, 128, 3, 3)"]; -"84 dequantize_per_tensor_41" -> "85 conv2d_9" [style=solid, label="(128, 128, 3, 3)"]; -"85 conv2d_9" -> "86 quantize_per_tensor_42" [style=solid, label="(1, 128, 28, 28)"]; -"86 quantize_per_tensor_42" -> "87 dequantize_per_tensor_43" [style=solid, label="(1, 128, 28, 28)"]; -"87 dequantize_per_tensor_43" -> "88 add__3" [style=solid, label="(1, 128, 28, 28)"]; -"88 add__3" -> "89 relu__8" [style=solid, label="(1, 128, 28, 28)"]; -"89 relu__8" -> "90 quantize_per_tensor_44" [style=solid, label="(1, 128, 28, 28)"]; -"90 quantize_per_tensor_44" -> "91 dequantize_per_tensor_45" [style=solid, label="(1, 128, 28, 28)"]; -"90 quantize_per_tensor_44" -> "92 dequantize_per_tensor_46" [style=solid, label="(1, 128, 28, 28)"]; -"91 dequantize_per_tensor_45" -> "109 conv2d_12" [style=solid, label="(1, 128, 28, 28)"]; -"92 dequantize_per_tensor_46" -> "96 conv2d_10" [style=solid, label="(1, 128, 28, 28)"]; -"93 layer3_0_conv1_weight_bias" -> "96 conv2d_10" [style=solid, label="(256,)"]; -"94 _frozen_param10" -> "95 dequantize_per_tensor_47" [style=solid, 
label="(256, 128, 3, 3)"]; -"95 dequantize_per_tensor_47" -> "96 conv2d_10" [style=solid, label="(256, 128, 3, 3)"]; -"96 conv2d_10" -> "97 relu__9" [style=solid, label="(1, 256, 14, 14)"]; -"97 relu__9" -> "98 quantize_per_tensor_48" [style=solid, label="(1, 256, 14, 14)"]; -"98 quantize_per_tensor_48" -> "99 dequantize_per_tensor_49" [style=solid, label="(1, 256, 14, 14)"]; -"99 dequantize_per_tensor_49" -> "103 conv2d_11" [style=solid, label="(1, 256, 14, 14)"]; -"100 layer3_0_conv2_weight_bias" -> "103 conv2d_11" [style=solid, label="(256,)"]; -"101 _frozen_param11" -> "102 dequantize_per_tensor_50" [style=solid, label="(256, 256, 3, 3)"]; -"102 dequantize_per_tensor_50" -> "103 conv2d_11" [style=solid, label="(256, 256, 3, 3)"]; -"103 conv2d_11" -> "104 quantize_per_tensor_51" [style=solid, label="(1, 256, 14, 14)"]; -"104 quantize_per_tensor_51" -> "105 dequantize_per_tensor_52" [style=solid, label="(1, 256, 14, 14)"]; -"105 dequantize_per_tensor_52" -> "112 add__4" [style=solid, label="(1, 256, 14, 14)"]; -"106 layer3_0_downsample_0_weight_bias" -> "109 conv2d_12" [style=solid, label="(256,)"]; -"107 _frozen_param12" -> "108 dequantize_per_tensor_53" [style=solid, label="(256, 128, 1, 1)"]; -"108 dequantize_per_tensor_53" -> "109 conv2d_12" [style=solid, label="(256, 128, 1, 1)"]; -"109 conv2d_12" -> "110 quantize_per_tensor_54" [style=solid, label="(1, 256, 14, 14)"]; -"110 quantize_per_tensor_54" -> "111 dequantize_per_tensor_55" [style=solid, label="(1, 256, 14, 14)"]; -"111 dequantize_per_tensor_55" -> "112 add__4" [style=solid, label="(1, 256, 14, 14)"]; -"112 add__4" -> "113 relu__10" [style=solid, label="(1, 256, 14, 14)"]; -"113 relu__10" -> "114 quantize_per_tensor_56" [style=solid, label="(1, 256, 14, 14)"]; -"114 quantize_per_tensor_56" -> "115 dequantize_per_tensor_57" [style=solid, label="(1, 256, 14, 14)"]; -"114 quantize_per_tensor_56" -> "116 dequantize_per_tensor_58" [style=solid, label="(1, 256, 14, 14)"]; -"115 dequantize_per_tensor_57" -> 
"130 add__5" [style=solid, label="(1, 256, 14, 14)"]; -"116 dequantize_per_tensor_58" -> "120 conv2d_13" [style=solid, label="(1, 256, 14, 14)"]; -"117 layer3_1_conv1_weight_bias" -> "120 conv2d_13" [style=solid, label="(256,)"]; -"118 _frozen_param13" -> "119 dequantize_per_tensor_59" [style=solid, label="(256, 256, 3, 3)"]; -"119 dequantize_per_tensor_59" -> "120 conv2d_13" [style=solid, label="(256, 256, 3, 3)"]; -"120 conv2d_13" -> "121 relu__11" [style=solid, label="(1, 256, 14, 14)"]; -"121 relu__11" -> "122 quantize_per_tensor_60" [style=solid, label="(1, 256, 14, 14)"]; -"122 quantize_per_tensor_60" -> "123 dequantize_per_tensor_61" [style=solid, label="(1, 256, 14, 14)"]; -"123 dequantize_per_tensor_61" -> "127 conv2d_14" [style=solid, label="(1, 256, 14, 14)"]; -"124 layer3_1_conv2_weight_bias" -> "127 conv2d_14" [style=solid, label="(256,)"]; -"125 _frozen_param14" -> "126 dequantize_per_tensor_62" [style=solid, label="(256, 256, 3, 3)"]; -"126 dequantize_per_tensor_62" -> "127 conv2d_14" [style=solid, label="(256, 256, 3, 3)"]; -"127 conv2d_14" -> "128 quantize_per_tensor_63" [style=solid, label="(1, 256, 14, 14)"]; -"128 quantize_per_tensor_63" -> "129 dequantize_per_tensor_64" [style=solid, label="(1, 256, 14, 14)"]; -"129 dequantize_per_tensor_64" -> "130 add__5" [style=solid, label="(1, 256, 14, 14)"]; -"130 add__5" -> "131 relu__12" [style=solid, label="(1, 256, 14, 14)"]; -"131 relu__12" -> "132 quantize_per_tensor_65" [style=solid, label="(1, 256, 14, 14)"]; -"132 quantize_per_tensor_65" -> "133 dequantize_per_tensor_66" [style=solid, label="(1, 256, 14, 14)"]; -"132 quantize_per_tensor_65" -> "134 dequantize_per_tensor_67" [style=solid, label="(1, 256, 14, 14)"]; -"133 dequantize_per_tensor_66" -> "151 conv2d_17" [style=solid, label="(1, 256, 14, 14)"]; -"134 dequantize_per_tensor_67" -> "138 conv2d_15" [style=solid, label="(1, 256, 14, 14)"]; -"135 layer4_0_conv1_weight_bias" -> "138 conv2d_15" [style=solid, label="(512,)"]; -"136 
_frozen_param15" -> "137 dequantize_per_tensor_68" [style=solid, label="(512, 256, 3, 3)"]; -"137 dequantize_per_tensor_68" -> "138 conv2d_15" [style=solid, label="(512, 256, 3, 3)"]; -"138 conv2d_15" -> "139 relu__13" [style=solid, label="(1, 512, 7, 7)"]; -"139 relu__13" -> "140 quantize_per_tensor_69" [style=solid, label="(1, 512, 7, 7)"]; -"140 quantize_per_tensor_69" -> "141 dequantize_per_tensor_70" [style=solid, label="(1, 512, 7, 7)"]; -"141 dequantize_per_tensor_70" -> "145 conv2d_16" [style=solid, label="(1, 512, 7, 7)"]; -"142 layer4_0_conv2_weight_bias" -> "145 conv2d_16" [style=solid, label="(512,)"]; -"143 _frozen_param16" -> "144 dequantize_per_tensor_71" [style=solid, label="(512, 512, 3, 3)"]; -"144 dequantize_per_tensor_71" -> "145 conv2d_16" [style=solid, label="(512, 512, 3, 3)"]; -"145 conv2d_16" -> "146 quantize_per_tensor_72" [style=solid, label="(1, 512, 7, 7)"]; -"146 quantize_per_tensor_72" -> "147 dequantize_per_tensor_73" [style=solid, label="(1, 512, 7, 7)"]; -"147 dequantize_per_tensor_73" -> "154 add__6" [style=solid, label="(1, 512, 7, 7)"]; -"148 layer4_0_downsample_0_weight_bias" -> "151 conv2d_17" [style=solid, label="(512,)"]; -"149 _frozen_param17" -> "150 dequantize_per_tensor_74" [style=solid, label="(512, 256, 1, 1)"]; -"150 dequantize_per_tensor_74" -> "151 conv2d_17" [style=solid, label="(512, 256, 1, 1)"]; -"151 conv2d_17" -> "152 quantize_per_tensor_75" [style=solid, label="(1, 512, 7, 7)"]; -"152 quantize_per_tensor_75" -> "153 dequantize_per_tensor_76" [style=solid, label="(1, 512, 7, 7)"]; -"153 dequantize_per_tensor_76" -> "154 add__6" [style=solid, label="(1, 512, 7, 7)"]; -"154 add__6" -> "155 relu__14" [style=solid, label="(1, 512, 7, 7)"]; -"155 relu__14" -> "156 quantize_per_tensor_77" [style=solid, label="(1, 512, 7, 7)"]; -"156 quantize_per_tensor_77" -> "157 dequantize_per_tensor_78" [style=solid, label="(1, 512, 7, 7)"]; -"156 quantize_per_tensor_77" -> "158 dequantize_per_tensor_79" [style=solid, label="(1, 
512, 7, 7)"]; -"157 dequantize_per_tensor_78" -> "172 add__7" [style=solid, label="(1, 512, 7, 7)"]; -"158 dequantize_per_tensor_79" -> "162 conv2d_18" [style=solid, label="(1, 512, 7, 7)"]; -"159 layer4_1_conv1_weight_bias" -> "162 conv2d_18" [style=solid, label="(512,)"]; -"160 _frozen_param18" -> "161 dequantize_per_tensor_80" [style=solid, label="(512, 512, 3, 3)"]; -"161 dequantize_per_tensor_80" -> "162 conv2d_18" [style=solid, label="(512, 512, 3, 3)"]; -"162 conv2d_18" -> "163 relu__15" [style=solid, label="(1, 512, 7, 7)"]; -"163 relu__15" -> "164 quantize_per_tensor_81" [style=solid, label="(1, 512, 7, 7)"]; -"164 quantize_per_tensor_81" -> "165 dequantize_per_tensor_82" [style=solid, label="(1, 512, 7, 7)"]; -"165 dequantize_per_tensor_82" -> "169 conv2d_19" [style=solid, label="(1, 512, 7, 7)"]; -"166 layer4_1_conv2_weight_bias" -> "169 conv2d_19" [style=solid, label="(512,)"]; -"167 _frozen_param19" -> "168 dequantize_per_tensor_83" [style=solid, label="(512, 512, 3, 3)"]; -"168 dequantize_per_tensor_83" -> "169 conv2d_19" [style=solid, label="(512, 512, 3, 3)"]; -"169 conv2d_19" -> "170 quantize_per_tensor_84" [style=solid, label="(1, 512, 7, 7)"]; -"170 quantize_per_tensor_84" -> "171 dequantize_per_tensor_85" [style=solid, label="(1, 512, 7, 7)"]; -"171 dequantize_per_tensor_85" -> "172 add__7" [style=solid, label="(1, 512, 7, 7)"]; -"172 add__7" -> "173 relu__16" [style=solid, label="(1, 512, 7, 7)"]; -"173 relu__16" -> "174 quantize_per_tensor_86" [style=solid, label="(1, 512, 7, 7)"]; -"174 quantize_per_tensor_86" -> "175 dequantize_per_tensor_87" [style=solid, label="(1, 512, 7, 7)"]; -"175 dequantize_per_tensor_87" -> "176 adaptive_avg_pool2d" [style=solid, label="(1, 512, 7, 7)"]; -"176 adaptive_avg_pool2d" -> "177 quantize_per_tensor_88" [style=solid, label="(1, 512, 1, 1)"]; -"177 quantize_per_tensor_88" -> "178 dequantize_per_tensor_89" [style=solid, label="(1, 512, 1, 1)"]; -"178 dequantize_per_tensor_89" -> "179 flatten" [style=solid, 
label="(1, 512, 1, 1)"]; -"179 flatten" -> "180 quantize_per_tensor_90" [style=solid, label="(1, 512)"]; -"180 quantize_per_tensor_90" -> "181 dequantize_per_tensor_91" [style=solid, label="(1, 512)"]; -"181 dequantize_per_tensor_91" -> "184 linear" [style=solid, label="(1, 512)"]; -"182 _frozen_param20" -> "183 dequantize_per_tensor_92" [style=solid, label="(1000, 512)"]; -"183 dequantize_per_tensor_92" -> "184 linear" [style=solid, label="(1000, 512)"]; -"184 linear" -> "185 quantize_per_tensor_93" [style=solid, label="(1, 1000)"]; -"185 quantize_per_tensor_93" -> "186 dequantize_per_tensor_94" [style=solid, label="(1, 1000)"]; -"186 dequantize_per_tensor_94" -> "187 output" [style=solid, label="(1, 1000)"]; -} diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/resnet18_ref_qconfig.json b/tests/torch2/data/fx/XNNPACKQuantizer/resnet18_ref_qconfig.json deleted file mode 100644 index c9fd49c575d..00000000000 --- a/tests/torch2/data/fx/XNNPACKQuantizer/resnet18_ref_qconfig.json +++ /dev/null @@ -1,424 +0,0 @@ -{ - "quantization_points": { - "('conv2d',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add_', 'conv2d_1')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('max_pool2d',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_1',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_2',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add_',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add__1', 'conv2d_3')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_3',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_4',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_5', 'conv2d_7')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('conv2d_5',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_6',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_7',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__3', 'conv2d_8')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_8',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_9',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, 
- "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_10', 'conv2d_12')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_10',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_11',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_12',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__5', 'conv2d_13')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_13',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_14',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_14',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, 
- "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_15', 'conv2d_17')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_15',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_16',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_16',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_17',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__7', 'conv2d_18')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_18',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - 
}, - "('conv2d_19',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_19',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('add__7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('adaptive_avg_pool2d',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('flatten',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('output',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - } - }, - "unified_scale_groups": { - "0": [ - 2, - 3 - ], - "1": [ - 49, - 50, - 51 - ] - }, - "shared_input_operation_set_groups": {} -} \ No newline at end of file diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/swin_v2_t.dot b/tests/torch2/data/fx/XNNPACKQuantizer/swin_v2_t.dot deleted file mode 100644 index 1a459fe5c47..00000000000 
--- a/tests/torch2/data/fx/XNNPACKQuantizer/swin_v2_t.dot +++ /dev/null @@ -1,3906 +0,0 @@ -strict digraph { -"0 features_1_0_attn_qkv_bias" [id=0, type="get_attr"]; -"1 features_1_0_attn_proj_bias" [id=1, type="get_attr"]; -"2 features_1_1_attn_qkv_bias" [id=2, type="get_attr"]; -"3 features_1_1_attn_proj_bias" [id=3, type="get_attr"]; -"4 features_3_0_attn_qkv_bias" [id=4, type="get_attr"]; -"5 features_3_0_attn_proj_bias" [id=5, type="get_attr"]; -"6 features_3_1_attn_qkv_bias" [id=6, type="get_attr"]; -"7 features_3_1_attn_proj_bias" [id=7, type="get_attr"]; -"8 features_5_0_attn_qkv_bias" [id=8, type="get_attr"]; -"9 features_5_0_attn_proj_bias" [id=9, type="get_attr"]; -"10 features_5_1_attn_qkv_bias" [id=10, type="get_attr"]; -"11 features_5_1_attn_proj_bias" [id=11, type="get_attr"]; -"12 features_5_2_attn_qkv_bias" [id=12, type="get_attr"]; -"13 features_5_2_attn_proj_bias" [id=13, type="get_attr"]; -"14 features_5_3_attn_qkv_bias" [id=14, type="get_attr"]; -"15 features_5_3_attn_proj_bias" [id=15, type="get_attr"]; -"16 features_5_4_attn_qkv_bias" [id=16, type="get_attr"]; -"17 features_5_4_attn_proj_bias" [id=17, type="get_attr"]; -"18 features_5_5_attn_qkv_bias" [id=18, type="get_attr"]; -"19 features_5_5_attn_proj_bias" [id=19, type="get_attr"]; -"20 features_7_0_attn_qkv_bias" [id=20, type="get_attr"]; -"21 features_7_0_attn_proj_bias" [id=21, type="get_attr"]; -"22 features_7_1_attn_qkv_bias" [id=22, type="get_attr"]; -"23 features_7_1_attn_proj_bias" [id=23, type="get_attr"]; -"24 features_0_0_bias" [id=24, type="get_attr"]; -"25 features_0_2_weight" [id=25, type="get_attr"]; -"26 features_0_2_bias" [id=26, type="get_attr"]; -"27 features_1_0_attn_cpb_mlp_0_bias" [id=27, type="get_attr"]; -"28 features_1_0_norm1_weight" [id=28, type="get_attr"]; -"29 features_1_0_norm1_bias" [id=29, type="get_attr"]; -"30 features_1_0_mlp_0_bias" [id=30, type="get_attr"]; -"31 features_1_0_mlp_3_bias" [id=31, type="get_attr"]; -"32 features_1_0_norm2_weight" [id=32, 
type="get_attr"]; -"33 features_1_0_norm2_bias" [id=33, type="get_attr"]; -"34 features_1_1_attn_cpb_mlp_0_bias" [id=34, type="get_attr"]; -"35 features_1_1_norm1_weight" [id=35, type="get_attr"]; -"36 features_1_1_norm1_bias" [id=36, type="get_attr"]; -"37 features_1_1_mlp_0_bias" [id=37, type="get_attr"]; -"38 features_1_1_mlp_3_bias" [id=38, type="get_attr"]; -"39 features_1_1_norm2_weight" [id=39, type="get_attr"]; -"40 features_1_1_norm2_bias" [id=40, type="get_attr"]; -"41 features_2_norm_weight" [id=41, type="get_attr"]; -"42 features_2_norm_bias" [id=42, type="get_attr"]; -"43 features_3_0_attn_cpb_mlp_0_bias" [id=43, type="get_attr"]; -"44 features_3_0_norm1_weight" [id=44, type="get_attr"]; -"45 features_3_0_norm1_bias" [id=45, type="get_attr"]; -"46 features_3_0_mlp_0_bias" [id=46, type="get_attr"]; -"47 features_3_0_mlp_3_bias" [id=47, type="get_attr"]; -"48 features_3_0_norm2_weight" [id=48, type="get_attr"]; -"49 features_3_0_norm2_bias" [id=49, type="get_attr"]; -"50 features_3_1_attn_cpb_mlp_0_bias" [id=50, type="get_attr"]; -"51 features_3_1_norm1_weight" [id=51, type="get_attr"]; -"52 features_3_1_norm1_bias" [id=52, type="get_attr"]; -"53 features_3_1_mlp_0_bias" [id=53, type="get_attr"]; -"54 features_3_1_mlp_3_bias" [id=54, type="get_attr"]; -"55 features_3_1_norm2_weight" [id=55, type="get_attr"]; -"56 features_3_1_norm2_bias" [id=56, type="get_attr"]; -"57 features_4_norm_weight" [id=57, type="get_attr"]; -"58 features_4_norm_bias" [id=58, type="get_attr"]; -"59 features_5_0_attn_cpb_mlp_0_bias" [id=59, type="get_attr"]; -"60 features_5_0_norm1_weight" [id=60, type="get_attr"]; -"61 features_5_0_norm1_bias" [id=61, type="get_attr"]; -"62 features_5_0_mlp_0_bias" [id=62, type="get_attr"]; -"63 features_5_0_mlp_3_bias" [id=63, type="get_attr"]; -"64 features_5_0_norm2_weight" [id=64, type="get_attr"]; -"65 features_5_0_norm2_bias" [id=65, type="get_attr"]; -"66 features_5_1_attn_cpb_mlp_0_bias" [id=66, type="get_attr"]; -"67 
features_5_1_norm1_weight" [id=67, type="get_attr"]; -"68 features_5_1_norm1_bias" [id=68, type="get_attr"]; -"69 features_5_1_mlp_0_bias" [id=69, type="get_attr"]; -"70 features_5_1_mlp_3_bias" [id=70, type="get_attr"]; -"71 features_5_1_norm2_weight" [id=71, type="get_attr"]; -"72 features_5_1_norm2_bias" [id=72, type="get_attr"]; -"73 features_5_2_attn_cpb_mlp_0_bias" [id=73, type="get_attr"]; -"74 features_5_2_norm1_weight" [id=74, type="get_attr"]; -"75 features_5_2_norm1_bias" [id=75, type="get_attr"]; -"76 features_5_2_mlp_0_bias" [id=76, type="get_attr"]; -"77 features_5_2_mlp_3_bias" [id=77, type="get_attr"]; -"78 features_5_2_norm2_weight" [id=78, type="get_attr"]; -"79 features_5_2_norm2_bias" [id=79, type="get_attr"]; -"80 features_5_3_attn_cpb_mlp_0_bias" [id=80, type="get_attr"]; -"81 features_5_3_norm1_weight" [id=81, type="get_attr"]; -"82 features_5_3_norm1_bias" [id=82, type="get_attr"]; -"83 features_5_3_mlp_0_bias" [id=83, type="get_attr"]; -"84 features_5_3_mlp_3_bias" [id=84, type="get_attr"]; -"85 features_5_3_norm2_weight" [id=85, type="get_attr"]; -"86 features_5_3_norm2_bias" [id=86, type="get_attr"]; -"87 features_5_4_attn_cpb_mlp_0_bias" [id=87, type="get_attr"]; -"88 features_5_4_norm1_weight" [id=88, type="get_attr"]; -"89 features_5_4_norm1_bias" [id=89, type="get_attr"]; -"90 features_5_4_mlp_0_bias" [id=90, type="get_attr"]; -"91 features_5_4_mlp_3_bias" [id=91, type="get_attr"]; -"92 features_5_4_norm2_weight" [id=92, type="get_attr"]; -"93 features_5_4_norm2_bias" [id=93, type="get_attr"]; -"94 features_5_5_attn_cpb_mlp_0_bias" [id=94, type="get_attr"]; -"95 features_5_5_norm1_weight" [id=95, type="get_attr"]; -"96 features_5_5_norm1_bias" [id=96, type="get_attr"]; -"97 features_5_5_mlp_0_bias" [id=97, type="get_attr"]; -"98 features_5_5_mlp_3_bias" [id=98, type="get_attr"]; -"99 features_5_5_norm2_weight" [id=99, type="get_attr"]; -"100 features_5_5_norm2_bias" [id=100, type="get_attr"]; -"101 features_6_norm_weight" [id=101, 
type="get_attr"]; -"102 features_6_norm_bias" [id=102, type="get_attr"]; -"103 features_7_0_attn_cpb_mlp_0_bias" [id=103, type="get_attr"]; -"104 features_7_0_norm1_weight" [id=104, type="get_attr"]; -"105 features_7_0_norm1_bias" [id=105, type="get_attr"]; -"106 features_7_0_mlp_0_bias" [id=106, type="get_attr"]; -"107 features_7_0_mlp_3_bias" [id=107, type="get_attr"]; -"108 features_7_0_norm2_weight" [id=108, type="get_attr"]; -"109 features_7_0_norm2_bias" [id=109, type="get_attr"]; -"110 features_7_1_attn_cpb_mlp_0_bias" [id=110, type="get_attr"]; -"111 features_7_1_norm1_weight" [id=111, type="get_attr"]; -"112 features_7_1_norm1_bias" [id=112, type="get_attr"]; -"113 features_7_1_mlp_0_bias" [id=113, type="get_attr"]; -"114 features_7_1_mlp_3_bias" [id=114, type="get_attr"]; -"115 features_7_1_norm2_weight" [id=115, type="get_attr"]; -"116 features_7_1_norm2_bias" [id=116, type="get_attr"]; -"117 norm_weight" [id=117, type="get_attr"]; -"118 norm_bias" [id=118, type="get_attr"]; -"119 head_bias" [id=119, type="get_attr"]; -"120 features_1_0_attn_relative_position_index" [id=120, type="get_attr"]; -"121 features_1_1_attn_relative_position_index" [id=121, type="get_attr"]; -"122 features_3_0_attn_relative_position_index" [id=122, type="get_attr"]; -"123 features_3_1_attn_relative_position_index" [id=123, type="get_attr"]; -"124 features_5_0_attn_relative_position_index" [id=124, type="get_attr"]; -"125 features_5_1_attn_relative_position_index" [id=125, type="get_attr"]; -"126 features_5_2_attn_relative_position_index" [id=126, type="get_attr"]; -"127 features_5_3_attn_relative_position_index" [id=127, type="get_attr"]; -"128 features_5_4_attn_relative_position_index" [id=128, type="get_attr"]; -"129 features_5_5_attn_relative_position_index" [id=129, type="get_attr"]; -"130 features_7_0_attn_relative_position_index" [id=130, type="get_attr"]; -"131 features_7_1_attn_relative_position_index" [id=131, type="get_attr"]; -"132 x" [id=132, type=input]; -"133 
quantize_per_tensor_0" [id=133, type="quantize_per_tensor"]; -"134 dequantize_per_tensor_1" [id=134, type="dequantize_per_tensor"]; -"135 _frozen_param0" [id=135, type="get_attr"]; -"136 dequantize_per_tensor_2" [id=136, type="dequantize_per_tensor"]; -"137 conv2d" [id=137, type=conv2d]; -"138 quantize_per_tensor_3" [id=138, type="quantize_per_tensor"]; -"139 dequantize_per_tensor_4" [id=139, type="dequantize_per_tensor"]; -"140 permute" [id=140, type=permute]; -"141 quantize_per_tensor_5" [id=141, type="quantize_per_tensor"]; -"142 dequantize_per_tensor_6" [id=142, type="dequantize_per_tensor"]; -"143 layer_norm" [id=143, type="layer_norm"]; -"144 _frozen_param1" [id=144, type="get_attr"]; -"145 dequantize_per_tensor_7" [id=145, type="dequantize_per_tensor"]; -"146 _frozen_param2" [id=146, type="get_attr"]; -"147 dequantize_per_tensor_8" [id=147, type="dequantize_per_tensor"]; -"148 linear" [id=148, type=linear]; -"149 relu_" [id=149, type="relu_"]; -"150 quantize_per_tensor_9" [id=150, type="quantize_per_tensor"]; -"151 dequantize_per_tensor_10" [id=151, type="dequantize_per_tensor"]; -"152 relu__0_0_nncf_smooth_quant_0" [id=152, type="call_module"]; -"153 quantize_per_tensor_11" [id=153, type="quantize_per_tensor"]; -"154 dequantize_per_tensor_12" [id=154, type="dequantize_per_tensor"]; -"155 _frozen_param3" [id=155, type="get_attr"]; -"156 dequantize_per_tensor_13" [id=156, type="dequantize_per_tensor"]; -"157 linear_1" [id=157, type=linear]; -"158 quantize_per_tensor_14" [id=158, type="quantize_per_tensor"]; -"159 dequantize_per_tensor_15" [id=159, type="dequantize_per_tensor"]; -"160 view" [id=160, type=view]; -"161 quantize_per_tensor_16" [id=161, type="quantize_per_tensor"]; -"162 dequantize_per_tensor_17" [id=162, type="dequantize_per_tensor"]; -"163 index" [id=163, type=index]; -"164 view_1" [id=164, type=view]; -"165 permute_1" [id=165, type=permute]; -"166 contiguous" [id=166, type=contiguous]; -"167 unsqueeze" [id=167, type=unsqueeze]; -"168 sigmoid" 
[id=168, type=sigmoid]; -"169 quantize_per_tensor_18" [id=169, type="quantize_per_tensor"]; -"170 dequantize_per_tensor_19" [id=170, type="dequantize_per_tensor"]; -"171 _frozen_param4" [id=171, type="get_attr"]; -"172 dequantize_per_tensor_20" [id=172, type="dequantize_per_tensor"]; -"173 mul" [id=173, type=mul]; -"174 quantize_per_tensor_21" [id=174, type="quantize_per_tensor"]; -"175 dequantize_per_tensor_22" [id=175, type="dequantize_per_tensor"]; -"176 pad" [id=176, type=pad]; -"177 view_2" [id=177, type=view]; -"178 permute_2" [id=178, type=permute]; -"179 reshape" [id=179, type=reshape]; -"180 clone" [id=180, type=clone]; -"181 reshape_0_0_nncf_smooth_quant_0" [id=181, type="call_module"]; -"182 quantize_per_tensor_23" [id=182, type="quantize_per_tensor"]; -"183 dequantize_per_tensor_24" [id=183, type="dequantize_per_tensor"]; -"184 _frozen_param5" [id=184, type="get_attr"]; -"185 dequantize_per_tensor_25" [id=185, type="dequantize_per_tensor"]; -"186 linear_2" [id=186, type=linear]; -"187 quantize_per_tensor_26" [id=187, type="quantize_per_tensor"]; -"188 dequantize_per_tensor_27" [id=188, type="dequantize_per_tensor"]; -"189 reshape_1" [id=189, type=reshape]; -"190 permute_3" [id=190, type=permute]; -"191 select" [id=191, type=select]; -"192 select_1" [id=192, type=select]; -"193 select_2" [id=193, type=select]; -"194 linalg_vector_norm" [id=194, type="linalg_vector_norm"]; -"195 clamp_min" [id=195, type="clamp_min"]; -"196 expand_as" [id=196, type="expand_as"]; -"197 div" [id=197, type=div]; -"198 linalg_vector_norm_1" [id=198, type="linalg_vector_norm"]; -"199 clamp_min_1" [id=199, type="clamp_min"]; -"200 expand_as_1" [id=200, type="expand_as"]; -"201 div_1" [id=201, type=div]; -"202 transpose" [id=202, type=transpose]; -"203 matmul" [id=203, type=matmul]; -"204 quantize_per_tensor_28" [id=204, type="quantize_per_tensor"]; -"205 dequantize_per_tensor_29" [id=205, type="dequantize_per_tensor"]; -"206 _frozen_param6" [id=206, type="get_attr"]; -"207 
dequantize_per_tensor_30" [id=207, type="dequantize_per_tensor"]; -"208 mul_1" [id=208, type=mul]; -"209 quantize_per_tensor_31" [id=209, type="quantize_per_tensor"]; -"210 dequantize_per_tensor_32" [id=210, type="dequantize_per_tensor"]; -"211 add" [id=211, type=add]; -"212 quantize_per_tensor_33" [id=212, type="quantize_per_tensor"]; -"213 dequantize_per_tensor_34" [id=213, type="dequantize_per_tensor"]; -"214 softmax" [id=214, type=softmax]; -"215 dropout" [id=215, type=dropout]; -"216 matmul_1" [id=216, type=matmul]; -"217 transpose_1" [id=217, type=transpose]; -"218 reshape_2" [id=218, type=reshape]; -"219 reshape_2_0_0_nncf_smooth_quant_0" [id=219, type="call_module"]; -"220 quantize_per_tensor_35" [id=220, type="quantize_per_tensor"]; -"221 dequantize_per_tensor_36" [id=221, type="dequantize_per_tensor"]; -"222 _frozen_param7" [id=222, type="get_attr"]; -"223 dequantize_per_tensor_37" [id=223, type="dequantize_per_tensor"]; -"224 linear_3" [id=224, type=linear]; -"225 quantize_per_tensor_38" [id=225, type="quantize_per_tensor"]; -"226 dequantize_per_tensor_39" [id=226, type="dequantize_per_tensor"]; -"227 dropout_1" [id=227, type=dropout]; -"228 view_3" [id=228, type=view]; -"229 permute_4" [id=229, type=permute]; -"230 reshape_3" [id=230, type=reshape]; -"231 slice_2" [id=231, type=slice]; -"232 slice_3" [id=232, type=slice]; -"233 layer_norm_1" [id=233, type="layer_norm"]; -"234 quantize_per_tensor_40" [id=234, type="quantize_per_tensor"]; -"235 dequantize_per_tensor_41" [id=235, type="dequantize_per_tensor"]; -"236 quantize_per_tensor_42" [id=236, type="quantize_per_tensor"]; -"237 dequantize_per_tensor_43" [id=237, type="dequantize_per_tensor"]; -"238 add_1" [id=238, type=add]; -"239 quantize_per_tensor_44" [id=239, type="quantize_per_tensor"]; -"240 dequantize_per_tensor_45" [id=240, type="dequantize_per_tensor"]; -"241 dequantize_per_tensor_46" [id=241, type="dequantize_per_tensor"]; -"242 add_1_0_0_nncf_smooth_quant_0" [id=242, type="call_module"]; 
-"243 quantize_per_tensor_47" [id=243, type="quantize_per_tensor"]; -"244 dequantize_per_tensor_48" [id=244, type="dequantize_per_tensor"]; -"245 _frozen_param8" [id=245, type="get_attr"]; -"246 dequantize_per_tensor_49" [id=246, type="dequantize_per_tensor"]; -"247 linear_4" [id=247, type=linear]; -"248 quantize_per_tensor_50" [id=248, type="quantize_per_tensor"]; -"249 dequantize_per_tensor_51" [id=249, type="dequantize_per_tensor"]; -"250 gelu" [id=250, type=gelu]; -"251 dropout_2" [id=251, type=dropout]; -"252 dropout_2_0_0_nncf_smooth_quant_0" [id=252, type="call_module"]; -"253 quantize_per_tensor_52" [id=253, type="quantize_per_tensor"]; -"254 dequantize_per_tensor_53" [id=254, type="dequantize_per_tensor"]; -"255 _frozen_param9" [id=255, type="get_attr"]; -"256 dequantize_per_tensor_54" [id=256, type="dequantize_per_tensor"]; -"257 linear_5" [id=257, type=linear]; -"258 quantize_per_tensor_55" [id=258, type="quantize_per_tensor"]; -"259 dequantize_per_tensor_56" [id=259, type="dequantize_per_tensor"]; -"260 dropout_3" [id=260, type=dropout]; -"261 layer_norm_2" [id=261, type="layer_norm"]; -"262 quantize_per_tensor_57" [id=262, type="quantize_per_tensor"]; -"263 dequantize_per_tensor_58" [id=263, type="dequantize_per_tensor"]; -"264 add_2" [id=264, type=add]; -"265 quantize_per_tensor_59" [id=265, type="quantize_per_tensor"]; -"266 dequantize_per_tensor_60" [id=266, type="dequantize_per_tensor"]; -"267 dequantize_per_tensor_61" [id=267, type="dequantize_per_tensor"]; -"268 _frozen_param10" [id=268, type="get_attr"]; -"269 dequantize_per_tensor_62" [id=269, type="dequantize_per_tensor"]; -"270 _frozen_param11" [id=270, type="get_attr"]; -"271 dequantize_per_tensor_63" [id=271, type="dequantize_per_tensor"]; -"272 linear_6" [id=272, type=linear]; -"273 relu__1" [id=273, type="relu_"]; -"274 quantize_per_tensor_64" [id=274, type="quantize_per_tensor"]; -"275 dequantize_per_tensor_65" [id=275, type="dequantize_per_tensor"]; -"276 
relu__1_0_0_nncf_smooth_quant_0" [id=276, type="call_module"]; -"277 quantize_per_tensor_66" [id=277, type="quantize_per_tensor"]; -"278 dequantize_per_tensor_67" [id=278, type="dequantize_per_tensor"]; -"279 _frozen_param12" [id=279, type="get_attr"]; -"280 dequantize_per_tensor_68" [id=280, type="dequantize_per_tensor"]; -"281 linear_7" [id=281, type=linear]; -"282 quantize_per_tensor_69" [id=282, type="quantize_per_tensor"]; -"283 dequantize_per_tensor_70" [id=283, type="dequantize_per_tensor"]; -"284 view_4" [id=284, type=view]; -"285 quantize_per_tensor_71" [id=285, type="quantize_per_tensor"]; -"286 dequantize_per_tensor_72" [id=286, type="dequantize_per_tensor"]; -"287 index_1" [id=287, type=index]; -"288 view_5" [id=288, type=view]; -"289 permute_5" [id=289, type=permute]; -"290 contiguous_1" [id=290, type=contiguous]; -"291 unsqueeze_1" [id=291, type=unsqueeze]; -"292 sigmoid_1" [id=292, type=sigmoid]; -"293 quantize_per_tensor_73" [id=293, type="quantize_per_tensor"]; -"294 dequantize_per_tensor_74" [id=294, type="dequantize_per_tensor"]; -"295 _frozen_param13" [id=295, type="get_attr"]; -"296 dequantize_per_tensor_75" [id=296, type="dequantize_per_tensor"]; -"297 mul_2" [id=297, type=mul]; -"298 quantize_per_tensor_76" [id=298, type="quantize_per_tensor"]; -"299 dequantize_per_tensor_77" [id=299, type="dequantize_per_tensor"]; -"300 pad_1" [id=300, type=pad]; -"301 roll" [id=301, type=roll]; -"302 view_6" [id=302, type=view]; -"303 permute_6" [id=303, type=permute]; -"304 reshape_4" [id=304, type=reshape]; -"305 clone_1" [id=305, type=clone]; -"306 reshape_4_0_0_nncf_smooth_quant_0" [id=306, type="call_module"]; -"307 quantize_per_tensor_78" [id=307, type="quantize_per_tensor"]; -"308 dequantize_per_tensor_79" [id=308, type="dequantize_per_tensor"]; -"309 _frozen_param14" [id=309, type="get_attr"]; -"310 dequantize_per_tensor_80" [id=310, type="dequantize_per_tensor"]; -"311 linear_8" [id=311, type=linear]; -"312 quantize_per_tensor_81" [id=312, 
type="quantize_per_tensor"]; -"313 dequantize_per_tensor_82" [id=313, type="dequantize_per_tensor"]; -"314 reshape_5" [id=314, type=reshape]; -"315 permute_7" [id=315, type=permute]; -"316 select_3" [id=316, type=select]; -"317 select_4" [id=317, type=select]; -"318 select_5" [id=318, type=select]; -"319 linalg_vector_norm_2" [id=319, type="linalg_vector_norm"]; -"320 clamp_min_2" [id=320, type="clamp_min"]; -"321 expand_as_2" [id=321, type="expand_as"]; -"322 div_2" [id=322, type=div]; -"323 linalg_vector_norm_3" [id=323, type="linalg_vector_norm"]; -"324 clamp_min_3" [id=324, type="clamp_min"]; -"325 expand_as_3" [id=325, type="expand_as"]; -"326 div_3" [id=326, type=div]; -"327 transpose_2" [id=327, type=transpose]; -"328 matmul_2" [id=328, type=matmul]; -"329 quantize_per_tensor_83" [id=329, type="quantize_per_tensor"]; -"330 dequantize_per_tensor_84" [id=330, type="dequantize_per_tensor"]; -"331 _frozen_param15" [id=331, type="get_attr"]; -"332 dequantize_per_tensor_85" [id=332, type="dequantize_per_tensor"]; -"333 mul_3" [id=333, type=mul]; -"334 quantize_per_tensor_86" [id=334, type="quantize_per_tensor"]; -"335 dequantize_per_tensor_87" [id=335, type="dequantize_per_tensor"]; -"336 add_3" [id=336, type=add]; -"337 quantize_per_tensor_88" [id=337, type="quantize_per_tensor"]; -"338 dequantize_per_tensor_89" [id=338, type="dequantize_per_tensor"]; -"339 new_zeros" [id=339, type="new_zeros"]; -"340 view_7" [id=340, type=view]; -"341 permute_8" [id=341, type=permute]; -"342 reshape_6" [id=342, type=reshape]; -"343 unsqueeze_2" [id=343, type=unsqueeze]; -"344 unsqueeze_3" [id=344, type=unsqueeze]; -"345 sub" [id=345, type=sub]; -"346 ne" [id=346, type=ne]; -"347 masked_fill" [id=347, type="masked_fill"]; -"348 eq" [id=348, type=eq]; -"349 masked_fill_1" [id=349, type="masked_fill"]; -"350 view_8" [id=350, type=view]; -"351 quantize_per_tensor_90" [id=351, type="quantize_per_tensor"]; -"352 dequantize_per_tensor_91" [id=352, type="dequantize_per_tensor"]; -"353 
unsqueeze_4" [id=353, type=unsqueeze]; -"354 unsqueeze_5" [id=354, type=unsqueeze]; -"355 quantize_per_tensor_92" [id=355, type="quantize_per_tensor"]; -"356 dequantize_per_tensor_93" [id=356, type="dequantize_per_tensor"]; -"357 add_4" [id=357, type=add]; -"358 quantize_per_tensor_94" [id=358, type="quantize_per_tensor"]; -"359 dequantize_per_tensor_95" [id=359, type="dequantize_per_tensor"]; -"360 view_9" [id=360, type=view]; -"361 quantize_per_tensor_96" [id=361, type="quantize_per_tensor"]; -"362 dequantize_per_tensor_97" [id=362, type="dequantize_per_tensor"]; -"363 softmax_1" [id=363, type=softmax]; -"364 dropout_4" [id=364, type=dropout]; -"365 matmul_3" [id=365, type=matmul]; -"366 transpose_3" [id=366, type=transpose]; -"367 reshape_7" [id=367, type=reshape]; -"368 reshape_7_0_0_nncf_smooth_quant_0" [id=368, type="call_module"]; -"369 quantize_per_tensor_98" [id=369, type="quantize_per_tensor"]; -"370 dequantize_per_tensor_99" [id=370, type="dequantize_per_tensor"]; -"371 _frozen_param16" [id=371, type="get_attr"]; -"372 dequantize_per_tensor_100" [id=372, type="dequantize_per_tensor"]; -"373 linear_9" [id=373, type=linear]; -"374 quantize_per_tensor_101" [id=374, type="quantize_per_tensor"]; -"375 dequantize_per_tensor_102" [id=375, type="dequantize_per_tensor"]; -"376 dropout_5" [id=376, type=dropout]; -"377 view_10" [id=377, type=view]; -"378 permute_9" [id=378, type=permute]; -"379 reshape_8" [id=379, type=reshape]; -"380 roll_1" [id=380, type=roll]; -"381 slice_23" [id=381, type=slice]; -"382 slice_24" [id=382, type=slice]; -"383 layer_norm_3" [id=383, type="layer_norm"]; -"384 quantize_per_tensor_103" [id=384, type="quantize_per_tensor"]; -"385 dequantize_per_tensor_104" [id=385, type="dequantize_per_tensor"]; -"386 add_5" [id=386, type=add]; -"387 quantize_per_tensor_105" [id=387, type="quantize_per_tensor"]; -"388 dequantize_per_tensor_106" [id=388, type="dequantize_per_tensor"]; -"389 dequantize_per_tensor_107" [id=389, 
type="dequantize_per_tensor"]; -"390 add_5_0_0_nncf_smooth_quant_0" [id=390, type="call_module"]; -"391 quantize_per_tensor_108" [id=391, type="quantize_per_tensor"]; -"392 dequantize_per_tensor_109" [id=392, type="dequantize_per_tensor"]; -"393 _frozen_param17" [id=393, type="get_attr"]; -"394 dequantize_per_tensor_110" [id=394, type="dequantize_per_tensor"]; -"395 linear_10" [id=395, type=linear]; -"396 quantize_per_tensor_111" [id=396, type="quantize_per_tensor"]; -"397 dequantize_per_tensor_112" [id=397, type="dequantize_per_tensor"]; -"398 gelu_1" [id=398, type=gelu]; -"399 dropout_6" [id=399, type=dropout]; -"400 dropout_6_0_0_nncf_smooth_quant_0" [id=400, type="call_module"]; -"401 quantize_per_tensor_113" [id=401, type="quantize_per_tensor"]; -"402 dequantize_per_tensor_114" [id=402, type="dequantize_per_tensor"]; -"403 _frozen_param18" [id=403, type="get_attr"]; -"404 dequantize_per_tensor_115" [id=404, type="dequantize_per_tensor"]; -"405 linear_11" [id=405, type=linear]; -"406 quantize_per_tensor_116" [id=406, type="quantize_per_tensor"]; -"407 dequantize_per_tensor_117" [id=407, type="dequantize_per_tensor"]; -"408 dropout_7" [id=408, type=dropout]; -"409 layer_norm_4" [id=409, type="layer_norm"]; -"410 quantize_per_tensor_118" [id=410, type="quantize_per_tensor"]; -"411 dequantize_per_tensor_119" [id=411, type="dequantize_per_tensor"]; -"412 add_6" [id=412, type=add]; -"413 quantize_per_tensor_120" [id=413, type="quantize_per_tensor"]; -"414 dequantize_per_tensor_121" [id=414, type="dequantize_per_tensor"]; -"415 pad_2" [id=415, type=pad]; -"416 slice_25" [id=416, type=slice]; -"417 slice_26" [id=417, type=slice]; -"418 slice_27" [id=418, type=slice]; -"419 quantize_per_tensor_122" [id=419, type="quantize_per_tensor"]; -"420 dequantize_per_tensor_123" [id=420, type="dequantize_per_tensor"]; -"421 slice_28" [id=421, type=slice]; -"422 slice_29" [id=422, type=slice]; -"423 slice_30" [id=423, type=slice]; -"424 quantize_per_tensor_124" [id=424, 
type="quantize_per_tensor"]; -"425 dequantize_per_tensor_125" [id=425, type="dequantize_per_tensor"]; -"426 slice_31" [id=426, type=slice]; -"427 slice_32" [id=427, type=slice]; -"428 slice_33" [id=428, type=slice]; -"429 quantize_per_tensor_126" [id=429, type="quantize_per_tensor"]; -"430 dequantize_per_tensor_127" [id=430, type="dequantize_per_tensor"]; -"431 slice_34" [id=431, type=slice]; -"432 slice_35" [id=432, type=slice]; -"433 slice_36" [id=433, type=slice]; -"434 quantize_per_tensor_128" [id=434, type="quantize_per_tensor"]; -"435 dequantize_per_tensor_129" [id=435, type="dequantize_per_tensor"]; -"436 cat" [id=436, type=cat]; -"437 quantize_per_tensor_130" [id=437, type="quantize_per_tensor"]; -"438 dequantize_per_tensor_131" [id=438, type="dequantize_per_tensor"]; -"439 cat_0_0_nncf_smooth_quant_0" [id=439, type="call_module"]; -"440 quantize_per_tensor_132" [id=440, type="quantize_per_tensor"]; -"441 dequantize_per_tensor_133" [id=441, type="dequantize_per_tensor"]; -"442 _frozen_param19" [id=442, type="get_attr"]; -"443 dequantize_per_tensor_134" [id=443, type="dequantize_per_tensor"]; -"444 linear_12" [id=444, type=linear]; -"445 quantize_per_tensor_135" [id=445, type="quantize_per_tensor"]; -"446 dequantize_per_tensor_136" [id=446, type="dequantize_per_tensor"]; -"447 layer_norm_5" [id=447, type="layer_norm"]; -"448 _frozen_param20" [id=448, type="get_attr"]; -"449 dequantize_per_tensor_137" [id=449, type="dequantize_per_tensor"]; -"450 _frozen_param21" [id=450, type="get_attr"]; -"451 dequantize_per_tensor_138" [id=451, type="dequantize_per_tensor"]; -"452 linear_13" [id=452, type=linear]; -"453 relu__2" [id=453, type="relu_"]; -"454 quantize_per_tensor_139" [id=454, type="quantize_per_tensor"]; -"455 dequantize_per_tensor_140" [id=455, type="dequantize_per_tensor"]; -"456 relu__2_0_0_nncf_smooth_quant_0" [id=456, type="call_module"]; -"457 quantize_per_tensor_141" [id=457, type="quantize_per_tensor"]; -"458 dequantize_per_tensor_142" [id=458, 
type="dequantize_per_tensor"]; -"459 _frozen_param22" [id=459, type="get_attr"]; -"460 dequantize_per_tensor_143" [id=460, type="dequantize_per_tensor"]; -"461 linear_14" [id=461, type=linear]; -"462 quantize_per_tensor_144" [id=462, type="quantize_per_tensor"]; -"463 dequantize_per_tensor_145" [id=463, type="dequantize_per_tensor"]; -"464 view_11" [id=464, type=view]; -"465 quantize_per_tensor_146" [id=465, type="quantize_per_tensor"]; -"466 dequantize_per_tensor_147" [id=466, type="dequantize_per_tensor"]; -"467 index_2" [id=467, type=index]; -"468 view_12" [id=468, type=view]; -"469 permute_10" [id=469, type=permute]; -"470 contiguous_2" [id=470, type=contiguous]; -"471 unsqueeze_6" [id=471, type=unsqueeze]; -"472 sigmoid_2" [id=472, type=sigmoid]; -"473 quantize_per_tensor_148" [id=473, type="quantize_per_tensor"]; -"474 dequantize_per_tensor_149" [id=474, type="dequantize_per_tensor"]; -"475 _frozen_param23" [id=475, type="get_attr"]; -"476 dequantize_per_tensor_150" [id=476, type="dequantize_per_tensor"]; -"477 mul_4" [id=477, type=mul]; -"478 quantize_per_tensor_151" [id=478, type="quantize_per_tensor"]; -"479 dequantize_per_tensor_152" [id=479, type="dequantize_per_tensor"]; -"480 pad_3" [id=480, type=pad]; -"481 view_13" [id=481, type=view]; -"482 permute_11" [id=482, type=permute]; -"483 reshape_9" [id=483, type=reshape]; -"484 clone_2" [id=484, type=clone]; -"485 reshape_9_0_0_nncf_smooth_quant_0" [id=485, type="call_module"]; -"486 quantize_per_tensor_153" [id=486, type="quantize_per_tensor"]; -"487 dequantize_per_tensor_154" [id=487, type="dequantize_per_tensor"]; -"488 _frozen_param24" [id=488, type="get_attr"]; -"489 dequantize_per_tensor_155" [id=489, type="dequantize_per_tensor"]; -"490 linear_15" [id=490, type=linear]; -"491 quantize_per_tensor_156" [id=491, type="quantize_per_tensor"]; -"492 dequantize_per_tensor_157" [id=492, type="dequantize_per_tensor"]; -"493 reshape_10" [id=493, type=reshape]; -"494 permute_12" [id=494, type=permute]; -"495 
select_6" [id=495, type=select]; -"496 select_7" [id=496, type=select]; -"497 select_8" [id=497, type=select]; -"498 linalg_vector_norm_4" [id=498, type="linalg_vector_norm"]; -"499 clamp_min_4" [id=499, type="clamp_min"]; -"500 expand_as_4" [id=500, type="expand_as"]; -"501 div_4" [id=501, type=div]; -"502 linalg_vector_norm_5" [id=502, type="linalg_vector_norm"]; -"503 clamp_min_5" [id=503, type="clamp_min"]; -"504 expand_as_5" [id=504, type="expand_as"]; -"505 div_5" [id=505, type=div]; -"506 transpose_4" [id=506, type=transpose]; -"507 matmul_4" [id=507, type=matmul]; -"508 quantize_per_tensor_158" [id=508, type="quantize_per_tensor"]; -"509 dequantize_per_tensor_159" [id=509, type="dequantize_per_tensor"]; -"510 _frozen_param25" [id=510, type="get_attr"]; -"511 dequantize_per_tensor_160" [id=511, type="dequantize_per_tensor"]; -"512 mul_5" [id=512, type=mul]; -"513 quantize_per_tensor_161" [id=513, type="quantize_per_tensor"]; -"514 dequantize_per_tensor_162" [id=514, type="dequantize_per_tensor"]; -"515 add_7" [id=515, type=add]; -"516 quantize_per_tensor_163" [id=516, type="quantize_per_tensor"]; -"517 dequantize_per_tensor_164" [id=517, type="dequantize_per_tensor"]; -"518 softmax_2" [id=518, type=softmax]; -"519 dropout_8" [id=519, type=dropout]; -"520 matmul_5" [id=520, type=matmul]; -"521 transpose_5" [id=521, type=transpose]; -"522 reshape_11" [id=522, type=reshape]; -"523 reshape_11_0_0_nncf_smooth_quant_0" [id=523, type="call_module"]; -"524 quantize_per_tensor_165" [id=524, type="quantize_per_tensor"]; -"525 dequantize_per_tensor_166" [id=525, type="dequantize_per_tensor"]; -"526 _frozen_param26" [id=526, type="get_attr"]; -"527 dequantize_per_tensor_167" [id=527, type="dequantize_per_tensor"]; -"528 linear_16" [id=528, type=linear]; -"529 quantize_per_tensor_168" [id=529, type="quantize_per_tensor"]; -"530 dequantize_per_tensor_169" [id=530, type="dequantize_per_tensor"]; -"531 dropout_9" [id=531, type=dropout]; -"532 view_14" [id=532, type=view]; 
-"533 permute_13" [id=533, type=permute]; -"534 reshape_12" [id=534, type=reshape]; -"535 slice_38" [id=535, type=slice]; -"536 slice_39" [id=536, type=slice]; -"537 slice_40" [id=537, type=slice]; -"538 slice_41" [id=538, type=slice]; -"539 contiguous_3" [id=539, type=contiguous]; -"540 layer_norm_6" [id=540, type="layer_norm"]; -"541 quantize_per_tensor_170" [id=541, type="quantize_per_tensor"]; -"542 dequantize_per_tensor_171" [id=542, type="dequantize_per_tensor"]; -"543 quantize_per_tensor_172" [id=543, type="quantize_per_tensor"]; -"544 dequantize_per_tensor_173" [id=544, type="dequantize_per_tensor"]; -"545 add_8" [id=545, type=add]; -"546 quantize_per_tensor_174" [id=546, type="quantize_per_tensor"]; -"547 dequantize_per_tensor_175" [id=547, type="dequantize_per_tensor"]; -"548 dequantize_per_tensor_176" [id=548, type="dequantize_per_tensor"]; -"549 add_8_0_0_nncf_smooth_quant_0" [id=549, type="call_module"]; -"550 quantize_per_tensor_177" [id=550, type="quantize_per_tensor"]; -"551 dequantize_per_tensor_178" [id=551, type="dequantize_per_tensor"]; -"552 _frozen_param27" [id=552, type="get_attr"]; -"553 dequantize_per_tensor_179" [id=553, type="dequantize_per_tensor"]; -"554 linear_17" [id=554, type=linear]; -"555 quantize_per_tensor_180" [id=555, type="quantize_per_tensor"]; -"556 dequantize_per_tensor_181" [id=556, type="dequantize_per_tensor"]; -"557 gelu_2" [id=557, type=gelu]; -"558 dropout_10" [id=558, type=dropout]; -"559 dropout_10_0_0_nncf_smooth_quant_0" [id=559, type="call_module"]; -"560 quantize_per_tensor_182" [id=560, type="quantize_per_tensor"]; -"561 dequantize_per_tensor_183" [id=561, type="dequantize_per_tensor"]; -"562 _frozen_param28" [id=562, type="get_attr"]; -"563 dequantize_per_tensor_184" [id=563, type="dequantize_per_tensor"]; -"564 linear_18" [id=564, type=linear]; -"565 quantize_per_tensor_185" [id=565, type="quantize_per_tensor"]; -"566 dequantize_per_tensor_186" [id=566, type="dequantize_per_tensor"]; -"567 dropout_11" 
[id=567, type=dropout]; -"568 layer_norm_7" [id=568, type="layer_norm"]; -"569 quantize_per_tensor_187" [id=569, type="quantize_per_tensor"]; -"570 dequantize_per_tensor_188" [id=570, type="dequantize_per_tensor"]; -"571 add_9" [id=571, type=add]; -"572 quantize_per_tensor_189" [id=572, type="quantize_per_tensor"]; -"573 dequantize_per_tensor_190" [id=573, type="dequantize_per_tensor"]; -"574 dequantize_per_tensor_191" [id=574, type="dequantize_per_tensor"]; -"575 _frozen_param29" [id=575, type="get_attr"]; -"576 dequantize_per_tensor_192" [id=576, type="dequantize_per_tensor"]; -"577 _frozen_param30" [id=577, type="get_attr"]; -"578 dequantize_per_tensor_193" [id=578, type="dequantize_per_tensor"]; -"579 linear_19" [id=579, type=linear]; -"580 relu__3" [id=580, type="relu_"]; -"581 quantize_per_tensor_194" [id=581, type="quantize_per_tensor"]; -"582 dequantize_per_tensor_195" [id=582, type="dequantize_per_tensor"]; -"583 relu__3_0_0_nncf_smooth_quant_0" [id=583, type="call_module"]; -"584 quantize_per_tensor_196" [id=584, type="quantize_per_tensor"]; -"585 dequantize_per_tensor_197" [id=585, type="dequantize_per_tensor"]; -"586 _frozen_param31" [id=586, type="get_attr"]; -"587 dequantize_per_tensor_198" [id=587, type="dequantize_per_tensor"]; -"588 linear_20" [id=588, type=linear]; -"589 quantize_per_tensor_199" [id=589, type="quantize_per_tensor"]; -"590 dequantize_per_tensor_200" [id=590, type="dequantize_per_tensor"]; -"591 view_15" [id=591, type=view]; -"592 quantize_per_tensor_201" [id=592, type="quantize_per_tensor"]; -"593 dequantize_per_tensor_202" [id=593, type="dequantize_per_tensor"]; -"594 index_3" [id=594, type=index]; -"595 view_16" [id=595, type=view]; -"596 permute_14" [id=596, type=permute]; -"597 contiguous_4" [id=597, type=contiguous]; -"598 unsqueeze_7" [id=598, type=unsqueeze]; -"599 sigmoid_3" [id=599, type=sigmoid]; -"600 quantize_per_tensor_203" [id=600, type="quantize_per_tensor"]; -"601 dequantize_per_tensor_204" [id=601, 
type="dequantize_per_tensor"]; -"602 _frozen_param32" [id=602, type="get_attr"]; -"603 dequantize_per_tensor_205" [id=603, type="dequantize_per_tensor"]; -"604 mul_6" [id=604, type=mul]; -"605 quantize_per_tensor_206" [id=605, type="quantize_per_tensor"]; -"606 dequantize_per_tensor_207" [id=606, type="dequantize_per_tensor"]; -"607 pad_4" [id=607, type=pad]; -"608 roll_2" [id=608, type=roll]; -"609 view_17" [id=609, type=view]; -"610 permute_15" [id=610, type=permute]; -"611 reshape_13" [id=611, type=reshape]; -"612 clone_3" [id=612, type=clone]; -"613 reshape_13_0_0_nncf_smooth_quant_0" [id=613, type="call_module"]; -"614 quantize_per_tensor_208" [id=614, type="quantize_per_tensor"]; -"615 dequantize_per_tensor_209" [id=615, type="dequantize_per_tensor"]; -"616 _frozen_param33" [id=616, type="get_attr"]; -"617 dequantize_per_tensor_210" [id=617, type="dequantize_per_tensor"]; -"618 linear_21" [id=618, type=linear]; -"619 quantize_per_tensor_211" [id=619, type="quantize_per_tensor"]; -"620 dequantize_per_tensor_212" [id=620, type="dequantize_per_tensor"]; -"621 reshape_14" [id=621, type=reshape]; -"622 permute_16" [id=622, type=permute]; -"623 select_9" [id=623, type=select]; -"624 select_10" [id=624, type=select]; -"625 select_11" [id=625, type=select]; -"626 linalg_vector_norm_6" [id=626, type="linalg_vector_norm"]; -"627 clamp_min_6" [id=627, type="clamp_min"]; -"628 expand_as_6" [id=628, type="expand_as"]; -"629 div_6" [id=629, type=div]; -"630 linalg_vector_norm_7" [id=630, type="linalg_vector_norm"]; -"631 clamp_min_7" [id=631, type="clamp_min"]; -"632 expand_as_7" [id=632, type="expand_as"]; -"633 div_7" [id=633, type=div]; -"634 transpose_6" [id=634, type=transpose]; -"635 matmul_6" [id=635, type=matmul]; -"636 quantize_per_tensor_213" [id=636, type="quantize_per_tensor"]; -"637 dequantize_per_tensor_214" [id=637, type="dequantize_per_tensor"]; -"638 _frozen_param34" [id=638, type="get_attr"]; -"639 dequantize_per_tensor_215" [id=639, 
type="dequantize_per_tensor"]; -"640 mul_7" [id=640, type=mul]; -"641 quantize_per_tensor_216" [id=641, type="quantize_per_tensor"]; -"642 dequantize_per_tensor_217" [id=642, type="dequantize_per_tensor"]; -"643 add_10" [id=643, type=add]; -"644 quantize_per_tensor_218" [id=644, type="quantize_per_tensor"]; -"645 dequantize_per_tensor_219" [id=645, type="dequantize_per_tensor"]; -"646 new_zeros_1" [id=646, type="new_zeros"]; -"647 view_18" [id=647, type=view]; -"648 permute_17" [id=648, type=permute]; -"649 reshape_15" [id=649, type=reshape]; -"650 unsqueeze_8" [id=650, type=unsqueeze]; -"651 unsqueeze_9" [id=651, type=unsqueeze]; -"652 sub_1" [id=652, type=sub]; -"653 ne_1" [id=653, type=ne]; -"654 masked_fill_2" [id=654, type="masked_fill"]; -"655 eq_1" [id=655, type=eq]; -"656 masked_fill_3" [id=656, type="masked_fill"]; -"657 view_19" [id=657, type=view]; -"658 quantize_per_tensor_220" [id=658, type="quantize_per_tensor"]; -"659 dequantize_per_tensor_221" [id=659, type="dequantize_per_tensor"]; -"660 unsqueeze_10" [id=660, type=unsqueeze]; -"661 unsqueeze_11" [id=661, type=unsqueeze]; -"662 quantize_per_tensor_222" [id=662, type="quantize_per_tensor"]; -"663 dequantize_per_tensor_223" [id=663, type="dequantize_per_tensor"]; -"664 add_11" [id=664, type=add]; -"665 quantize_per_tensor_224" [id=665, type="quantize_per_tensor"]; -"666 dequantize_per_tensor_225" [id=666, type="dequantize_per_tensor"]; -"667 view_20" [id=667, type=view]; -"668 quantize_per_tensor_226" [id=668, type="quantize_per_tensor"]; -"669 dequantize_per_tensor_227" [id=669, type="dequantize_per_tensor"]; -"670 softmax_3" [id=670, type=softmax]; -"671 dropout_12" [id=671, type=dropout]; -"672 matmul_7" [id=672, type=matmul]; -"673 transpose_7" [id=673, type=transpose]; -"674 reshape_16" [id=674, type=reshape]; -"675 reshape_16_0_0_nncf_smooth_quant_0" [id=675, type="call_module"]; -"676 quantize_per_tensor_228" [id=676, type="quantize_per_tensor"]; -"677 dequantize_per_tensor_229" [id=677, 
type="dequantize_per_tensor"]; -"678 _frozen_param35" [id=678, type="get_attr"]; -"679 dequantize_per_tensor_230" [id=679, type="dequantize_per_tensor"]; -"680 linear_22" [id=680, type=linear]; -"681 quantize_per_tensor_231" [id=681, type="quantize_per_tensor"]; -"682 dequantize_per_tensor_232" [id=682, type="dequantize_per_tensor"]; -"683 dropout_13" [id=683, type=dropout]; -"684 view_21" [id=684, type=view]; -"685 permute_18" [id=685, type=permute]; -"686 reshape_17" [id=686, type=reshape]; -"687 roll_3" [id=687, type=roll]; -"688 slice_61" [id=688, type=slice]; -"689 slice_62" [id=689, type=slice]; -"690 slice_63" [id=690, type=slice]; -"691 slice_64" [id=691, type=slice]; -"692 contiguous_5" [id=692, type=contiguous]; -"693 layer_norm_8" [id=693, type="layer_norm"]; -"694 quantize_per_tensor_233" [id=694, type="quantize_per_tensor"]; -"695 dequantize_per_tensor_234" [id=695, type="dequantize_per_tensor"]; -"696 add_12" [id=696, type=add]; -"697 quantize_per_tensor_235" [id=697, type="quantize_per_tensor"]; -"698 dequantize_per_tensor_236" [id=698, type="dequantize_per_tensor"]; -"699 dequantize_per_tensor_237" [id=699, type="dequantize_per_tensor"]; -"700 add_12_0_0_nncf_smooth_quant_0" [id=700, type="call_module"]; -"701 quantize_per_tensor_238" [id=701, type="quantize_per_tensor"]; -"702 dequantize_per_tensor_239" [id=702, type="dequantize_per_tensor"]; -"703 _frozen_param36" [id=703, type="get_attr"]; -"704 dequantize_per_tensor_240" [id=704, type="dequantize_per_tensor"]; -"705 linear_23" [id=705, type=linear]; -"706 quantize_per_tensor_241" [id=706, type="quantize_per_tensor"]; -"707 dequantize_per_tensor_242" [id=707, type="dequantize_per_tensor"]; -"708 gelu_3" [id=708, type=gelu]; -"709 dropout_14" [id=709, type=dropout]; -"710 dropout_14_0_0_nncf_smooth_quant_0" [id=710, type="call_module"]; -"711 quantize_per_tensor_243" [id=711, type="quantize_per_tensor"]; -"712 dequantize_per_tensor_244" [id=712, type="dequantize_per_tensor"]; -"713 
_frozen_param37" [id=713, type="get_attr"]; -"714 dequantize_per_tensor_245" [id=714, type="dequantize_per_tensor"]; -"715 linear_24" [id=715, type=linear]; -"716 quantize_per_tensor_246" [id=716, type="quantize_per_tensor"]; -"717 dequantize_per_tensor_247" [id=717, type="dequantize_per_tensor"]; -"718 dropout_15" [id=718, type=dropout]; -"719 layer_norm_9" [id=719, type="layer_norm"]; -"720 quantize_per_tensor_248" [id=720, type="quantize_per_tensor"]; -"721 dequantize_per_tensor_249" [id=721, type="dequantize_per_tensor"]; -"722 add_13" [id=722, type=add]; -"723 quantize_per_tensor_250" [id=723, type="quantize_per_tensor"]; -"724 dequantize_per_tensor_251" [id=724, type="dequantize_per_tensor"]; -"725 pad_5" [id=725, type=pad]; -"726 slice_65" [id=726, type=slice]; -"727 slice_66" [id=727, type=slice]; -"728 slice_67" [id=728, type=slice]; -"729 quantize_per_tensor_252" [id=729, type="quantize_per_tensor"]; -"730 dequantize_per_tensor_253" [id=730, type="dequantize_per_tensor"]; -"731 slice_68" [id=731, type=slice]; -"732 slice_69" [id=732, type=slice]; -"733 slice_70" [id=733, type=slice]; -"734 quantize_per_tensor_254" [id=734, type="quantize_per_tensor"]; -"735 dequantize_per_tensor_255" [id=735, type="dequantize_per_tensor"]; -"736 slice_71" [id=736, type=slice]; -"737 slice_72" [id=737, type=slice]; -"738 slice_73" [id=738, type=slice]; -"739 quantize_per_tensor_256" [id=739, type="quantize_per_tensor"]; -"740 dequantize_per_tensor_257" [id=740, type="dequantize_per_tensor"]; -"741 slice_74" [id=741, type=slice]; -"742 slice_75" [id=742, type=slice]; -"743 slice_76" [id=743, type=slice]; -"744 quantize_per_tensor_258" [id=744, type="quantize_per_tensor"]; -"745 dequantize_per_tensor_259" [id=745, type="dequantize_per_tensor"]; -"746 cat_1" [id=746, type=cat]; -"747 quantize_per_tensor_260" [id=747, type="quantize_per_tensor"]; -"748 dequantize_per_tensor_261" [id=748, type="dequantize_per_tensor"]; -"749 cat_1_0_0_nncf_smooth_quant_0" [id=749, 
type="call_module"]; -"750 quantize_per_tensor_262" [id=750, type="quantize_per_tensor"]; -"751 dequantize_per_tensor_263" [id=751, type="dequantize_per_tensor"]; -"752 _frozen_param38" [id=752, type="get_attr"]; -"753 dequantize_per_tensor_264" [id=753, type="dequantize_per_tensor"]; -"754 linear_25" [id=754, type=linear]; -"755 quantize_per_tensor_265" [id=755, type="quantize_per_tensor"]; -"756 dequantize_per_tensor_266" [id=756, type="dequantize_per_tensor"]; -"757 layer_norm_10" [id=757, type="layer_norm"]; -"758 _frozen_param39" [id=758, type="get_attr"]; -"759 dequantize_per_tensor_267" [id=759, type="dequantize_per_tensor"]; -"760 _frozen_param40" [id=760, type="get_attr"]; -"761 dequantize_per_tensor_268" [id=761, type="dequantize_per_tensor"]; -"762 linear_26" [id=762, type=linear]; -"763 relu__4" [id=763, type="relu_"]; -"764 quantize_per_tensor_269" [id=764, type="quantize_per_tensor"]; -"765 dequantize_per_tensor_270" [id=765, type="dequantize_per_tensor"]; -"766 relu__4_0_0_nncf_smooth_quant_0" [id=766, type="call_module"]; -"767 quantize_per_tensor_271" [id=767, type="quantize_per_tensor"]; -"768 dequantize_per_tensor_272" [id=768, type="dequantize_per_tensor"]; -"769 _frozen_param41" [id=769, type="get_attr"]; -"770 dequantize_per_tensor_273" [id=770, type="dequantize_per_tensor"]; -"771 linear_27" [id=771, type=linear]; -"772 quantize_per_tensor_274" [id=772, type="quantize_per_tensor"]; -"773 dequantize_per_tensor_275" [id=773, type="dequantize_per_tensor"]; -"774 view_22" [id=774, type=view]; -"775 quantize_per_tensor_276" [id=775, type="quantize_per_tensor"]; -"776 dequantize_per_tensor_277" [id=776, type="dequantize_per_tensor"]; -"777 index_4" [id=777, type=index]; -"778 view_23" [id=778, type=view]; -"779 permute_19" [id=779, type=permute]; -"780 contiguous_6" [id=780, type=contiguous]; -"781 unsqueeze_12" [id=781, type=unsqueeze]; -"782 sigmoid_4" [id=782, type=sigmoid]; -"783 quantize_per_tensor_278" [id=783, type="quantize_per_tensor"]; 
-"784 dequantize_per_tensor_279" [id=784, type="dequantize_per_tensor"]; -"785 _frozen_param42" [id=785, type="get_attr"]; -"786 dequantize_per_tensor_280" [id=786, type="dequantize_per_tensor"]; -"787 mul_8" [id=787, type=mul]; -"788 quantize_per_tensor_281" [id=788, type="quantize_per_tensor"]; -"789 dequantize_per_tensor_282" [id=789, type="dequantize_per_tensor"]; -"790 pad_6" [id=790, type=pad]; -"791 view_24" [id=791, type=view]; -"792 permute_20" [id=792, type=permute]; -"793 reshape_18" [id=793, type=reshape]; -"794 clone_4" [id=794, type=clone]; -"795 reshape_18_0_0_nncf_smooth_quant_0" [id=795, type="call_module"]; -"796 quantize_per_tensor_283" [id=796, type="quantize_per_tensor"]; -"797 dequantize_per_tensor_284" [id=797, type="dequantize_per_tensor"]; -"798 _frozen_param43" [id=798, type="get_attr"]; -"799 dequantize_per_tensor_285" [id=799, type="dequantize_per_tensor"]; -"800 linear_28" [id=800, type=linear]; -"801 quantize_per_tensor_286" [id=801, type="quantize_per_tensor"]; -"802 dequantize_per_tensor_287" [id=802, type="dequantize_per_tensor"]; -"803 reshape_19" [id=803, type=reshape]; -"804 permute_21" [id=804, type=permute]; -"805 select_12" [id=805, type=select]; -"806 select_13" [id=806, type=select]; -"807 select_14" [id=807, type=select]; -"808 linalg_vector_norm_8" [id=808, type="linalg_vector_norm"]; -"809 clamp_min_8" [id=809, type="clamp_min"]; -"810 expand_as_8" [id=810, type="expand_as"]; -"811 div_8" [id=811, type=div]; -"812 linalg_vector_norm_9" [id=812, type="linalg_vector_norm"]; -"813 clamp_min_9" [id=813, type="clamp_min"]; -"814 expand_as_9" [id=814, type="expand_as"]; -"815 div_9" [id=815, type=div]; -"816 transpose_8" [id=816, type=transpose]; -"817 matmul_8" [id=817, type=matmul]; -"818 quantize_per_tensor_288" [id=818, type="quantize_per_tensor"]; -"819 dequantize_per_tensor_289" [id=819, type="dequantize_per_tensor"]; -"820 _frozen_param44" [id=820, type="get_attr"]; -"821 dequantize_per_tensor_290" [id=821, 
type="dequantize_per_tensor"]; -"822 mul_9" [id=822, type=mul]; -"823 quantize_per_tensor_291" [id=823, type="quantize_per_tensor"]; -"824 dequantize_per_tensor_292" [id=824, type="dequantize_per_tensor"]; -"825 add_14" [id=825, type=add]; -"826 quantize_per_tensor_293" [id=826, type="quantize_per_tensor"]; -"827 dequantize_per_tensor_294" [id=827, type="dequantize_per_tensor"]; -"828 softmax_4" [id=828, type=softmax]; -"829 dropout_16" [id=829, type=dropout]; -"830 matmul_9" [id=830, type=matmul]; -"831 transpose_9" [id=831, type=transpose]; -"832 reshape_20" [id=832, type=reshape]; -"833 reshape_20_0_0_nncf_smooth_quant_0" [id=833, type="call_module"]; -"834 quantize_per_tensor_295" [id=834, type="quantize_per_tensor"]; -"835 dequantize_per_tensor_296" [id=835, type="dequantize_per_tensor"]; -"836 _frozen_param45" [id=836, type="get_attr"]; -"837 dequantize_per_tensor_297" [id=837, type="dequantize_per_tensor"]; -"838 linear_29" [id=838, type=linear]; -"839 quantize_per_tensor_298" [id=839, type="quantize_per_tensor"]; -"840 dequantize_per_tensor_299" [id=840, type="dequantize_per_tensor"]; -"841 dropout_17" [id=841, type=dropout]; -"842 view_25" [id=842, type=view]; -"843 permute_22" [id=843, type=permute]; -"844 reshape_21" [id=844, type=reshape]; -"845 slice_78" [id=845, type=slice]; -"846 slice_79" [id=846, type=slice]; -"847 slice_80" [id=847, type=slice]; -"848 slice_81" [id=848, type=slice]; -"849 contiguous_7" [id=849, type=contiguous]; -"850 layer_norm_11" [id=850, type="layer_norm"]; -"851 quantize_per_tensor_300" [id=851, type="quantize_per_tensor"]; -"852 dequantize_per_tensor_301" [id=852, type="dequantize_per_tensor"]; -"853 quantize_per_tensor_302" [id=853, type="quantize_per_tensor"]; -"854 dequantize_per_tensor_303" [id=854, type="dequantize_per_tensor"]; -"855 add_15" [id=855, type=add]; -"856 quantize_per_tensor_304" [id=856, type="quantize_per_tensor"]; -"857 dequantize_per_tensor_305" [id=857, type="dequantize_per_tensor"]; -"858 
dequantize_per_tensor_306" [id=858, type="dequantize_per_tensor"]; -"859 add_15_0_0_nncf_smooth_quant_0" [id=859, type="call_module"]; -"860 quantize_per_tensor_307" [id=860, type="quantize_per_tensor"]; -"861 dequantize_per_tensor_308" [id=861, type="dequantize_per_tensor"]; -"862 _frozen_param46" [id=862, type="get_attr"]; -"863 dequantize_per_tensor_309" [id=863, type="dequantize_per_tensor"]; -"864 linear_30" [id=864, type=linear]; -"865 quantize_per_tensor_310" [id=865, type="quantize_per_tensor"]; -"866 dequantize_per_tensor_311" [id=866, type="dequantize_per_tensor"]; -"867 gelu_4" [id=867, type=gelu]; -"868 dropout_18" [id=868, type=dropout]; -"869 dropout_18_0_0_nncf_smooth_quant_0" [id=869, type="call_module"]; -"870 quantize_per_tensor_312" [id=870, type="quantize_per_tensor"]; -"871 dequantize_per_tensor_313" [id=871, type="dequantize_per_tensor"]; -"872 _frozen_param47" [id=872, type="get_attr"]; -"873 dequantize_per_tensor_314" [id=873, type="dequantize_per_tensor"]; -"874 linear_31" [id=874, type=linear]; -"875 quantize_per_tensor_315" [id=875, type="quantize_per_tensor"]; -"876 dequantize_per_tensor_316" [id=876, type="dequantize_per_tensor"]; -"877 dropout_19" [id=877, type=dropout]; -"878 layer_norm_12" [id=878, type="layer_norm"]; -"879 quantize_per_tensor_317" [id=879, type="quantize_per_tensor"]; -"880 dequantize_per_tensor_318" [id=880, type="dequantize_per_tensor"]; -"881 add_16" [id=881, type=add]; -"882 quantize_per_tensor_319" [id=882, type="quantize_per_tensor"]; -"883 dequantize_per_tensor_320" [id=883, type="dequantize_per_tensor"]; -"884 dequantize_per_tensor_321" [id=884, type="dequantize_per_tensor"]; -"885 _frozen_param48" [id=885, type="get_attr"]; -"886 dequantize_per_tensor_322" [id=886, type="dequantize_per_tensor"]; -"887 _frozen_param49" [id=887, type="get_attr"]; -"888 dequantize_per_tensor_323" [id=888, type="dequantize_per_tensor"]; -"889 linear_32" [id=889, type=linear]; -"890 relu__5" [id=890, type="relu_"]; -"891 
quantize_per_tensor_324" [id=891, type="quantize_per_tensor"]; -"892 dequantize_per_tensor_325" [id=892, type="dequantize_per_tensor"]; -"893 relu__5_0_0_nncf_smooth_quant_0" [id=893, type="call_module"]; -"894 quantize_per_tensor_326" [id=894, type="quantize_per_tensor"]; -"895 dequantize_per_tensor_327" [id=895, type="dequantize_per_tensor"]; -"896 _frozen_param50" [id=896, type="get_attr"]; -"897 dequantize_per_tensor_328" [id=897, type="dequantize_per_tensor"]; -"898 linear_33" [id=898, type=linear]; -"899 quantize_per_tensor_329" [id=899, type="quantize_per_tensor"]; -"900 dequantize_per_tensor_330" [id=900, type="dequantize_per_tensor"]; -"901 view_26" [id=901, type=view]; -"902 quantize_per_tensor_331" [id=902, type="quantize_per_tensor"]; -"903 dequantize_per_tensor_332" [id=903, type="dequantize_per_tensor"]; -"904 index_5" [id=904, type=index]; -"905 view_27" [id=905, type=view]; -"906 permute_23" [id=906, type=permute]; -"907 contiguous_8" [id=907, type=contiguous]; -"908 unsqueeze_13" [id=908, type=unsqueeze]; -"909 sigmoid_5" [id=909, type=sigmoid]; -"910 quantize_per_tensor_333" [id=910, type="quantize_per_tensor"]; -"911 dequantize_per_tensor_334" [id=911, type="dequantize_per_tensor"]; -"912 _frozen_param51" [id=912, type="get_attr"]; -"913 dequantize_per_tensor_335" [id=913, type="dequantize_per_tensor"]; -"914 mul_10" [id=914, type=mul]; -"915 quantize_per_tensor_336" [id=915, type="quantize_per_tensor"]; -"916 dequantize_per_tensor_337" [id=916, type="dequantize_per_tensor"]; -"917 pad_7" [id=917, type=pad]; -"918 roll_4" [id=918, type=roll]; -"919 view_28" [id=919, type=view]; -"920 permute_24" [id=920, type=permute]; -"921 reshape_22" [id=921, type=reshape]; -"922 clone_5" [id=922, type=clone]; -"923 reshape_22_0_0_nncf_smooth_quant_0" [id=923, type="call_module"]; -"924 quantize_per_tensor_338" [id=924, type="quantize_per_tensor"]; -"925 dequantize_per_tensor_339" [id=925, type="dequantize_per_tensor"]; -"926 _frozen_param52" [id=926, 
type="get_attr"]; -"927 dequantize_per_tensor_340" [id=927, type="dequantize_per_tensor"]; -"928 linear_34" [id=928, type=linear]; -"929 quantize_per_tensor_341" [id=929, type="quantize_per_tensor"]; -"930 dequantize_per_tensor_342" [id=930, type="dequantize_per_tensor"]; -"931 reshape_23" [id=931, type=reshape]; -"932 permute_25" [id=932, type=permute]; -"933 select_15" [id=933, type=select]; -"934 select_16" [id=934, type=select]; -"935 select_17" [id=935, type=select]; -"936 linalg_vector_norm_10" [id=936, type="linalg_vector_norm"]; -"937 clamp_min_10" [id=937, type="clamp_min"]; -"938 expand_as_10" [id=938, type="expand_as"]; -"939 div_10" [id=939, type=div]; -"940 linalg_vector_norm_11" [id=940, type="linalg_vector_norm"]; -"941 clamp_min_11" [id=941, type="clamp_min"]; -"942 expand_as_11" [id=942, type="expand_as"]; -"943 div_11" [id=943, type=div]; -"944 transpose_10" [id=944, type=transpose]; -"945 matmul_10" [id=945, type=matmul]; -"946 quantize_per_tensor_343" [id=946, type="quantize_per_tensor"]; -"947 dequantize_per_tensor_344" [id=947, type="dequantize_per_tensor"]; -"948 _frozen_param53" [id=948, type="get_attr"]; -"949 dequantize_per_tensor_345" [id=949, type="dequantize_per_tensor"]; -"950 mul_11" [id=950, type=mul]; -"951 quantize_per_tensor_346" [id=951, type="quantize_per_tensor"]; -"952 dequantize_per_tensor_347" [id=952, type="dequantize_per_tensor"]; -"953 add_17" [id=953, type=add]; -"954 quantize_per_tensor_348" [id=954, type="quantize_per_tensor"]; -"955 dequantize_per_tensor_349" [id=955, type="dequantize_per_tensor"]; -"956 new_zeros_2" [id=956, type="new_zeros"]; -"957 view_29" [id=957, type=view]; -"958 permute_26" [id=958, type=permute]; -"959 reshape_24" [id=959, type=reshape]; -"960 unsqueeze_14" [id=960, type=unsqueeze]; -"961 unsqueeze_15" [id=961, type=unsqueeze]; -"962 sub_2" [id=962, type=sub]; -"963 ne_2" [id=963, type=ne]; -"964 masked_fill_4" [id=964, type="masked_fill"]; -"965 eq_2" [id=965, type=eq]; -"966 masked_fill_5" 
[id=966, type="masked_fill"]; -"967 view_30" [id=967, type=view]; -"968 quantize_per_tensor_350" [id=968, type="quantize_per_tensor"]; -"969 dequantize_per_tensor_351" [id=969, type="dequantize_per_tensor"]; -"970 unsqueeze_16" [id=970, type=unsqueeze]; -"971 unsqueeze_17" [id=971, type=unsqueeze]; -"972 quantize_per_tensor_352" [id=972, type="quantize_per_tensor"]; -"973 dequantize_per_tensor_353" [id=973, type="dequantize_per_tensor"]; -"974 add_18" [id=974, type=add]; -"975 quantize_per_tensor_354" [id=975, type="quantize_per_tensor"]; -"976 dequantize_per_tensor_355" [id=976, type="dequantize_per_tensor"]; -"977 view_31" [id=977, type=view]; -"978 quantize_per_tensor_356" [id=978, type="quantize_per_tensor"]; -"979 dequantize_per_tensor_357" [id=979, type="dequantize_per_tensor"]; -"980 softmax_5" [id=980, type=softmax]; -"981 dropout_20" [id=981, type=dropout]; -"982 matmul_11" [id=982, type=matmul]; -"983 transpose_11" [id=983, type=transpose]; -"984 reshape_25" [id=984, type=reshape]; -"985 reshape_25_0_0_nncf_smooth_quant_0" [id=985, type="call_module"]; -"986 quantize_per_tensor_358" [id=986, type="quantize_per_tensor"]; -"987 dequantize_per_tensor_359" [id=987, type="dequantize_per_tensor"]; -"988 _frozen_param54" [id=988, type="get_attr"]; -"989 dequantize_per_tensor_360" [id=989, type="dequantize_per_tensor"]; -"990 linear_35" [id=990, type=linear]; -"991 quantize_per_tensor_361" [id=991, type="quantize_per_tensor"]; -"992 dequantize_per_tensor_362" [id=992, type="dequantize_per_tensor"]; -"993 dropout_21" [id=993, type=dropout]; -"994 view_32" [id=994, type=view]; -"995 permute_27" [id=995, type=permute]; -"996 reshape_26" [id=996, type=reshape]; -"997 roll_5" [id=997, type=roll]; -"998 slice_101" [id=998, type=slice]; -"999 slice_102" [id=999, type=slice]; -"1000 slice_103" [id=1000, type=slice]; -"1001 slice_104" [id=1001, type=slice]; -"1002 contiguous_9" [id=1002, type=contiguous]; -"1003 layer_norm_13" [id=1003, type="layer_norm"]; -"1004 
quantize_per_tensor_363" [id=1004, type="quantize_per_tensor"]; -"1005 dequantize_per_tensor_364" [id=1005, type="dequantize_per_tensor"]; -"1006 add_19" [id=1006, type=add]; -"1007 quantize_per_tensor_365" [id=1007, type="quantize_per_tensor"]; -"1008 dequantize_per_tensor_366" [id=1008, type="dequantize_per_tensor"]; -"1009 dequantize_per_tensor_367" [id=1009, type="dequantize_per_tensor"]; -"1010 add_19_0_0_nncf_smooth_quant_0" [id=1010, type="call_module"]; -"1011 quantize_per_tensor_368" [id=1011, type="quantize_per_tensor"]; -"1012 dequantize_per_tensor_369" [id=1012, type="dequantize_per_tensor"]; -"1013 _frozen_param55" [id=1013, type="get_attr"]; -"1014 dequantize_per_tensor_370" [id=1014, type="dequantize_per_tensor"]; -"1015 linear_36" [id=1015, type=linear]; -"1016 quantize_per_tensor_371" [id=1016, type="quantize_per_tensor"]; -"1017 dequantize_per_tensor_372" [id=1017, type="dequantize_per_tensor"]; -"1018 gelu_5" [id=1018, type=gelu]; -"1019 dropout_22" [id=1019, type=dropout]; -"1020 dropout_22_0_0_nncf_smooth_quant_0" [id=1020, type="call_module"]; -"1021 quantize_per_tensor_373" [id=1021, type="quantize_per_tensor"]; -"1022 dequantize_per_tensor_374" [id=1022, type="dequantize_per_tensor"]; -"1023 _frozen_param56" [id=1023, type="get_attr"]; -"1024 dequantize_per_tensor_375" [id=1024, type="dequantize_per_tensor"]; -"1025 linear_37" [id=1025, type=linear]; -"1026 quantize_per_tensor_376" [id=1026, type="quantize_per_tensor"]; -"1027 dequantize_per_tensor_377" [id=1027, type="dequantize_per_tensor"]; -"1028 dropout_23" [id=1028, type=dropout]; -"1029 layer_norm_14" [id=1029, type="layer_norm"]; -"1030 quantize_per_tensor_378" [id=1030, type="quantize_per_tensor"]; -"1031 dequantize_per_tensor_379" [id=1031, type="dequantize_per_tensor"]; -"1032 add_20" [id=1032, type=add]; -"1033 quantize_per_tensor_380" [id=1033, type="quantize_per_tensor"]; -"1034 dequantize_per_tensor_381" [id=1034, type="dequantize_per_tensor"]; -"1035 
dequantize_per_tensor_382" [id=1035, type="dequantize_per_tensor"]; -"1036 _frozen_param57" [id=1036, type="get_attr"]; -"1037 dequantize_per_tensor_383" [id=1037, type="dequantize_per_tensor"]; -"1038 _frozen_param58" [id=1038, type="get_attr"]; -"1039 dequantize_per_tensor_384" [id=1039, type="dequantize_per_tensor"]; -"1040 linear_38" [id=1040, type=linear]; -"1041 relu__6" [id=1041, type="relu_"]; -"1042 quantize_per_tensor_385" [id=1042, type="quantize_per_tensor"]; -"1043 dequantize_per_tensor_386" [id=1043, type="dequantize_per_tensor"]; -"1044 relu__6_0_0_nncf_smooth_quant_0" [id=1044, type="call_module"]; -"1045 quantize_per_tensor_387" [id=1045, type="quantize_per_tensor"]; -"1046 dequantize_per_tensor_388" [id=1046, type="dequantize_per_tensor"]; -"1047 _frozen_param59" [id=1047, type="get_attr"]; -"1048 dequantize_per_tensor_389" [id=1048, type="dequantize_per_tensor"]; -"1049 linear_39" [id=1049, type=linear]; -"1050 quantize_per_tensor_390" [id=1050, type="quantize_per_tensor"]; -"1051 dequantize_per_tensor_391" [id=1051, type="dequantize_per_tensor"]; -"1052 view_33" [id=1052, type=view]; -"1053 quantize_per_tensor_392" [id=1053, type="quantize_per_tensor"]; -"1054 dequantize_per_tensor_393" [id=1054, type="dequantize_per_tensor"]; -"1055 index_6" [id=1055, type=index]; -"1056 view_34" [id=1056, type=view]; -"1057 permute_28" [id=1057, type=permute]; -"1058 contiguous_10" [id=1058, type=contiguous]; -"1059 unsqueeze_18" [id=1059, type=unsqueeze]; -"1060 sigmoid_6" [id=1060, type=sigmoid]; -"1061 quantize_per_tensor_394" [id=1061, type="quantize_per_tensor"]; -"1062 dequantize_per_tensor_395" [id=1062, type="dequantize_per_tensor"]; -"1063 _frozen_param60" [id=1063, type="get_attr"]; -"1064 dequantize_per_tensor_396" [id=1064, type="dequantize_per_tensor"]; -"1065 mul_12" [id=1065, type=mul]; -"1066 quantize_per_tensor_397" [id=1066, type="quantize_per_tensor"]; -"1067 dequantize_per_tensor_398" [id=1067, type="dequantize_per_tensor"]; -"1068 pad_8" 
[id=1068, type=pad]; -"1069 view_35" [id=1069, type=view]; -"1070 permute_29" [id=1070, type=permute]; -"1071 reshape_27" [id=1071, type=reshape]; -"1072 clone_6" [id=1072, type=clone]; -"1073 reshape_27_0_0_nncf_smooth_quant_0" [id=1073, type="call_module"]; -"1074 quantize_per_tensor_399" [id=1074, type="quantize_per_tensor"]; -"1075 dequantize_per_tensor_400" [id=1075, type="dequantize_per_tensor"]; -"1076 _frozen_param61" [id=1076, type="get_attr"]; -"1077 dequantize_per_tensor_401" [id=1077, type="dequantize_per_tensor"]; -"1078 linear_40" [id=1078, type=linear]; -"1079 quantize_per_tensor_402" [id=1079, type="quantize_per_tensor"]; -"1080 dequantize_per_tensor_403" [id=1080, type="dequantize_per_tensor"]; -"1081 reshape_28" [id=1081, type=reshape]; -"1082 permute_30" [id=1082, type=permute]; -"1083 select_18" [id=1083, type=select]; -"1084 select_19" [id=1084, type=select]; -"1085 select_20" [id=1085, type=select]; -"1086 linalg_vector_norm_12" [id=1086, type="linalg_vector_norm"]; -"1087 clamp_min_12" [id=1087, type="clamp_min"]; -"1088 expand_as_12" [id=1088, type="expand_as"]; -"1089 div_12" [id=1089, type=div]; -"1090 linalg_vector_norm_13" [id=1090, type="linalg_vector_norm"]; -"1091 clamp_min_13" [id=1091, type="clamp_min"]; -"1092 expand_as_13" [id=1092, type="expand_as"]; -"1093 div_13" [id=1093, type=div]; -"1094 transpose_12" [id=1094, type=transpose]; -"1095 matmul_12" [id=1095, type=matmul]; -"1096 quantize_per_tensor_404" [id=1096, type="quantize_per_tensor"]; -"1097 dequantize_per_tensor_405" [id=1097, type="dequantize_per_tensor"]; -"1098 _frozen_param62" [id=1098, type="get_attr"]; -"1099 dequantize_per_tensor_406" [id=1099, type="dequantize_per_tensor"]; -"1100 mul_13" [id=1100, type=mul]; -"1101 quantize_per_tensor_407" [id=1101, type="quantize_per_tensor"]; -"1102 dequantize_per_tensor_408" [id=1102, type="dequantize_per_tensor"]; -"1103 add_21" [id=1103, type=add]; -"1104 quantize_per_tensor_409" [id=1104, type="quantize_per_tensor"]; 
-"1105 dequantize_per_tensor_410" [id=1105, type="dequantize_per_tensor"]; -"1106 softmax_6" [id=1106, type=softmax]; -"1107 dropout_24" [id=1107, type=dropout]; -"1108 matmul_13" [id=1108, type=matmul]; -"1109 transpose_13" [id=1109, type=transpose]; -"1110 reshape_29" [id=1110, type=reshape]; -"1111 reshape_29_0_0_nncf_smooth_quant_0" [id=1111, type="call_module"]; -"1112 quantize_per_tensor_411" [id=1112, type="quantize_per_tensor"]; -"1113 dequantize_per_tensor_412" [id=1113, type="dequantize_per_tensor"]; -"1114 _frozen_param63" [id=1114, type="get_attr"]; -"1115 dequantize_per_tensor_413" [id=1115, type="dequantize_per_tensor"]; -"1116 linear_41" [id=1116, type=linear]; -"1117 quantize_per_tensor_414" [id=1117, type="quantize_per_tensor"]; -"1118 dequantize_per_tensor_415" [id=1118, type="dequantize_per_tensor"]; -"1119 dropout_25" [id=1119, type=dropout]; -"1120 view_36" [id=1120, type=view]; -"1121 permute_31" [id=1121, type=permute]; -"1122 reshape_30" [id=1122, type=reshape]; -"1123 slice_106" [id=1123, type=slice]; -"1124 slice_107" [id=1124, type=slice]; -"1125 slice_108" [id=1125, type=slice]; -"1126 slice_109" [id=1126, type=slice]; -"1127 contiguous_11" [id=1127, type=contiguous]; -"1128 layer_norm_15" [id=1128, type="layer_norm"]; -"1129 quantize_per_tensor_416" [id=1129, type="quantize_per_tensor"]; -"1130 dequantize_per_tensor_417" [id=1130, type="dequantize_per_tensor"]; -"1131 add_22" [id=1131, type=add]; -"1132 quantize_per_tensor_418" [id=1132, type="quantize_per_tensor"]; -"1133 dequantize_per_tensor_419" [id=1133, type="dequantize_per_tensor"]; -"1134 dequantize_per_tensor_420" [id=1134, type="dequantize_per_tensor"]; -"1135 add_22_0_0_nncf_smooth_quant_0" [id=1135, type="call_module"]; -"1136 quantize_per_tensor_421" [id=1136, type="quantize_per_tensor"]; -"1137 dequantize_per_tensor_422" [id=1137, type="dequantize_per_tensor"]; -"1138 _frozen_param64" [id=1138, type="get_attr"]; -"1139 dequantize_per_tensor_423" [id=1139, 
type="dequantize_per_tensor"]; -"1140 linear_42" [id=1140, type=linear]; -"1141 quantize_per_tensor_424" [id=1141, type="quantize_per_tensor"]; -"1142 dequantize_per_tensor_425" [id=1142, type="dequantize_per_tensor"]; -"1143 gelu_6" [id=1143, type=gelu]; -"1144 dropout_26" [id=1144, type=dropout]; -"1145 dropout_26_0_0_nncf_smooth_quant_0" [id=1145, type="call_module"]; -"1146 quantize_per_tensor_426" [id=1146, type="quantize_per_tensor"]; -"1147 dequantize_per_tensor_427" [id=1147, type="dequantize_per_tensor"]; -"1148 _frozen_param65" [id=1148, type="get_attr"]; -"1149 dequantize_per_tensor_428" [id=1149, type="dequantize_per_tensor"]; -"1150 linear_43" [id=1150, type=linear]; -"1151 quantize_per_tensor_429" [id=1151, type="quantize_per_tensor"]; -"1152 dequantize_per_tensor_430" [id=1152, type="dequantize_per_tensor"]; -"1153 dropout_27" [id=1153, type=dropout]; -"1154 layer_norm_16" [id=1154, type="layer_norm"]; -"1155 quantize_per_tensor_431" [id=1155, type="quantize_per_tensor"]; -"1156 dequantize_per_tensor_432" [id=1156, type="dequantize_per_tensor"]; -"1157 add_23" [id=1157, type=add]; -"1158 quantize_per_tensor_433" [id=1158, type="quantize_per_tensor"]; -"1159 dequantize_per_tensor_434" [id=1159, type="dequantize_per_tensor"]; -"1160 dequantize_per_tensor_435" [id=1160, type="dequantize_per_tensor"]; -"1161 _frozen_param66" [id=1161, type="get_attr"]; -"1162 dequantize_per_tensor_436" [id=1162, type="dequantize_per_tensor"]; -"1163 _frozen_param67" [id=1163, type="get_attr"]; -"1164 dequantize_per_tensor_437" [id=1164, type="dequantize_per_tensor"]; -"1165 linear_44" [id=1165, type=linear]; -"1166 relu__7" [id=1166, type="relu_"]; -"1167 quantize_per_tensor_438" [id=1167, type="quantize_per_tensor"]; -"1168 dequantize_per_tensor_439" [id=1168, type="dequantize_per_tensor"]; -"1169 relu__7_0_0_nncf_smooth_quant_0" [id=1169, type="call_module"]; -"1170 quantize_per_tensor_440" [id=1170, type="quantize_per_tensor"]; -"1171 dequantize_per_tensor_441" 
[id=1171, type="dequantize_per_tensor"]; -"1172 _frozen_param68" [id=1172, type="get_attr"]; -"1173 dequantize_per_tensor_442" [id=1173, type="dequantize_per_tensor"]; -"1174 linear_45" [id=1174, type=linear]; -"1175 quantize_per_tensor_443" [id=1175, type="quantize_per_tensor"]; -"1176 dequantize_per_tensor_444" [id=1176, type="dequantize_per_tensor"]; -"1177 view_37" [id=1177, type=view]; -"1178 quantize_per_tensor_445" [id=1178, type="quantize_per_tensor"]; -"1179 dequantize_per_tensor_446" [id=1179, type="dequantize_per_tensor"]; -"1180 index_7" [id=1180, type=index]; -"1181 view_38" [id=1181, type=view]; -"1182 permute_32" [id=1182, type=permute]; -"1183 contiguous_12" [id=1183, type=contiguous]; -"1184 unsqueeze_19" [id=1184, type=unsqueeze]; -"1185 sigmoid_7" [id=1185, type=sigmoid]; -"1186 quantize_per_tensor_447" [id=1186, type="quantize_per_tensor"]; -"1187 dequantize_per_tensor_448" [id=1187, type="dequantize_per_tensor"]; -"1188 _frozen_param69" [id=1188, type="get_attr"]; -"1189 dequantize_per_tensor_449" [id=1189, type="dequantize_per_tensor"]; -"1190 mul_14" [id=1190, type=mul]; -"1191 quantize_per_tensor_450" [id=1191, type="quantize_per_tensor"]; -"1192 dequantize_per_tensor_451" [id=1192, type="dequantize_per_tensor"]; -"1193 pad_9" [id=1193, type=pad]; -"1194 roll_6" [id=1194, type=roll]; -"1195 view_39" [id=1195, type=view]; -"1196 permute_33" [id=1196, type=permute]; -"1197 reshape_31" [id=1197, type=reshape]; -"1198 clone_7" [id=1198, type=clone]; -"1199 reshape_31_0_0_nncf_smooth_quant_0" [id=1199, type="call_module"]; -"1200 quantize_per_tensor_452" [id=1200, type="quantize_per_tensor"]; -"1201 dequantize_per_tensor_453" [id=1201, type="dequantize_per_tensor"]; -"1202 _frozen_param70" [id=1202, type="get_attr"]; -"1203 dequantize_per_tensor_454" [id=1203, type="dequantize_per_tensor"]; -"1204 linear_46" [id=1204, type=linear]; -"1205 quantize_per_tensor_455" [id=1205, type="quantize_per_tensor"]; -"1206 dequantize_per_tensor_456" [id=1206, 
type="dequantize_per_tensor"]; -"1207 reshape_32" [id=1207, type=reshape]; -"1208 permute_34" [id=1208, type=permute]; -"1209 select_21" [id=1209, type=select]; -"1210 select_22" [id=1210, type=select]; -"1211 select_23" [id=1211, type=select]; -"1212 linalg_vector_norm_14" [id=1212, type="linalg_vector_norm"]; -"1213 clamp_min_14" [id=1213, type="clamp_min"]; -"1214 expand_as_14" [id=1214, type="expand_as"]; -"1215 div_14" [id=1215, type=div]; -"1216 linalg_vector_norm_15" [id=1216, type="linalg_vector_norm"]; -"1217 clamp_min_15" [id=1217, type="clamp_min"]; -"1218 expand_as_15" [id=1218, type="expand_as"]; -"1219 div_15" [id=1219, type=div]; -"1220 transpose_14" [id=1220, type=transpose]; -"1221 matmul_14" [id=1221, type=matmul]; -"1222 quantize_per_tensor_457" [id=1222, type="quantize_per_tensor"]; -"1223 dequantize_per_tensor_458" [id=1223, type="dequantize_per_tensor"]; -"1224 _frozen_param71" [id=1224, type="get_attr"]; -"1225 dequantize_per_tensor_459" [id=1225, type="dequantize_per_tensor"]; -"1226 mul_15" [id=1226, type=mul]; -"1227 quantize_per_tensor_460" [id=1227, type="quantize_per_tensor"]; -"1228 dequantize_per_tensor_461" [id=1228, type="dequantize_per_tensor"]; -"1229 add_24" [id=1229, type=add]; -"1230 quantize_per_tensor_462" [id=1230, type="quantize_per_tensor"]; -"1231 dequantize_per_tensor_463" [id=1231, type="dequantize_per_tensor"]; -"1232 new_zeros_3" [id=1232, type="new_zeros"]; -"1233 view_40" [id=1233, type=view]; -"1234 permute_35" [id=1234, type=permute]; -"1235 reshape_33" [id=1235, type=reshape]; -"1236 unsqueeze_20" [id=1236, type=unsqueeze]; -"1237 unsqueeze_21" [id=1237, type=unsqueeze]; -"1238 sub_3" [id=1238, type=sub]; -"1239 ne_3" [id=1239, type=ne]; -"1240 masked_fill_6" [id=1240, type="masked_fill"]; -"1241 eq_3" [id=1241, type=eq]; -"1242 masked_fill_7" [id=1242, type="masked_fill"]; -"1243 view_41" [id=1243, type=view]; -"1244 quantize_per_tensor_464" [id=1244, type="quantize_per_tensor"]; -"1245 
dequantize_per_tensor_465" [id=1245, type="dequantize_per_tensor"]; -"1246 unsqueeze_22" [id=1246, type=unsqueeze]; -"1247 unsqueeze_23" [id=1247, type=unsqueeze]; -"1248 quantize_per_tensor_466" [id=1248, type="quantize_per_tensor"]; -"1249 dequantize_per_tensor_467" [id=1249, type="dequantize_per_tensor"]; -"1250 add_25" [id=1250, type=add]; -"1251 quantize_per_tensor_468" [id=1251, type="quantize_per_tensor"]; -"1252 dequantize_per_tensor_469" [id=1252, type="dequantize_per_tensor"]; -"1253 view_42" [id=1253, type=view]; -"1254 quantize_per_tensor_470" [id=1254, type="quantize_per_tensor"]; -"1255 dequantize_per_tensor_471" [id=1255, type="dequantize_per_tensor"]; -"1256 softmax_7" [id=1256, type=softmax]; -"1257 dropout_28" [id=1257, type=dropout]; -"1258 matmul_15" [id=1258, type=matmul]; -"1259 transpose_15" [id=1259, type=transpose]; -"1260 reshape_34" [id=1260, type=reshape]; -"1261 reshape_34_0_0_nncf_smooth_quant_0" [id=1261, type="call_module"]; -"1262 quantize_per_tensor_472" [id=1262, type="quantize_per_tensor"]; -"1263 dequantize_per_tensor_473" [id=1263, type="dequantize_per_tensor"]; -"1264 _frozen_param72" [id=1264, type="get_attr"]; -"1265 dequantize_per_tensor_474" [id=1265, type="dequantize_per_tensor"]; -"1266 linear_47" [id=1266, type=linear]; -"1267 quantize_per_tensor_475" [id=1267, type="quantize_per_tensor"]; -"1268 dequantize_per_tensor_476" [id=1268, type="dequantize_per_tensor"]; -"1269 dropout_29" [id=1269, type=dropout]; -"1270 view_43" [id=1270, type=view]; -"1271 permute_36" [id=1271, type=permute]; -"1272 reshape_35" [id=1272, type=reshape]; -"1273 roll_7" [id=1273, type=roll]; -"1274 slice_129" [id=1274, type=slice]; -"1275 slice_130" [id=1275, type=slice]; -"1276 slice_131" [id=1276, type=slice]; -"1277 slice_132" [id=1277, type=slice]; -"1278 contiguous_13" [id=1278, type=contiguous]; -"1279 layer_norm_17" [id=1279, type="layer_norm"]; -"1280 quantize_per_tensor_477" [id=1280, type="quantize_per_tensor"]; -"1281 
dequantize_per_tensor_478" [id=1281, type="dequantize_per_tensor"]; -"1282 add_26" [id=1282, type=add]; -"1283 quantize_per_tensor_479" [id=1283, type="quantize_per_tensor"]; -"1284 dequantize_per_tensor_480" [id=1284, type="dequantize_per_tensor"]; -"1285 dequantize_per_tensor_481" [id=1285, type="dequantize_per_tensor"]; -"1286 add_26_0_0_nncf_smooth_quant_0" [id=1286, type="call_module"]; -"1287 quantize_per_tensor_482" [id=1287, type="quantize_per_tensor"]; -"1288 dequantize_per_tensor_483" [id=1288, type="dequantize_per_tensor"]; -"1289 _frozen_param73" [id=1289, type="get_attr"]; -"1290 dequantize_per_tensor_484" [id=1290, type="dequantize_per_tensor"]; -"1291 linear_48" [id=1291, type=linear]; -"1292 quantize_per_tensor_485" [id=1292, type="quantize_per_tensor"]; -"1293 dequantize_per_tensor_486" [id=1293, type="dequantize_per_tensor"]; -"1294 gelu_7" [id=1294, type=gelu]; -"1295 dropout_30" [id=1295, type=dropout]; -"1296 dropout_30_0_0_nncf_smooth_quant_0" [id=1296, type="call_module"]; -"1297 quantize_per_tensor_487" [id=1297, type="quantize_per_tensor"]; -"1298 dequantize_per_tensor_488" [id=1298, type="dequantize_per_tensor"]; -"1299 _frozen_param74" [id=1299, type="get_attr"]; -"1300 dequantize_per_tensor_489" [id=1300, type="dequantize_per_tensor"]; -"1301 linear_49" [id=1301, type=linear]; -"1302 quantize_per_tensor_490" [id=1302, type="quantize_per_tensor"]; -"1303 dequantize_per_tensor_491" [id=1303, type="dequantize_per_tensor"]; -"1304 dropout_31" [id=1304, type=dropout]; -"1305 layer_norm_18" [id=1305, type="layer_norm"]; -"1306 quantize_per_tensor_492" [id=1306, type="quantize_per_tensor"]; -"1307 dequantize_per_tensor_493" [id=1307, type="dequantize_per_tensor"]; -"1308 add_27" [id=1308, type=add]; -"1309 quantize_per_tensor_494" [id=1309, type="quantize_per_tensor"]; -"1310 dequantize_per_tensor_495" [id=1310, type="dequantize_per_tensor"]; -"1311 dequantize_per_tensor_496" [id=1311, type="dequantize_per_tensor"]; -"1312 _frozen_param75" 
[id=1312, type="get_attr"]; -"1313 dequantize_per_tensor_497" [id=1313, type="dequantize_per_tensor"]; -"1314 _frozen_param76" [id=1314, type="get_attr"]; -"1315 dequantize_per_tensor_498" [id=1315, type="dequantize_per_tensor"]; -"1316 linear_50" [id=1316, type=linear]; -"1317 relu__8" [id=1317, type="relu_"]; -"1318 quantize_per_tensor_499" [id=1318, type="quantize_per_tensor"]; -"1319 dequantize_per_tensor_500" [id=1319, type="dequantize_per_tensor"]; -"1320 relu__8_0_0_nncf_smooth_quant_0" [id=1320, type="call_module"]; -"1321 quantize_per_tensor_501" [id=1321, type="quantize_per_tensor"]; -"1322 dequantize_per_tensor_502" [id=1322, type="dequantize_per_tensor"]; -"1323 _frozen_param77" [id=1323, type="get_attr"]; -"1324 dequantize_per_tensor_503" [id=1324, type="dequantize_per_tensor"]; -"1325 linear_51" [id=1325, type=linear]; -"1326 quantize_per_tensor_504" [id=1326, type="quantize_per_tensor"]; -"1327 dequantize_per_tensor_505" [id=1327, type="dequantize_per_tensor"]; -"1328 view_44" [id=1328, type=view]; -"1329 quantize_per_tensor_506" [id=1329, type="quantize_per_tensor"]; -"1330 dequantize_per_tensor_507" [id=1330, type="dequantize_per_tensor"]; -"1331 index_8" [id=1331, type=index]; -"1332 view_45" [id=1332, type=view]; -"1333 permute_37" [id=1333, type=permute]; -"1334 contiguous_14" [id=1334, type=contiguous]; -"1335 unsqueeze_24" [id=1335, type=unsqueeze]; -"1336 sigmoid_8" [id=1336, type=sigmoid]; -"1337 quantize_per_tensor_508" [id=1337, type="quantize_per_tensor"]; -"1338 dequantize_per_tensor_509" [id=1338, type="dequantize_per_tensor"]; -"1339 _frozen_param78" [id=1339, type="get_attr"]; -"1340 dequantize_per_tensor_510" [id=1340, type="dequantize_per_tensor"]; -"1341 mul_16" [id=1341, type=mul]; -"1342 quantize_per_tensor_511" [id=1342, type="quantize_per_tensor"]; -"1343 dequantize_per_tensor_512" [id=1343, type="dequantize_per_tensor"]; -"1344 pad_10" [id=1344, type=pad]; -"1345 view_46" [id=1345, type=view]; -"1346 permute_38" [id=1346, 
type=permute]; -"1347 reshape_36" [id=1347, type=reshape]; -"1348 clone_8" [id=1348, type=clone]; -"1349 reshape_36_0_0_nncf_smooth_quant_0" [id=1349, type="call_module"]; -"1350 quantize_per_tensor_513" [id=1350, type="quantize_per_tensor"]; -"1351 dequantize_per_tensor_514" [id=1351, type="dequantize_per_tensor"]; -"1352 _frozen_param79" [id=1352, type="get_attr"]; -"1353 dequantize_per_tensor_515" [id=1353, type="dequantize_per_tensor"]; -"1354 linear_52" [id=1354, type=linear]; -"1355 quantize_per_tensor_516" [id=1355, type="quantize_per_tensor"]; -"1356 dequantize_per_tensor_517" [id=1356, type="dequantize_per_tensor"]; -"1357 reshape_37" [id=1357, type=reshape]; -"1358 permute_39" [id=1358, type=permute]; -"1359 select_24" [id=1359, type=select]; -"1360 select_25" [id=1360, type=select]; -"1361 select_26" [id=1361, type=select]; -"1362 linalg_vector_norm_16" [id=1362, type="linalg_vector_norm"]; -"1363 clamp_min_16" [id=1363, type="clamp_min"]; -"1364 expand_as_16" [id=1364, type="expand_as"]; -"1365 div_16" [id=1365, type=div]; -"1366 linalg_vector_norm_17" [id=1366, type="linalg_vector_norm"]; -"1367 clamp_min_17" [id=1367, type="clamp_min"]; -"1368 expand_as_17" [id=1368, type="expand_as"]; -"1369 div_17" [id=1369, type=div]; -"1370 transpose_16" [id=1370, type=transpose]; -"1371 matmul_16" [id=1371, type=matmul]; -"1372 quantize_per_tensor_518" [id=1372, type="quantize_per_tensor"]; -"1373 dequantize_per_tensor_519" [id=1373, type="dequantize_per_tensor"]; -"1374 _frozen_param80" [id=1374, type="get_attr"]; -"1375 dequantize_per_tensor_520" [id=1375, type="dequantize_per_tensor"]; -"1376 mul_17" [id=1376, type=mul]; -"1377 quantize_per_tensor_521" [id=1377, type="quantize_per_tensor"]; -"1378 dequantize_per_tensor_522" [id=1378, type="dequantize_per_tensor"]; -"1379 add_28" [id=1379, type=add]; -"1380 quantize_per_tensor_523" [id=1380, type="quantize_per_tensor"]; -"1381 dequantize_per_tensor_524" [id=1381, type="dequantize_per_tensor"]; -"1382 softmax_8" 
[id=1382, type=softmax]; -"1383 dropout_32" [id=1383, type=dropout]; -"1384 matmul_17" [id=1384, type=matmul]; -"1385 transpose_17" [id=1385, type=transpose]; -"1386 reshape_38" [id=1386, type=reshape]; -"1387 reshape_38_0_0_nncf_smooth_quant_0" [id=1387, type="call_module"]; -"1388 quantize_per_tensor_525" [id=1388, type="quantize_per_tensor"]; -"1389 dequantize_per_tensor_526" [id=1389, type="dequantize_per_tensor"]; -"1390 _frozen_param81" [id=1390, type="get_attr"]; -"1391 dequantize_per_tensor_527" [id=1391, type="dequantize_per_tensor"]; -"1392 linear_53" [id=1392, type=linear]; -"1393 quantize_per_tensor_528" [id=1393, type="quantize_per_tensor"]; -"1394 dequantize_per_tensor_529" [id=1394, type="dequantize_per_tensor"]; -"1395 dropout_33" [id=1395, type=dropout]; -"1396 view_47" [id=1396, type=view]; -"1397 permute_40" [id=1397, type=permute]; -"1398 reshape_39" [id=1398, type=reshape]; -"1399 slice_134" [id=1399, type=slice]; -"1400 slice_135" [id=1400, type=slice]; -"1401 slice_136" [id=1401, type=slice]; -"1402 slice_137" [id=1402, type=slice]; -"1403 contiguous_15" [id=1403, type=contiguous]; -"1404 layer_norm_19" [id=1404, type="layer_norm"]; -"1405 quantize_per_tensor_530" [id=1405, type="quantize_per_tensor"]; -"1406 dequantize_per_tensor_531" [id=1406, type="dequantize_per_tensor"]; -"1407 add_29" [id=1407, type=add]; -"1408 quantize_per_tensor_532" [id=1408, type="quantize_per_tensor"]; -"1409 dequantize_per_tensor_533" [id=1409, type="dequantize_per_tensor"]; -"1410 dequantize_per_tensor_534" [id=1410, type="dequantize_per_tensor"]; -"1411 add_29_0_0_nncf_smooth_quant_0" [id=1411, type="call_module"]; -"1412 quantize_per_tensor_535" [id=1412, type="quantize_per_tensor"]; -"1413 dequantize_per_tensor_536" [id=1413, type="dequantize_per_tensor"]; -"1414 _frozen_param82" [id=1414, type="get_attr"]; -"1415 dequantize_per_tensor_537" [id=1415, type="dequantize_per_tensor"]; -"1416 linear_54" [id=1416, type=linear]; -"1417 quantize_per_tensor_538" 
[id=1417, type="quantize_per_tensor"]; -"1418 dequantize_per_tensor_539" [id=1418, type="dequantize_per_tensor"]; -"1419 gelu_8" [id=1419, type=gelu]; -"1420 dropout_34" [id=1420, type=dropout]; -"1421 dropout_34_0_0_nncf_smooth_quant_0" [id=1421, type="call_module"]; -"1422 quantize_per_tensor_540" [id=1422, type="quantize_per_tensor"]; -"1423 dequantize_per_tensor_541" [id=1423, type="dequantize_per_tensor"]; -"1424 _frozen_param83" [id=1424, type="get_attr"]; -"1425 dequantize_per_tensor_542" [id=1425, type="dequantize_per_tensor"]; -"1426 linear_55" [id=1426, type=linear]; -"1427 quantize_per_tensor_543" [id=1427, type="quantize_per_tensor"]; -"1428 dequantize_per_tensor_544" [id=1428, type="dequantize_per_tensor"]; -"1429 dropout_35" [id=1429, type=dropout]; -"1430 layer_norm_20" [id=1430, type="layer_norm"]; -"1431 quantize_per_tensor_545" [id=1431, type="quantize_per_tensor"]; -"1432 dequantize_per_tensor_546" [id=1432, type="dequantize_per_tensor"]; -"1433 add_30" [id=1433, type=add]; -"1434 quantize_per_tensor_547" [id=1434, type="quantize_per_tensor"]; -"1435 dequantize_per_tensor_548" [id=1435, type="dequantize_per_tensor"]; -"1436 dequantize_per_tensor_549" [id=1436, type="dequantize_per_tensor"]; -"1437 _frozen_param84" [id=1437, type="get_attr"]; -"1438 dequantize_per_tensor_550" [id=1438, type="dequantize_per_tensor"]; -"1439 _frozen_param85" [id=1439, type="get_attr"]; -"1440 dequantize_per_tensor_551" [id=1440, type="dequantize_per_tensor"]; -"1441 linear_56" [id=1441, type=linear]; -"1442 relu__9" [id=1442, type="relu_"]; -"1443 quantize_per_tensor_552" [id=1443, type="quantize_per_tensor"]; -"1444 dequantize_per_tensor_553" [id=1444, type="dequantize_per_tensor"]; -"1445 relu__9_0_0_nncf_smooth_quant_0" [id=1445, type="call_module"]; -"1446 quantize_per_tensor_554" [id=1446, type="quantize_per_tensor"]; -"1447 dequantize_per_tensor_555" [id=1447, type="dequantize_per_tensor"]; -"1448 _frozen_param86" [id=1448, type="get_attr"]; -"1449 
dequantize_per_tensor_556" [id=1449, type="dequantize_per_tensor"]; -"1450 linear_57" [id=1450, type=linear]; -"1451 quantize_per_tensor_557" [id=1451, type="quantize_per_tensor"]; -"1452 dequantize_per_tensor_558" [id=1452, type="dequantize_per_tensor"]; -"1453 view_48" [id=1453, type=view]; -"1454 quantize_per_tensor_559" [id=1454, type="quantize_per_tensor"]; -"1455 dequantize_per_tensor_560" [id=1455, type="dequantize_per_tensor"]; -"1456 index_9" [id=1456, type=index]; -"1457 view_49" [id=1457, type=view]; -"1458 permute_41" [id=1458, type=permute]; -"1459 contiguous_16" [id=1459, type=contiguous]; -"1460 unsqueeze_25" [id=1460, type=unsqueeze]; -"1461 sigmoid_9" [id=1461, type=sigmoid]; -"1462 quantize_per_tensor_561" [id=1462, type="quantize_per_tensor"]; -"1463 dequantize_per_tensor_562" [id=1463, type="dequantize_per_tensor"]; -"1464 _frozen_param87" [id=1464, type="get_attr"]; -"1465 dequantize_per_tensor_563" [id=1465, type="dequantize_per_tensor"]; -"1466 mul_18" [id=1466, type=mul]; -"1467 quantize_per_tensor_564" [id=1467, type="quantize_per_tensor"]; -"1468 dequantize_per_tensor_565" [id=1468, type="dequantize_per_tensor"]; -"1469 pad_11" [id=1469, type=pad]; -"1470 roll_8" [id=1470, type=roll]; -"1471 view_50" [id=1471, type=view]; -"1472 permute_42" [id=1472, type=permute]; -"1473 reshape_40" [id=1473, type=reshape]; -"1474 clone_9" [id=1474, type=clone]; -"1475 reshape_40_0_0_nncf_smooth_quant_0" [id=1475, type="call_module"]; -"1476 quantize_per_tensor_566" [id=1476, type="quantize_per_tensor"]; -"1477 dequantize_per_tensor_567" [id=1477, type="dequantize_per_tensor"]; -"1478 _frozen_param88" [id=1478, type="get_attr"]; -"1479 dequantize_per_tensor_568" [id=1479, type="dequantize_per_tensor"]; -"1480 linear_58" [id=1480, type=linear]; -"1481 quantize_per_tensor_569" [id=1481, type="quantize_per_tensor"]; -"1482 dequantize_per_tensor_570" [id=1482, type="dequantize_per_tensor"]; -"1483 reshape_41" [id=1483, type=reshape]; -"1484 permute_43" 
[id=1484, type=permute]; -"1485 select_27" [id=1485, type=select]; -"1486 select_28" [id=1486, type=select]; -"1487 select_29" [id=1487, type=select]; -"1488 linalg_vector_norm_18" [id=1488, type="linalg_vector_norm"]; -"1489 clamp_min_18" [id=1489, type="clamp_min"]; -"1490 expand_as_18" [id=1490, type="expand_as"]; -"1491 div_18" [id=1491, type=div]; -"1492 linalg_vector_norm_19" [id=1492, type="linalg_vector_norm"]; -"1493 clamp_min_19" [id=1493, type="clamp_min"]; -"1494 expand_as_19" [id=1494, type="expand_as"]; -"1495 div_19" [id=1495, type=div]; -"1496 transpose_18" [id=1496, type=transpose]; -"1497 matmul_18" [id=1497, type=matmul]; -"1498 quantize_per_tensor_571" [id=1498, type="quantize_per_tensor"]; -"1499 dequantize_per_tensor_572" [id=1499, type="dequantize_per_tensor"]; -"1500 _frozen_param89" [id=1500, type="get_attr"]; -"1501 dequantize_per_tensor_573" [id=1501, type="dequantize_per_tensor"]; -"1502 mul_19" [id=1502, type=mul]; -"1503 quantize_per_tensor_574" [id=1503, type="quantize_per_tensor"]; -"1504 dequantize_per_tensor_575" [id=1504, type="dequantize_per_tensor"]; -"1505 add_31" [id=1505, type=add]; -"1506 quantize_per_tensor_576" [id=1506, type="quantize_per_tensor"]; -"1507 dequantize_per_tensor_577" [id=1507, type="dequantize_per_tensor"]; -"1508 new_zeros_4" [id=1508, type="new_zeros"]; -"1509 view_51" [id=1509, type=view]; -"1510 permute_44" [id=1510, type=permute]; -"1511 reshape_42" [id=1511, type=reshape]; -"1512 unsqueeze_26" [id=1512, type=unsqueeze]; -"1513 unsqueeze_27" [id=1513, type=unsqueeze]; -"1514 sub_4" [id=1514, type=sub]; -"1515 ne_4" [id=1515, type=ne]; -"1516 masked_fill_8" [id=1516, type="masked_fill"]; -"1517 eq_4" [id=1517, type=eq]; -"1518 masked_fill_9" [id=1518, type="masked_fill"]; -"1519 view_52" [id=1519, type=view]; -"1520 quantize_per_tensor_578" [id=1520, type="quantize_per_tensor"]; -"1521 dequantize_per_tensor_579" [id=1521, type="dequantize_per_tensor"]; -"1522 unsqueeze_28" [id=1522, type=unsqueeze]; 
-"1523 unsqueeze_29" [id=1523, type=unsqueeze]; -"1524 quantize_per_tensor_580" [id=1524, type="quantize_per_tensor"]; -"1525 dequantize_per_tensor_581" [id=1525, type="dequantize_per_tensor"]; -"1526 add_32" [id=1526, type=add]; -"1527 quantize_per_tensor_582" [id=1527, type="quantize_per_tensor"]; -"1528 dequantize_per_tensor_583" [id=1528, type="dequantize_per_tensor"]; -"1529 view_53" [id=1529, type=view]; -"1530 quantize_per_tensor_584" [id=1530, type="quantize_per_tensor"]; -"1531 dequantize_per_tensor_585" [id=1531, type="dequantize_per_tensor"]; -"1532 softmax_9" [id=1532, type=softmax]; -"1533 dropout_36" [id=1533, type=dropout]; -"1534 matmul_19" [id=1534, type=matmul]; -"1535 transpose_19" [id=1535, type=transpose]; -"1536 reshape_43" [id=1536, type=reshape]; -"1537 reshape_43_0_0_nncf_smooth_quant_0" [id=1537, type="call_module"]; -"1538 quantize_per_tensor_586" [id=1538, type="quantize_per_tensor"]; -"1539 dequantize_per_tensor_587" [id=1539, type="dequantize_per_tensor"]; -"1540 _frozen_param90" [id=1540, type="get_attr"]; -"1541 dequantize_per_tensor_588" [id=1541, type="dequantize_per_tensor"]; -"1542 linear_59" [id=1542, type=linear]; -"1543 quantize_per_tensor_589" [id=1543, type="quantize_per_tensor"]; -"1544 dequantize_per_tensor_590" [id=1544, type="dequantize_per_tensor"]; -"1545 dropout_37" [id=1545, type=dropout]; -"1546 view_54" [id=1546, type=view]; -"1547 permute_45" [id=1547, type=permute]; -"1548 reshape_44" [id=1548, type=reshape]; -"1549 roll_9" [id=1549, type=roll]; -"1550 slice_157" [id=1550, type=slice]; -"1551 slice_158" [id=1551, type=slice]; -"1552 slice_159" [id=1552, type=slice]; -"1553 slice_160" [id=1553, type=slice]; -"1554 contiguous_17" [id=1554, type=contiguous]; -"1555 layer_norm_21" [id=1555, type="layer_norm"]; -"1556 quantize_per_tensor_591" [id=1556, type="quantize_per_tensor"]; -"1557 dequantize_per_tensor_592" [id=1557, type="dequantize_per_tensor"]; -"1558 add_33" [id=1558, type=add]; -"1559 
quantize_per_tensor_593" [id=1559, type="quantize_per_tensor"]; -"1560 dequantize_per_tensor_594" [id=1560, type="dequantize_per_tensor"]; -"1561 dequantize_per_tensor_595" [id=1561, type="dequantize_per_tensor"]; -"1562 add_33_0_0_nncf_smooth_quant_0" [id=1562, type="call_module"]; -"1563 quantize_per_tensor_596" [id=1563, type="quantize_per_tensor"]; -"1564 dequantize_per_tensor_597" [id=1564, type="dequantize_per_tensor"]; -"1565 _frozen_param91" [id=1565, type="get_attr"]; -"1566 dequantize_per_tensor_598" [id=1566, type="dequantize_per_tensor"]; -"1567 linear_60" [id=1567, type=linear]; -"1568 quantize_per_tensor_599" [id=1568, type="quantize_per_tensor"]; -"1569 dequantize_per_tensor_600" [id=1569, type="dequantize_per_tensor"]; -"1570 gelu_9" [id=1570, type=gelu]; -"1571 dropout_38" [id=1571, type=dropout]; -"1572 dropout_38_0_0_nncf_smooth_quant_0" [id=1572, type="call_module"]; -"1573 quantize_per_tensor_601" [id=1573, type="quantize_per_tensor"]; -"1574 dequantize_per_tensor_602" [id=1574, type="dequantize_per_tensor"]; -"1575 _frozen_param92" [id=1575, type="get_attr"]; -"1576 dequantize_per_tensor_603" [id=1576, type="dequantize_per_tensor"]; -"1577 linear_61" [id=1577, type=linear]; -"1578 quantize_per_tensor_604" [id=1578, type="quantize_per_tensor"]; -"1579 dequantize_per_tensor_605" [id=1579, type="dequantize_per_tensor"]; -"1580 dropout_39" [id=1580, type=dropout]; -"1581 layer_norm_22" [id=1581, type="layer_norm"]; -"1582 quantize_per_tensor_606" [id=1582, type="quantize_per_tensor"]; -"1583 dequantize_per_tensor_607" [id=1583, type="dequantize_per_tensor"]; -"1584 add_34" [id=1584, type=add]; -"1585 quantize_per_tensor_608" [id=1585, type="quantize_per_tensor"]; -"1586 dequantize_per_tensor_609" [id=1586, type="dequantize_per_tensor"]; -"1587 pad_12" [id=1587, type=pad]; -"1588 slice_161" [id=1588, type=slice]; -"1589 slice_162" [id=1589, type=slice]; -"1590 slice_163" [id=1590, type=slice]; -"1591 quantize_per_tensor_610" [id=1591, 
type="quantize_per_tensor"]; -"1592 dequantize_per_tensor_611" [id=1592, type="dequantize_per_tensor"]; -"1593 slice_164" [id=1593, type=slice]; -"1594 slice_165" [id=1594, type=slice]; -"1595 slice_166" [id=1595, type=slice]; -"1596 quantize_per_tensor_612" [id=1596, type="quantize_per_tensor"]; -"1597 dequantize_per_tensor_613" [id=1597, type="dequantize_per_tensor"]; -"1598 slice_167" [id=1598, type=slice]; -"1599 slice_168" [id=1599, type=slice]; -"1600 slice_169" [id=1600, type=slice]; -"1601 quantize_per_tensor_614" [id=1601, type="quantize_per_tensor"]; -"1602 dequantize_per_tensor_615" [id=1602, type="dequantize_per_tensor"]; -"1603 slice_170" [id=1603, type=slice]; -"1604 slice_171" [id=1604, type=slice]; -"1605 slice_172" [id=1605, type=slice]; -"1606 quantize_per_tensor_616" [id=1606, type="quantize_per_tensor"]; -"1607 dequantize_per_tensor_617" [id=1607, type="dequantize_per_tensor"]; -"1608 cat_2" [id=1608, type=cat]; -"1609 quantize_per_tensor_618" [id=1609, type="quantize_per_tensor"]; -"1610 dequantize_per_tensor_619" [id=1610, type="dequantize_per_tensor"]; -"1611 cat_2_0_0_nncf_smooth_quant_0" [id=1611, type="call_module"]; -"1612 quantize_per_tensor_620" [id=1612, type="quantize_per_tensor"]; -"1613 dequantize_per_tensor_621" [id=1613, type="dequantize_per_tensor"]; -"1614 _frozen_param93" [id=1614, type="get_attr"]; -"1615 dequantize_per_tensor_622" [id=1615, type="dequantize_per_tensor"]; -"1616 linear_62" [id=1616, type=linear]; -"1617 quantize_per_tensor_623" [id=1617, type="quantize_per_tensor"]; -"1618 dequantize_per_tensor_624" [id=1618, type="dequantize_per_tensor"]; -"1619 layer_norm_23" [id=1619, type="layer_norm"]; -"1620 _frozen_param94" [id=1620, type="get_attr"]; -"1621 dequantize_per_tensor_625" [id=1621, type="dequantize_per_tensor"]; -"1622 _frozen_param95" [id=1622, type="get_attr"]; -"1623 dequantize_per_tensor_626" [id=1623, type="dequantize_per_tensor"]; -"1624 linear_63" [id=1624, type=linear]; -"1625 relu__10" [id=1625, 
type="relu_"]; -"1626 quantize_per_tensor_627" [id=1626, type="quantize_per_tensor"]; -"1627 dequantize_per_tensor_628" [id=1627, type="dequantize_per_tensor"]; -"1628 relu__10_0_0_nncf_smooth_quant_0" [id=1628, type="call_module"]; -"1629 quantize_per_tensor_629" [id=1629, type="quantize_per_tensor"]; -"1630 dequantize_per_tensor_630" [id=1630, type="dequantize_per_tensor"]; -"1631 _frozen_param96" [id=1631, type="get_attr"]; -"1632 dequantize_per_tensor_631" [id=1632, type="dequantize_per_tensor"]; -"1633 linear_64" [id=1633, type=linear]; -"1634 quantize_per_tensor_632" [id=1634, type="quantize_per_tensor"]; -"1635 dequantize_per_tensor_633" [id=1635, type="dequantize_per_tensor"]; -"1636 view_55" [id=1636, type=view]; -"1637 quantize_per_tensor_634" [id=1637, type="quantize_per_tensor"]; -"1638 dequantize_per_tensor_635" [id=1638, type="dequantize_per_tensor"]; -"1639 index_10" [id=1639, type=index]; -"1640 view_56" [id=1640, type=view]; -"1641 permute_46" [id=1641, type=permute]; -"1642 contiguous_18" [id=1642, type=contiguous]; -"1643 unsqueeze_30" [id=1643, type=unsqueeze]; -"1644 sigmoid_10" [id=1644, type=sigmoid]; -"1645 quantize_per_tensor_636" [id=1645, type="quantize_per_tensor"]; -"1646 dequantize_per_tensor_637" [id=1646, type="dequantize_per_tensor"]; -"1647 _frozen_param97" [id=1647, type="get_attr"]; -"1648 dequantize_per_tensor_638" [id=1648, type="dequantize_per_tensor"]; -"1649 mul_20" [id=1649, type=mul]; -"1650 quantize_per_tensor_639" [id=1650, type="quantize_per_tensor"]; -"1651 dequantize_per_tensor_640" [id=1651, type="dequantize_per_tensor"]; -"1652 pad_13" [id=1652, type=pad]; -"1653 view_57" [id=1653, type=view]; -"1654 permute_47" [id=1654, type=permute]; -"1655 reshape_45" [id=1655, type=reshape]; -"1656 clone_10" [id=1656, type=clone]; -"1657 reshape_45_0_0_nncf_smooth_quant_0" [id=1657, type="call_module"]; -"1658 quantize_per_tensor_641" [id=1658, type="quantize_per_tensor"]; -"1659 dequantize_per_tensor_642" [id=1659, 
type="dequantize_per_tensor"]; -"1660 _frozen_param98" [id=1660, type="get_attr"]; -"1661 dequantize_per_tensor_643" [id=1661, type="dequantize_per_tensor"]; -"1662 linear_65" [id=1662, type=linear]; -"1663 quantize_per_tensor_644" [id=1663, type="quantize_per_tensor"]; -"1664 dequantize_per_tensor_645" [id=1664, type="dequantize_per_tensor"]; -"1665 reshape_46" [id=1665, type=reshape]; -"1666 permute_48" [id=1666, type=permute]; -"1667 select_30" [id=1667, type=select]; -"1668 select_31" [id=1668, type=select]; -"1669 select_32" [id=1669, type=select]; -"1670 linalg_vector_norm_20" [id=1670, type="linalg_vector_norm"]; -"1671 clamp_min_20" [id=1671, type="clamp_min"]; -"1672 expand_as_20" [id=1672, type="expand_as"]; -"1673 div_20" [id=1673, type=div]; -"1674 linalg_vector_norm_21" [id=1674, type="linalg_vector_norm"]; -"1675 clamp_min_21" [id=1675, type="clamp_min"]; -"1676 expand_as_21" [id=1676, type="expand_as"]; -"1677 div_21" [id=1677, type=div]; -"1678 transpose_20" [id=1678, type=transpose]; -"1679 matmul_20" [id=1679, type=matmul]; -"1680 quantize_per_tensor_646" [id=1680, type="quantize_per_tensor"]; -"1681 dequantize_per_tensor_647" [id=1681, type="dequantize_per_tensor"]; -"1682 _frozen_param99" [id=1682, type="get_attr"]; -"1683 dequantize_per_tensor_648" [id=1683, type="dequantize_per_tensor"]; -"1684 mul_21" [id=1684, type=mul]; -"1685 quantize_per_tensor_649" [id=1685, type="quantize_per_tensor"]; -"1686 dequantize_per_tensor_650" [id=1686, type="dequantize_per_tensor"]; -"1687 add_35" [id=1687, type=add]; -"1688 quantize_per_tensor_651" [id=1688, type="quantize_per_tensor"]; -"1689 dequantize_per_tensor_652" [id=1689, type="dequantize_per_tensor"]; -"1690 softmax_10" [id=1690, type=softmax]; -"1691 dropout_40" [id=1691, type=dropout]; -"1692 matmul_21" [id=1692, type=matmul]; -"1693 transpose_21" [id=1693, type=transpose]; -"1694 reshape_47" [id=1694, type=reshape]; -"1695 reshape_47_0_0_nncf_smooth_quant_0" [id=1695, type="call_module"]; -"1696 
quantize_per_tensor_653" [id=1696, type="quantize_per_tensor"]; -"1697 dequantize_per_tensor_654" [id=1697, type="dequantize_per_tensor"]; -"1698 _frozen_param100" [id=1698, type="get_attr"]; -"1699 dequantize_per_tensor_655" [id=1699, type="dequantize_per_tensor"]; -"1700 linear_66" [id=1700, type=linear]; -"1701 quantize_per_tensor_656" [id=1701, type="quantize_per_tensor"]; -"1702 dequantize_per_tensor_657" [id=1702, type="dequantize_per_tensor"]; -"1703 dropout_41" [id=1703, type=dropout]; -"1704 view_58" [id=1704, type=view]; -"1705 permute_49" [id=1705, type=permute]; -"1706 reshape_48" [id=1706, type=reshape]; -"1707 slice_174" [id=1707, type=slice]; -"1708 slice_175" [id=1708, type=slice]; -"1709 slice_176" [id=1709, type=slice]; -"1710 slice_177" [id=1710, type=slice]; -"1711 contiguous_19" [id=1711, type=contiguous]; -"1712 layer_norm_24" [id=1712, type="layer_norm"]; -"1713 quantize_per_tensor_658" [id=1713, type="quantize_per_tensor"]; -"1714 dequantize_per_tensor_659" [id=1714, type="dequantize_per_tensor"]; -"1715 quantize_per_tensor_660" [id=1715, type="quantize_per_tensor"]; -"1716 dequantize_per_tensor_661" [id=1716, type="dequantize_per_tensor"]; -"1717 add_36" [id=1717, type=add]; -"1718 quantize_per_tensor_662" [id=1718, type="quantize_per_tensor"]; -"1719 dequantize_per_tensor_663" [id=1719, type="dequantize_per_tensor"]; -"1720 dequantize_per_tensor_664" [id=1720, type="dequantize_per_tensor"]; -"1721 add_36_0_0_nncf_smooth_quant_0" [id=1721, type="call_module"]; -"1722 quantize_per_tensor_665" [id=1722, type="quantize_per_tensor"]; -"1723 dequantize_per_tensor_666" [id=1723, type="dequantize_per_tensor"]; -"1724 _frozen_param101" [id=1724, type="get_attr"]; -"1725 dequantize_per_tensor_667" [id=1725, type="dequantize_per_tensor"]; -"1726 linear_67" [id=1726, type=linear]; -"1727 quantize_per_tensor_668" [id=1727, type="quantize_per_tensor"]; -"1728 dequantize_per_tensor_669" [id=1728, type="dequantize_per_tensor"]; -"1729 gelu_10" [id=1729, 
type=gelu]; -"1730 dropout_42" [id=1730, type=dropout]; -"1731 dropout_42_0_0_nncf_smooth_quant_0" [id=1731, type="call_module"]; -"1732 quantize_per_tensor_670" [id=1732, type="quantize_per_tensor"]; -"1733 dequantize_per_tensor_671" [id=1733, type="dequantize_per_tensor"]; -"1734 _frozen_param102" [id=1734, type="get_attr"]; -"1735 dequantize_per_tensor_672" [id=1735, type="dequantize_per_tensor"]; -"1736 linear_68" [id=1736, type=linear]; -"1737 quantize_per_tensor_673" [id=1737, type="quantize_per_tensor"]; -"1738 dequantize_per_tensor_674" [id=1738, type="dequantize_per_tensor"]; -"1739 dropout_43" [id=1739, type=dropout]; -"1740 layer_norm_25" [id=1740, type="layer_norm"]; -"1741 quantize_per_tensor_675" [id=1741, type="quantize_per_tensor"]; -"1742 dequantize_per_tensor_676" [id=1742, type="dequantize_per_tensor"]; -"1743 add_37" [id=1743, type=add]; -"1744 quantize_per_tensor_677" [id=1744, type="quantize_per_tensor"]; -"1745 dequantize_per_tensor_678" [id=1745, type="dequantize_per_tensor"]; -"1746 dequantize_per_tensor_679" [id=1746, type="dequantize_per_tensor"]; -"1747 _frozen_param103" [id=1747, type="get_attr"]; -"1748 dequantize_per_tensor_680" [id=1748, type="dequantize_per_tensor"]; -"1749 _frozen_param104" [id=1749, type="get_attr"]; -"1750 dequantize_per_tensor_681" [id=1750, type="dequantize_per_tensor"]; -"1751 linear_69" [id=1751, type=linear]; -"1752 relu__11" [id=1752, type="relu_"]; -"1753 quantize_per_tensor_682" [id=1753, type="quantize_per_tensor"]; -"1754 dequantize_per_tensor_683" [id=1754, type="dequantize_per_tensor"]; -"1755 relu__11_0_0_nncf_smooth_quant_0" [id=1755, type="call_module"]; -"1756 quantize_per_tensor_684" [id=1756, type="quantize_per_tensor"]; -"1757 dequantize_per_tensor_685" [id=1757, type="dequantize_per_tensor"]; -"1758 _frozen_param105" [id=1758, type="get_attr"]; -"1759 dequantize_per_tensor_686" [id=1759, type="dequantize_per_tensor"]; -"1760 linear_70" [id=1760, type=linear]; -"1761 quantize_per_tensor_687" 
[id=1761, type="quantize_per_tensor"]; -"1762 dequantize_per_tensor_688" [id=1762, type="dequantize_per_tensor"]; -"1763 view_59" [id=1763, type=view]; -"1764 quantize_per_tensor_689" [id=1764, type="quantize_per_tensor"]; -"1765 dequantize_per_tensor_690" [id=1765, type="dequantize_per_tensor"]; -"1766 index_11" [id=1766, type=index]; -"1767 view_60" [id=1767, type=view]; -"1768 permute_50" [id=1768, type=permute]; -"1769 contiguous_20" [id=1769, type=contiguous]; -"1770 unsqueeze_31" [id=1770, type=unsqueeze]; -"1771 sigmoid_11" [id=1771, type=sigmoid]; -"1772 quantize_per_tensor_691" [id=1772, type="quantize_per_tensor"]; -"1773 dequantize_per_tensor_692" [id=1773, type="dequantize_per_tensor"]; -"1774 _frozen_param106" [id=1774, type="get_attr"]; -"1775 dequantize_per_tensor_693" [id=1775, type="dequantize_per_tensor"]; -"1776 mul_22" [id=1776, type=mul]; -"1777 quantize_per_tensor_694" [id=1777, type="quantize_per_tensor"]; -"1778 dequantize_per_tensor_695" [id=1778, type="dequantize_per_tensor"]; -"1779 pad_14" [id=1779, type=pad]; -"1780 view_61" [id=1780, type=view]; -"1781 permute_51" [id=1781, type=permute]; -"1782 reshape_49" [id=1782, type=reshape]; -"1783 clone_11" [id=1783, type=clone]; -"1784 reshape_49_0_0_nncf_smooth_quant_0" [id=1784, type="call_module"]; -"1785 quantize_per_tensor_696" [id=1785, type="quantize_per_tensor"]; -"1786 dequantize_per_tensor_697" [id=1786, type="dequantize_per_tensor"]; -"1787 _frozen_param107" [id=1787, type="get_attr"]; -"1788 dequantize_per_tensor_698" [id=1788, type="dequantize_per_tensor"]; -"1789 linear_71" [id=1789, type=linear]; -"1790 quantize_per_tensor_699" [id=1790, type="quantize_per_tensor"]; -"1791 dequantize_per_tensor_700" [id=1791, type="dequantize_per_tensor"]; -"1792 reshape_50" [id=1792, type=reshape]; -"1793 permute_52" [id=1793, type=permute]; -"1794 select_33" [id=1794, type=select]; -"1795 select_34" [id=1795, type=select]; -"1796 select_35" [id=1796, type=select]; -"1797 linalg_vector_norm_22" 
[id=1797, type="linalg_vector_norm"]; -"1798 clamp_min_22" [id=1798, type="clamp_min"]; -"1799 expand_as_22" [id=1799, type="expand_as"]; -"1800 div_22" [id=1800, type=div]; -"1801 linalg_vector_norm_23" [id=1801, type="linalg_vector_norm"]; -"1802 clamp_min_23" [id=1802, type="clamp_min"]; -"1803 expand_as_23" [id=1803, type="expand_as"]; -"1804 div_23" [id=1804, type=div]; -"1805 transpose_22" [id=1805, type=transpose]; -"1806 matmul_22" [id=1806, type=matmul]; -"1807 quantize_per_tensor_701" [id=1807, type="quantize_per_tensor"]; -"1808 dequantize_per_tensor_702" [id=1808, type="dequantize_per_tensor"]; -"1809 _frozen_param108" [id=1809, type="get_attr"]; -"1810 dequantize_per_tensor_703" [id=1810, type="dequantize_per_tensor"]; -"1811 mul_23" [id=1811, type=mul]; -"1812 quantize_per_tensor_704" [id=1812, type="quantize_per_tensor"]; -"1813 dequantize_per_tensor_705" [id=1813, type="dequantize_per_tensor"]; -"1814 add_38" [id=1814, type=add]; -"1815 quantize_per_tensor_706" [id=1815, type="quantize_per_tensor"]; -"1816 dequantize_per_tensor_707" [id=1816, type="dequantize_per_tensor"]; -"1817 softmax_11" [id=1817, type=softmax]; -"1818 dropout_44" [id=1818, type=dropout]; -"1819 matmul_23" [id=1819, type=matmul]; -"1820 transpose_23" [id=1820, type=transpose]; -"1821 reshape_51" [id=1821, type=reshape]; -"1822 reshape_51_0_0_nncf_smooth_quant_0" [id=1822, type="call_module"]; -"1823 quantize_per_tensor_708" [id=1823, type="quantize_per_tensor"]; -"1824 dequantize_per_tensor_709" [id=1824, type="dequantize_per_tensor"]; -"1825 _frozen_param109" [id=1825, type="get_attr"]; -"1826 dequantize_per_tensor_710" [id=1826, type="dequantize_per_tensor"]; -"1827 linear_72" [id=1827, type=linear]; -"1828 quantize_per_tensor_711" [id=1828, type="quantize_per_tensor"]; -"1829 dequantize_per_tensor_712" [id=1829, type="dequantize_per_tensor"]; -"1830 dropout_45" [id=1830, type=dropout]; -"1831 view_62" [id=1831, type=view]; -"1832 permute_53" [id=1832, type=permute]; -"1833 
reshape_52" [id=1833, type=reshape]; -"1834 slice_179" [id=1834, type=slice]; -"1835 slice_180" [id=1835, type=slice]; -"1836 slice_181" [id=1836, type=slice]; -"1837 slice_182" [id=1837, type=slice]; -"1838 contiguous_21" [id=1838, type=contiguous]; -"1839 layer_norm_26" [id=1839, type="layer_norm"]; -"1840 quantize_per_tensor_713" [id=1840, type="quantize_per_tensor"]; -"1841 dequantize_per_tensor_714" [id=1841, type="dequantize_per_tensor"]; -"1842 add_39" [id=1842, type=add]; -"1843 quantize_per_tensor_715" [id=1843, type="quantize_per_tensor"]; -"1844 dequantize_per_tensor_716" [id=1844, type="dequantize_per_tensor"]; -"1845 dequantize_per_tensor_717" [id=1845, type="dequantize_per_tensor"]; -"1846 add_39_0_0_nncf_smooth_quant_0" [id=1846, type="call_module"]; -"1847 quantize_per_tensor_718" [id=1847, type="quantize_per_tensor"]; -"1848 dequantize_per_tensor_719" [id=1848, type="dequantize_per_tensor"]; -"1849 _frozen_param110" [id=1849, type="get_attr"]; -"1850 dequantize_per_tensor_720" [id=1850, type="dequantize_per_tensor"]; -"1851 linear_73" [id=1851, type=linear]; -"1852 quantize_per_tensor_721" [id=1852, type="quantize_per_tensor"]; -"1853 dequantize_per_tensor_722" [id=1853, type="dequantize_per_tensor"]; -"1854 gelu_11" [id=1854, type=gelu]; -"1855 dropout_46" [id=1855, type=dropout]; -"1856 dropout_46_0_0_nncf_smooth_quant_0" [id=1856, type="call_module"]; -"1857 quantize_per_tensor_723" [id=1857, type="quantize_per_tensor"]; -"1858 dequantize_per_tensor_724" [id=1858, type="dequantize_per_tensor"]; -"1859 _frozen_param111" [id=1859, type="get_attr"]; -"1860 dequantize_per_tensor_725" [id=1860, type="dequantize_per_tensor"]; -"1861 linear_74" [id=1861, type=linear]; -"1862 quantize_per_tensor_726" [id=1862, type="quantize_per_tensor"]; -"1863 dequantize_per_tensor_727" [id=1863, type="dequantize_per_tensor"]; -"1864 dropout_47" [id=1864, type=dropout]; -"1865 layer_norm_27" [id=1865, type="layer_norm"]; -"1866 quantize_per_tensor_728" [id=1866, 
type="quantize_per_tensor"]; -"1867 dequantize_per_tensor_729" [id=1867, type="dequantize_per_tensor"]; -"1868 add_40" [id=1868, type=add]; -"1869 quantize_per_tensor_730" [id=1869, type="quantize_per_tensor"]; -"1870 dequantize_per_tensor_731" [id=1870, type="dequantize_per_tensor"]; -"1871 layer_norm_28" [id=1871, type="layer_norm"]; -"1872 permute_54" [id=1872, type=permute]; -"1873 quantize_per_tensor_732" [id=1873, type="quantize_per_tensor"]; -"1874 dequantize_per_tensor_733" [id=1874, type="dequantize_per_tensor"]; -"1875 adaptive_avg_pool2d" [id=1875, type="adaptive_avg_pool2d"]; -"1876 quantize_per_tensor_734" [id=1876, type="quantize_per_tensor"]; -"1877 dequantize_per_tensor_735" [id=1877, type="dequantize_per_tensor"]; -"1878 flatten" [id=1878, type=flatten]; -"1879 quantize_per_tensor_736" [id=1879, type="quantize_per_tensor"]; -"1880 dequantize_per_tensor_737" [id=1880, type="dequantize_per_tensor"]; -"1881 flatten_0_0_nncf_smooth_quant_0" [id=1881, type="call_module"]; -"1882 quantize_per_tensor_738" [id=1882, type="quantize_per_tensor"]; -"1883 dequantize_per_tensor_739" [id=1883, type="dequantize_per_tensor"]; -"1884 _frozen_param112" [id=1884, type="get_attr"]; -"1885 dequantize_per_tensor_740" [id=1885, type="dequantize_per_tensor"]; -"1886 linear_75" [id=1886, type=linear]; -"1887 quantize_per_tensor_741" [id=1887, type="quantize_per_tensor"]; -"1888 dequantize_per_tensor_742" [id=1888, type="dequantize_per_tensor"]; -"1889 output" [id=1889, type=output]; -"0 features_1_0_attn_qkv_bias" -> "180 clone" [style=solid, label="(288,)"]; -"1 features_1_0_attn_proj_bias" -> "224 linear_3" [style=solid, label="(96,)"]; -"2 features_1_1_attn_qkv_bias" -> "305 clone_1" [style=solid, label="(288,)"]; -"3 features_1_1_attn_proj_bias" -> "373 linear_9" [style=solid, label="(96,)"]; -"4 features_3_0_attn_qkv_bias" -> "484 clone_2" [style=solid, label="(576,)"]; -"5 features_3_0_attn_proj_bias" -> "528 linear_16" [style=solid, label="(192,)"]; -"6 
features_3_1_attn_qkv_bias" -> "612 clone_3" [style=solid, label="(576,)"]; -"7 features_3_1_attn_proj_bias" -> "680 linear_22" [style=solid, label="(192,)"]; -"8 features_5_0_attn_qkv_bias" -> "794 clone_4" [style=solid, label="(1152,)"]; -"9 features_5_0_attn_proj_bias" -> "838 linear_29" [style=solid, label="(384,)"]; -"10 features_5_1_attn_qkv_bias" -> "922 clone_5" [style=solid, label="(1152,)"]; -"11 features_5_1_attn_proj_bias" -> "990 linear_35" [style=solid, label="(384,)"]; -"12 features_5_2_attn_qkv_bias" -> "1072 clone_6" [style=solid, label="(1152,)"]; -"13 features_5_2_attn_proj_bias" -> "1116 linear_41" [style=solid, label="(384,)"]; -"14 features_5_3_attn_qkv_bias" -> "1198 clone_7" [style=solid, label="(1152,)"]; -"15 features_5_3_attn_proj_bias" -> "1266 linear_47" [style=solid, label="(384,)"]; -"16 features_5_4_attn_qkv_bias" -> "1348 clone_8" [style=solid, label="(1152,)"]; -"17 features_5_4_attn_proj_bias" -> "1392 linear_53" [style=solid, label="(384,)"]; -"18 features_5_5_attn_qkv_bias" -> "1474 clone_9" [style=solid, label="(1152,)"]; -"19 features_5_5_attn_proj_bias" -> "1542 linear_59" [style=solid, label="(384,)"]; -"20 features_7_0_attn_qkv_bias" -> "1656 clone_10" [style=solid, label="(2304,)"]; -"21 features_7_0_attn_proj_bias" -> "1700 linear_66" [style=solid, label="(768,)"]; -"22 features_7_1_attn_qkv_bias" -> "1783 clone_11" [style=solid, label="(2304,)"]; -"23 features_7_1_attn_proj_bias" -> "1827 linear_72" [style=solid, label="(768,)"]; -"24 features_0_0_bias" -> "137 conv2d" [style=solid, label="(96,)"]; -"25 features_0_2_weight" -> "143 layer_norm" [style=solid, label="(96,)"]; -"26 features_0_2_bias" -> "143 layer_norm" [style=solid, label="(96,)"]; -"27 features_1_0_attn_cpb_mlp_0_bias" -> "148 linear" [style=solid, label="(512,)"]; -"28 features_1_0_norm1_weight" -> "233 layer_norm_1" [style=solid, label="(96,)"]; -"29 features_1_0_norm1_bias" -> "233 layer_norm_1" [style=solid, label="(96,)"]; -"30 
features_1_0_mlp_0_bias" -> "247 linear_4" [style=solid, label="(384,)"]; -"31 features_1_0_mlp_3_bias" -> "257 linear_5" [style=solid, label="(96,)"]; -"32 features_1_0_norm2_weight" -> "261 layer_norm_2" [style=solid, label="(96,)"]; -"33 features_1_0_norm2_bias" -> "261 layer_norm_2" [style=solid, label="(96,)"]; -"34 features_1_1_attn_cpb_mlp_0_bias" -> "272 linear_6" [style=solid, label="(512,)"]; -"35 features_1_1_norm1_weight" -> "383 layer_norm_3" [style=solid, label="(96,)"]; -"36 features_1_1_norm1_bias" -> "383 layer_norm_3" [style=solid, label="(96,)"]; -"37 features_1_1_mlp_0_bias" -> "395 linear_10" [style=solid, label="(384,)"]; -"38 features_1_1_mlp_3_bias" -> "405 linear_11" [style=solid, label="(96,)"]; -"39 features_1_1_norm2_weight" -> "409 layer_norm_4" [style=solid, label="(96,)"]; -"40 features_1_1_norm2_bias" -> "409 layer_norm_4" [style=solid, label="(96,)"]; -"41 features_2_norm_weight" -> "447 layer_norm_5" [style=solid, label="(192,)"]; -"42 features_2_norm_bias" -> "447 layer_norm_5" [style=solid, label="(192,)"]; -"43 features_3_0_attn_cpb_mlp_0_bias" -> "452 linear_13" [style=solid, label="(512,)"]; -"44 features_3_0_norm1_weight" -> "540 layer_norm_6" [style=solid, label="(192,)"]; -"45 features_3_0_norm1_bias" -> "540 layer_norm_6" [style=solid, label="(192,)"]; -"46 features_3_0_mlp_0_bias" -> "554 linear_17" [style=solid, label="(768,)"]; -"47 features_3_0_mlp_3_bias" -> "564 linear_18" [style=solid, label="(192,)"]; -"48 features_3_0_norm2_weight" -> "568 layer_norm_7" [style=solid, label="(192,)"]; -"49 features_3_0_norm2_bias" -> "568 layer_norm_7" [style=solid, label="(192,)"]; -"50 features_3_1_attn_cpb_mlp_0_bias" -> "579 linear_19" [style=solid, label="(512,)"]; -"51 features_3_1_norm1_weight" -> "693 layer_norm_8" [style=solid, label="(192,)"]; -"52 features_3_1_norm1_bias" -> "693 layer_norm_8" [style=solid, label="(192,)"]; -"53 features_3_1_mlp_0_bias" -> "705 linear_23" [style=solid, label="(768,)"]; -"54 
features_3_1_mlp_3_bias" -> "715 linear_24" [style=solid, label="(192,)"]; -"55 features_3_1_norm2_weight" -> "719 layer_norm_9" [style=solid, label="(192,)"]; -"56 features_3_1_norm2_bias" -> "719 layer_norm_9" [style=solid, label="(192,)"]; -"57 features_4_norm_weight" -> "757 layer_norm_10" [style=solid, label="(384,)"]; -"58 features_4_norm_bias" -> "757 layer_norm_10" [style=solid, label="(384,)"]; -"59 features_5_0_attn_cpb_mlp_0_bias" -> "762 linear_26" [style=solid, label="(512,)"]; -"60 features_5_0_norm1_weight" -> "850 layer_norm_11" [style=solid, label="(384,)"]; -"61 features_5_0_norm1_bias" -> "850 layer_norm_11" [style=solid, label="(384,)"]; -"62 features_5_0_mlp_0_bias" -> "864 linear_30" [style=solid, label="(1536,)"]; -"63 features_5_0_mlp_3_bias" -> "874 linear_31" [style=solid, label="(384,)"]; -"64 features_5_0_norm2_weight" -> "878 layer_norm_12" [style=solid, label="(384,)"]; -"65 features_5_0_norm2_bias" -> "878 layer_norm_12" [style=solid, label="(384,)"]; -"66 features_5_1_attn_cpb_mlp_0_bias" -> "889 linear_32" [style=solid, label="(512,)"]; -"67 features_5_1_norm1_weight" -> "1003 layer_norm_13" [style=solid, label="(384,)"]; -"68 features_5_1_norm1_bias" -> "1003 layer_norm_13" [style=solid, label="(384,)"]; -"69 features_5_1_mlp_0_bias" -> "1015 linear_36" [style=solid, label="(1536,)"]; -"70 features_5_1_mlp_3_bias" -> "1025 linear_37" [style=solid, label="(384,)"]; -"71 features_5_1_norm2_weight" -> "1029 layer_norm_14" [style=solid, label="(384,)"]; -"72 features_5_1_norm2_bias" -> "1029 layer_norm_14" [style=solid, label="(384,)"]; -"73 features_5_2_attn_cpb_mlp_0_bias" -> "1040 linear_38" [style=solid, label="(512,)"]; -"74 features_5_2_norm1_weight" -> "1128 layer_norm_15" [style=solid, label="(384,)"]; -"75 features_5_2_norm1_bias" -> "1128 layer_norm_15" [style=solid, label="(384,)"]; -"76 features_5_2_mlp_0_bias" -> "1140 linear_42" [style=solid, label="(1536,)"]; -"77 features_5_2_mlp_3_bias" -> "1150 linear_43" 
[style=solid, label="(384,)"]; -"78 features_5_2_norm2_weight" -> "1154 layer_norm_16" [style=solid, label="(384,)"]; -"79 features_5_2_norm2_bias" -> "1154 layer_norm_16" [style=solid, label="(384,)"]; -"80 features_5_3_attn_cpb_mlp_0_bias" -> "1165 linear_44" [style=solid, label="(512,)"]; -"81 features_5_3_norm1_weight" -> "1279 layer_norm_17" [style=solid, label="(384,)"]; -"82 features_5_3_norm1_bias" -> "1279 layer_norm_17" [style=solid, label="(384,)"]; -"83 features_5_3_mlp_0_bias" -> "1291 linear_48" [style=solid, label="(1536,)"]; -"84 features_5_3_mlp_3_bias" -> "1301 linear_49" [style=solid, label="(384,)"]; -"85 features_5_3_norm2_weight" -> "1305 layer_norm_18" [style=solid, label="(384,)"]; -"86 features_5_3_norm2_bias" -> "1305 layer_norm_18" [style=solid, label="(384,)"]; -"87 features_5_4_attn_cpb_mlp_0_bias" -> "1316 linear_50" [style=solid, label="(512,)"]; -"88 features_5_4_norm1_weight" -> "1404 layer_norm_19" [style=solid, label="(384,)"]; -"89 features_5_4_norm1_bias" -> "1404 layer_norm_19" [style=solid, label="(384,)"]; -"90 features_5_4_mlp_0_bias" -> "1416 linear_54" [style=solid, label="(1536,)"]; -"91 features_5_4_mlp_3_bias" -> "1426 linear_55" [style=solid, label="(384,)"]; -"92 features_5_4_norm2_weight" -> "1430 layer_norm_20" [style=solid, label="(384,)"]; -"93 features_5_4_norm2_bias" -> "1430 layer_norm_20" [style=solid, label="(384,)"]; -"94 features_5_5_attn_cpb_mlp_0_bias" -> "1441 linear_56" [style=solid, label="(512,)"]; -"95 features_5_5_norm1_weight" -> "1555 layer_norm_21" [style=solid, label="(384,)"]; -"96 features_5_5_norm1_bias" -> "1555 layer_norm_21" [style=solid, label="(384,)"]; -"97 features_5_5_mlp_0_bias" -> "1567 linear_60" [style=solid, label="(1536,)"]; -"98 features_5_5_mlp_3_bias" -> "1577 linear_61" [style=solid, label="(384,)"]; -"99 features_5_5_norm2_weight" -> "1581 layer_norm_22" [style=solid, label="(384,)"]; -"100 features_5_5_norm2_bias" -> "1581 layer_norm_22" [style=solid, label="(384,)"]; 
-"101 features_6_norm_weight" -> "1619 layer_norm_23" [style=solid, label="(768,)"]; -"102 features_6_norm_bias" -> "1619 layer_norm_23" [style=solid, label="(768,)"]; -"103 features_7_0_attn_cpb_mlp_0_bias" -> "1624 linear_63" [style=solid, label="(512,)"]; -"104 features_7_0_norm1_weight" -> "1712 layer_norm_24" [style=solid, label="(768,)"]; -"105 features_7_0_norm1_bias" -> "1712 layer_norm_24" [style=solid, label="(768,)"]; -"106 features_7_0_mlp_0_bias" -> "1726 linear_67" [style=solid, label="(3072,)"]; -"107 features_7_0_mlp_3_bias" -> "1736 linear_68" [style=solid, label="(768,)"]; -"108 features_7_0_norm2_weight" -> "1740 layer_norm_25" [style=solid, label="(768,)"]; -"109 features_7_0_norm2_bias" -> "1740 layer_norm_25" [style=solid, label="(768,)"]; -"110 features_7_1_attn_cpb_mlp_0_bias" -> "1751 linear_69" [style=solid, label="(512,)"]; -"111 features_7_1_norm1_weight" -> "1839 layer_norm_26" [style=solid, label="(768,)"]; -"112 features_7_1_norm1_bias" -> "1839 layer_norm_26" [style=solid, label="(768,)"]; -"113 features_7_1_mlp_0_bias" -> "1851 linear_73" [style=solid, label="(3072,)"]; -"114 features_7_1_mlp_3_bias" -> "1861 linear_74" [style=solid, label="(768,)"]; -"115 features_7_1_norm2_weight" -> "1865 layer_norm_27" [style=solid, label="(768,)"]; -"116 features_7_1_norm2_bias" -> "1865 layer_norm_27" [style=solid, label="(768,)"]; -"117 norm_weight" -> "1871 layer_norm_28" [style=solid, label="(768,)"]; -"118 norm_bias" -> "1871 layer_norm_28" [style=solid, label="(768,)"]; -"119 head_bias" -> "1886 linear_75" [style=solid, label="(1000,)"]; -"120 features_1_0_attn_relative_position_index" -> "163 index" [style=solid, label="(4096,)"]; -"121 features_1_1_attn_relative_position_index" -> "287 index_1" [style=solid, label="(4096,)"]; -"122 features_3_0_attn_relative_position_index" -> "467 index_2" [style=solid, label="(4096,)"]; -"123 features_3_1_attn_relative_position_index" -> "594 index_3" [style=solid, label="(4096,)"]; -"124 
features_5_0_attn_relative_position_index" -> "777 index_4" [style=solid, label="(4096,)"]; -"125 features_5_1_attn_relative_position_index" -> "904 index_5" [style=solid, label="(4096,)"]; -"126 features_5_2_attn_relative_position_index" -> "1055 index_6" [style=solid, label="(4096,)"]; -"127 features_5_3_attn_relative_position_index" -> "1180 index_7" [style=solid, label="(4096,)"]; -"128 features_5_4_attn_relative_position_index" -> "1331 index_8" [style=solid, label="(4096,)"]; -"129 features_5_5_attn_relative_position_index" -> "1456 index_9" [style=solid, label="(4096,)"]; -"130 features_7_0_attn_relative_position_index" -> "1639 index_10" [style=solid, label="(4096,)"]; -"131 features_7_1_attn_relative_position_index" -> "1766 index_11" [style=solid, label="(4096,)"]; -"132 x" -> "133 quantize_per_tensor_0" [style=solid, label="(1, 3, 224, 224)"]; -"133 quantize_per_tensor_0" -> "134 dequantize_per_tensor_1" [style=solid, label="(1, 3, 224, 224)"]; -"134 dequantize_per_tensor_1" -> "137 conv2d" [style=solid, label="(1, 3, 224, 224)"]; -"135 _frozen_param0" -> "136 dequantize_per_tensor_2" [style=solid, label="(96, 3, 4, 4)"]; -"136 dequantize_per_tensor_2" -> "137 conv2d" [style=solid, label="(96, 3, 4, 4)"]; -"137 conv2d" -> "138 quantize_per_tensor_3" [style=solid, label="(1, 96, 56, 56)"]; -"138 quantize_per_tensor_3" -> "139 dequantize_per_tensor_4" [style=solid, label="(1, 96, 56, 56)"]; -"139 dequantize_per_tensor_4" -> "140 permute" [style=solid, label="(1, 96, 56, 56)"]; -"140 permute" -> "141 quantize_per_tensor_5" [style=solid, label="(1, 56, 56, 96)"]; -"141 quantize_per_tensor_5" -> "142 dequantize_per_tensor_6" [style=solid, label="(1, 56, 56, 96)"]; -"142 dequantize_per_tensor_6" -> "143 layer_norm" [style=solid, label="(1, 56, 56, 96)"]; -"143 layer_norm" -> "176 pad" [style=solid, label="(1, 56, 56, 96)"]; -"143 layer_norm" -> "236 quantize_per_tensor_42" [style=solid, label="(1, 56, 56, 96)"]; -"144 _frozen_param1" -> "145 
dequantize_per_tensor_7" [style=solid, label="(1, 15, 15, 2)"]; -"145 dequantize_per_tensor_7" -> "148 linear" [style=solid, label="(1, 15, 15, 2)"]; -"146 _frozen_param2" -> "147 dequantize_per_tensor_8" [style=solid, label="(512, 2)"]; -"147 dequantize_per_tensor_8" -> "148 linear" [style=solid, label="(512, 2)"]; -"148 linear" -> "149 relu_" [style=solid, label="(1, 15, 15, 512)"]; -"149 relu_" -> "150 quantize_per_tensor_9" [style=solid, label="(1, 15, 15, 512)"]; -"150 quantize_per_tensor_9" -> "151 dequantize_per_tensor_10" [style=solid, label="(1, 15, 15, 512)"]; -"151 dequantize_per_tensor_10" -> "152 relu__0_0_nncf_smooth_quant_0" [style=solid, label="(1, 15, 15, 512)"]; -"152 relu__0_0_nncf_smooth_quant_0" -> "153 quantize_per_tensor_11" [style=solid, label="(1, 15, 15, 512)"]; -"153 quantize_per_tensor_11" -> "154 dequantize_per_tensor_12" [style=solid, label="(1, 15, 15, 512)"]; -"154 dequantize_per_tensor_12" -> "157 linear_1" [style=solid, label="(1, 15, 15, 512)"]; -"155 _frozen_param3" -> "156 dequantize_per_tensor_13" [style=solid, label="(3, 512)"]; -"156 dequantize_per_tensor_13" -> "157 linear_1" [style=solid, label="(3, 512)"]; -"157 linear_1" -> "158 quantize_per_tensor_14" [style=solid, label="(1, 15, 15, 3)"]; -"158 quantize_per_tensor_14" -> "159 dequantize_per_tensor_15" [style=solid, label="(1, 15, 15, 3)"]; -"159 dequantize_per_tensor_15" -> "160 view" [style=solid, label="(1, 15, 15, 3)"]; -"160 view" -> "161 quantize_per_tensor_16" [style=solid, label="(225, 3)"]; -"161 quantize_per_tensor_16" -> "162 dequantize_per_tensor_17" [style=solid, label="(225, 3)"]; -"162 dequantize_per_tensor_17" -> "163 index" [style=solid, label="(225, 3)"]; -"163 index" -> "164 view_1" [style=solid, label="(4096, 3)"]; -"164 view_1" -> "165 permute_1" [style=solid, label="(64, 64, 3)"]; -"165 permute_1" -> "166 contiguous" [style=solid, label="(3, 64, 64)"]; -"166 contiguous" -> "167 unsqueeze" [style=solid, label="(3, 64, 64)"]; -"167 unsqueeze" -> "168 
sigmoid" [style=solid, label="(1, 3, 64, 64)"]; -"168 sigmoid" -> "169 quantize_per_tensor_18" [style=solid, label="(1, 3, 64, 64)"]; -"169 quantize_per_tensor_18" -> "170 dequantize_per_tensor_19" [style=solid, label="(1, 3, 64, 64)"]; -"170 dequantize_per_tensor_19" -> "173 mul" [style=solid, label="(1, 3, 64, 64)"]; -"171 _frozen_param4" -> "172 dequantize_per_tensor_20" [style=solid, label="()"]; -"172 dequantize_per_tensor_20" -> "173 mul" [style=solid, label="()"]; -"173 mul" -> "174 quantize_per_tensor_21" [style=solid, label="(1, 3, 64, 64)"]; -"174 quantize_per_tensor_21" -> "175 dequantize_per_tensor_22" [style=solid, label="(1, 3, 64, 64)"]; -"175 dequantize_per_tensor_22" -> "211 add" [style=solid, label="(1, 3, 64, 64)"]; -"176 pad" -> "177 view_2" [style=solid, label="(1, 56, 56, 96)"]; -"177 view_2" -> "178 permute_2" [style=solid, label="(1, 7, 8, 7, 8, 96)"]; -"178 permute_2" -> "179 reshape" [style=solid, label="(1, 7, 7, 8, 8, 96)"]; -"179 reshape" -> "181 reshape_0_0_nncf_smooth_quant_0" [style=solid, label="(49, 64, 96)"]; -"180 clone" -> "186 linear_2" [style=solid, label="(288,)"]; -"181 reshape_0_0_nncf_smooth_quant_0" -> "182 quantize_per_tensor_23" [style=solid, label="(49, 64, 96)"]; -"182 quantize_per_tensor_23" -> "183 dequantize_per_tensor_24" [style=solid, label="(49, 64, 96)"]; -"183 dequantize_per_tensor_24" -> "186 linear_2" [style=solid, label="(49, 64, 96)"]; -"184 _frozen_param5" -> "185 dequantize_per_tensor_25" [style=solid, label="(288, 96)"]; -"185 dequantize_per_tensor_25" -> "186 linear_2" [style=solid, label="(288, 96)"]; -"186 linear_2" -> "187 quantize_per_tensor_26" [style=solid, label="(49, 64, 288)"]; -"187 quantize_per_tensor_26" -> "188 dequantize_per_tensor_27" [style=solid, label="(49, 64, 288)"]; -"188 dequantize_per_tensor_27" -> "189 reshape_1" [style=solid, label="(49, 64, 288)"]; -"189 reshape_1" -> "190 permute_3" [style=solid, label="(49, 64, 3, 3, 32)"]; -"190 permute_3" -> "191 select" [style=solid, 
label="(3, 49, 3, 64, 32)"]; -"190 permute_3" -> "192 select_1" [style=solid, label="(3, 49, 3, 64, 32)"]; -"190 permute_3" -> "193 select_2" [style=solid, label="(3, 49, 3, 64, 32)"]; -"191 select" -> "194 linalg_vector_norm" [style=solid, label="(49, 3, 64, 32)"]; -"191 select" -> "196 expand_as" [style=solid, label="(49, 3, 64, 32)"]; -"191 select" -> "197 div" [style=solid, label="(49, 3, 64, 32)"]; -"192 select_1" -> "198 linalg_vector_norm_1" [style=solid, label="(49, 3, 64, 32)"]; -"192 select_1" -> "200 expand_as_1" [style=solid, label="(49, 3, 64, 32)"]; -"192 select_1" -> "201 div_1" [style=solid, label="(49, 3, 64, 32)"]; -"193 select_2" -> "216 matmul_1" [style=solid, label="(49, 3, 64, 32)"]; -"194 linalg_vector_norm" -> "195 clamp_min" [style=solid, label="(49, 3, 64, 1)"]; -"195 clamp_min" -> "196 expand_as" [style=solid, label="(49, 3, 64, 1)"]; -"196 expand_as" -> "197 div" [style=solid, label="(49, 3, 64, 32)"]; -"197 div" -> "203 matmul" [style=solid, label="(49, 3, 64, 32)"]; -"198 linalg_vector_norm_1" -> "199 clamp_min_1" [style=solid, label="(49, 3, 64, 1)"]; -"199 clamp_min_1" -> "200 expand_as_1" [style=solid, label="(49, 3, 64, 1)"]; -"200 expand_as_1" -> "201 div_1" [style=solid, label="(49, 3, 64, 32)"]; -"201 div_1" -> "202 transpose" [style=solid, label="(49, 3, 64, 32)"]; -"202 transpose" -> "203 matmul" [style=solid, label="(49, 3, 32, 64)"]; -"203 matmul" -> "204 quantize_per_tensor_28" [style=solid, label="(49, 3, 64, 64)"]; -"204 quantize_per_tensor_28" -> "205 dequantize_per_tensor_29" [style=solid, label="(49, 3, 64, 64)"]; -"205 dequantize_per_tensor_29" -> "208 mul_1" [style=solid, label="(49, 3, 64, 64)"]; -"206 _frozen_param6" -> "207 dequantize_per_tensor_30" [style=solid, label="(3, 1, 1)"]; -"207 dequantize_per_tensor_30" -> "208 mul_1" [style=solid, label="(3, 1, 1)"]; -"208 mul_1" -> "209 quantize_per_tensor_31" [style=solid, label="(49, 3, 64, 64)"]; -"209 quantize_per_tensor_31" -> "210 dequantize_per_tensor_32" 
[style=solid, label="(49, 3, 64, 64)"]; -"210 dequantize_per_tensor_32" -> "211 add" [style=solid, label="(49, 3, 64, 64)"]; -"211 add" -> "212 quantize_per_tensor_33" [style=solid, label="(49, 3, 64, 64)"]; -"212 quantize_per_tensor_33" -> "213 dequantize_per_tensor_34" [style=solid, label="(49, 3, 64, 64)"]; -"213 dequantize_per_tensor_34" -> "214 softmax" [style=solid, label="(49, 3, 64, 64)"]; -"214 softmax" -> "215 dropout" [style=solid, label="(49, 3, 64, 64)"]; -"215 dropout" -> "216 matmul_1" [style=solid, label="(49, 3, 64, 64)"]; -"216 matmul_1" -> "217 transpose_1" [style=solid, label="(49, 3, 64, 32)"]; -"217 transpose_1" -> "218 reshape_2" [style=solid, label="(49, 64, 3, 32)"]; -"218 reshape_2" -> "219 reshape_2_0_0_nncf_smooth_quant_0" [style=solid, label="(49, 64, 96)"]; -"219 reshape_2_0_0_nncf_smooth_quant_0" -> "220 quantize_per_tensor_35" [style=solid, label="(49, 64, 96)"]; -"220 quantize_per_tensor_35" -> "221 dequantize_per_tensor_36" [style=solid, label="(49, 64, 96)"]; -"221 dequantize_per_tensor_36" -> "224 linear_3" [style=solid, label="(49, 64, 96)"]; -"222 _frozen_param7" -> "223 dequantize_per_tensor_37" [style=solid, label="(96, 96)"]; -"223 dequantize_per_tensor_37" -> "224 linear_3" [style=solid, label="(96, 96)"]; -"224 linear_3" -> "225 quantize_per_tensor_38" [style=solid, label="(49, 64, 96)"]; -"225 quantize_per_tensor_38" -> "226 dequantize_per_tensor_39" [style=solid, label="(49, 64, 96)"]; -"226 dequantize_per_tensor_39" -> "227 dropout_1" [style=solid, label="(49, 64, 96)"]; -"227 dropout_1" -> "228 view_3" [style=solid, label="(49, 64, 96)"]; -"228 view_3" -> "229 permute_4" [style=solid, label="(1, 7, 7, 8, 8, 96)"]; -"229 permute_4" -> "230 reshape_3" [style=solid, label="(1, 7, 8, 7, 8, 96)"]; -"230 reshape_3" -> "231 slice_2" [style=solid, label="(1, 56, 56, 96)"]; -"231 slice_2" -> "232 slice_3" [style=solid, label="(1, 56, 56, 96)"]; -"232 slice_3" -> "233 layer_norm_1" [style=solid, label="(1, 56, 56, 96)"]; -"233 
layer_norm_1" -> "234 quantize_per_tensor_40" [style=solid, label="(1, 56, 56, 96)"]; -"234 quantize_per_tensor_40" -> "235 dequantize_per_tensor_41" [style=solid, label="(1, 56, 56, 96)"]; -"235 dequantize_per_tensor_41" -> "238 add_1" [style=solid, label="(1, 56, 56, 96)"]; -"236 quantize_per_tensor_42" -> "237 dequantize_per_tensor_43" [style=solid, label="(1, 56, 56, 96)"]; -"237 dequantize_per_tensor_43" -> "238 add_1" [style=solid, label="(1, 56, 56, 96)"]; -"238 add_1" -> "239 quantize_per_tensor_44" [style=solid, label="(1, 56, 56, 96)"]; -"239 quantize_per_tensor_44" -> "240 dequantize_per_tensor_45" [style=solid, label="(1, 56, 56, 96)"]; -"239 quantize_per_tensor_44" -> "241 dequantize_per_tensor_46" [style=solid, label="(1, 56, 56, 96)"]; -"240 dequantize_per_tensor_45" -> "264 add_2" [style=solid, label="(1, 56, 56, 96)"]; -"241 dequantize_per_tensor_46" -> "242 add_1_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 56, 56, 96)"]; -"242 add_1_0_0_nncf_smooth_quant_0" -> "243 quantize_per_tensor_47" [style=solid, label="(1, 56, 56, 96)"]; -"243 quantize_per_tensor_47" -> "244 dequantize_per_tensor_48" [style=solid, label="(1, 56, 56, 96)"]; -"244 dequantize_per_tensor_48" -> "247 linear_4" [style=solid, label="(1, 56, 56, 96)"]; -"245 _frozen_param8" -> "246 dequantize_per_tensor_49" [style=solid, label="(384, 96)"]; -"246 dequantize_per_tensor_49" -> "247 linear_4" [style=solid, label="(384, 96)"]; -"247 linear_4" -> "248 quantize_per_tensor_50" [style=solid, label="(1, 56, 56, 384)"]; -"248 quantize_per_tensor_50" -> "249 dequantize_per_tensor_51" [style=solid, label="(1, 56, 56, 384)"]; -"249 dequantize_per_tensor_51" -> "250 gelu" [style=solid, label="(1, 56, 56, 384)"]; -"250 gelu" -> "251 dropout_2" [style=solid, label="(1, 56, 56, 384)"]; -"251 dropout_2" -> "252 dropout_2_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 56, 56, 384)"]; -"252 dropout_2_0_0_nncf_smooth_quant_0" -> "253 quantize_per_tensor_52" [style=solid, label="(1, 56, 56, 
384)"]; -"253 quantize_per_tensor_52" -> "254 dequantize_per_tensor_53" [style=solid, label="(1, 56, 56, 384)"]; -"254 dequantize_per_tensor_53" -> "257 linear_5" [style=solid, label="(1, 56, 56, 384)"]; -"255 _frozen_param9" -> "256 dequantize_per_tensor_54" [style=solid, label="(96, 384)"]; -"256 dequantize_per_tensor_54" -> "257 linear_5" [style=solid, label="(96, 384)"]; -"257 linear_5" -> "258 quantize_per_tensor_55" [style=solid, label="(1, 56, 56, 96)"]; -"258 quantize_per_tensor_55" -> "259 dequantize_per_tensor_56" [style=solid, label="(1, 56, 56, 96)"]; -"259 dequantize_per_tensor_56" -> "260 dropout_3" [style=solid, label="(1, 56, 56, 96)"]; -"260 dropout_3" -> "261 layer_norm_2" [style=solid, label="(1, 56, 56, 96)"]; -"261 layer_norm_2" -> "262 quantize_per_tensor_57" [style=solid, label="(1, 56, 56, 96)"]; -"262 quantize_per_tensor_57" -> "263 dequantize_per_tensor_58" [style=solid, label="(1, 56, 56, 96)"]; -"263 dequantize_per_tensor_58" -> "264 add_2" [style=solid, label="(1, 56, 56, 96)"]; -"264 add_2" -> "265 quantize_per_tensor_59" [style=solid, label="(1, 56, 56, 96)"]; -"265 quantize_per_tensor_59" -> "266 dequantize_per_tensor_60" [style=solid, label="(1, 56, 56, 96)"]; -"265 quantize_per_tensor_59" -> "267 dequantize_per_tensor_61" [style=solid, label="(1, 56, 56, 96)"]; -"266 dequantize_per_tensor_60" -> "386 add_5" [style=solid, label="(1, 56, 56, 96)"]; -"267 dequantize_per_tensor_61" -> "300 pad_1" [style=solid, label="(1, 56, 56, 96)"]; -"268 _frozen_param10" -> "269 dequantize_per_tensor_62" [style=solid, label="(1, 15, 15, 2)"]; -"269 dequantize_per_tensor_62" -> "272 linear_6" [style=solid, label="(1, 15, 15, 2)"]; -"270 _frozen_param11" -> "271 dequantize_per_tensor_63" [style=solid, label="(512, 2)"]; -"271 dequantize_per_tensor_63" -> "272 linear_6" [style=solid, label="(512, 2)"]; -"272 linear_6" -> "273 relu__1" [style=solid, label="(1, 15, 15, 512)"]; -"273 relu__1" -> "274 quantize_per_tensor_64" [style=solid, label="(1, 15, 
15, 512)"]; -"274 quantize_per_tensor_64" -> "275 dequantize_per_tensor_65" [style=solid, label="(1, 15, 15, 512)"]; -"275 dequantize_per_tensor_65" -> "276 relu__1_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 15, 15, 512)"]; -"276 relu__1_0_0_nncf_smooth_quant_0" -> "277 quantize_per_tensor_66" [style=solid, label="(1, 15, 15, 512)"]; -"277 quantize_per_tensor_66" -> "278 dequantize_per_tensor_67" [style=solid, label="(1, 15, 15, 512)"]; -"278 dequantize_per_tensor_67" -> "281 linear_7" [style=solid, label="(1, 15, 15, 512)"]; -"279 _frozen_param12" -> "280 dequantize_per_tensor_68" [style=solid, label="(3, 512)"]; -"280 dequantize_per_tensor_68" -> "281 linear_7" [style=solid, label="(3, 512)"]; -"281 linear_7" -> "282 quantize_per_tensor_69" [style=solid, label="(1, 15, 15, 3)"]; -"282 quantize_per_tensor_69" -> "283 dequantize_per_tensor_70" [style=solid, label="(1, 15, 15, 3)"]; -"283 dequantize_per_tensor_70" -> "284 view_4" [style=solid, label="(1, 15, 15, 3)"]; -"284 view_4" -> "285 quantize_per_tensor_71" [style=solid, label="(225, 3)"]; -"285 quantize_per_tensor_71" -> "286 dequantize_per_tensor_72" [style=solid, label="(225, 3)"]; -"286 dequantize_per_tensor_72" -> "287 index_1" [style=solid, label="(225, 3)"]; -"287 index_1" -> "288 view_5" [style=solid, label="(4096, 3)"]; -"288 view_5" -> "289 permute_5" [style=solid, label="(64, 64, 3)"]; -"289 permute_5" -> "290 contiguous_1" [style=solid, label="(3, 64, 64)"]; -"290 contiguous_1" -> "291 unsqueeze_1" [style=solid, label="(3, 64, 64)"]; -"291 unsqueeze_1" -> "292 sigmoid_1" [style=solid, label="(1, 3, 64, 64)"]; -"292 sigmoid_1" -> "293 quantize_per_tensor_73" [style=solid, label="(1, 3, 64, 64)"]; -"293 quantize_per_tensor_73" -> "294 dequantize_per_tensor_74" [style=solid, label="(1, 3, 64, 64)"]; -"294 dequantize_per_tensor_74" -> "297 mul_2" [style=solid, label="(1, 3, 64, 64)"]; -"295 _frozen_param13" -> "296 dequantize_per_tensor_75" [style=solid, label="()"]; -"296 
dequantize_per_tensor_75" -> "297 mul_2" [style=solid, label="()"]; -"297 mul_2" -> "298 quantize_per_tensor_76" [style=solid, label="(1, 3, 64, 64)"]; -"298 quantize_per_tensor_76" -> "299 dequantize_per_tensor_77" [style=solid, label="(1, 3, 64, 64)"]; -"299 dequantize_per_tensor_77" -> "336 add_3" [style=solid, label="(1, 3, 64, 64)"]; -"300 pad_1" -> "301 roll" [style=solid, label="(1, 56, 56, 96)"]; -"301 roll" -> "302 view_6" [style=solid, label="(1, 56, 56, 96)"]; -"302 view_6" -> "303 permute_6" [style=solid, label="(1, 7, 8, 7, 8, 96)"]; -"303 permute_6" -> "304 reshape_4" [style=solid, label="(1, 7, 7, 8, 8, 96)"]; -"304 reshape_4" -> "306 reshape_4_0_0_nncf_smooth_quant_0" [style=solid, label="(49, 64, 96)"]; -"304 reshape_4" -> "339 new_zeros" [style=solid, label="(49, 64, 96)"]; -"305 clone_1" -> "311 linear_8" [style=solid, label="(288,)"]; -"306 reshape_4_0_0_nncf_smooth_quant_0" -> "307 quantize_per_tensor_78" [style=solid, label="(49, 64, 96)"]; -"307 quantize_per_tensor_78" -> "308 dequantize_per_tensor_79" [style=solid, label="(49, 64, 96)"]; -"308 dequantize_per_tensor_79" -> "311 linear_8" [style=solid, label="(49, 64, 96)"]; -"309 _frozen_param14" -> "310 dequantize_per_tensor_80" [style=solid, label="(288, 96)"]; -"310 dequantize_per_tensor_80" -> "311 linear_8" [style=solid, label="(288, 96)"]; -"311 linear_8" -> "312 quantize_per_tensor_81" [style=solid, label="(49, 64, 288)"]; -"312 quantize_per_tensor_81" -> "313 dequantize_per_tensor_82" [style=solid, label="(49, 64, 288)"]; -"313 dequantize_per_tensor_82" -> "314 reshape_5" [style=solid, label="(49, 64, 288)"]; -"314 reshape_5" -> "315 permute_7" [style=solid, label="(49, 64, 3, 3, 32)"]; -"315 permute_7" -> "316 select_3" [style=solid, label="(3, 49, 3, 64, 32)"]; -"315 permute_7" -> "317 select_4" [style=solid, label="(3, 49, 3, 64, 32)"]; -"315 permute_7" -> "318 select_5" [style=solid, label="(3, 49, 3, 64, 32)"]; -"316 select_3" -> "319 linalg_vector_norm_2" [style=solid, 
label="(49, 3, 64, 32)"]; -"316 select_3" -> "321 expand_as_2" [style=solid, label="(49, 3, 64, 32)"]; -"316 select_3" -> "322 div_2" [style=solid, label="(49, 3, 64, 32)"]; -"317 select_4" -> "323 linalg_vector_norm_3" [style=solid, label="(49, 3, 64, 32)"]; -"317 select_4" -> "325 expand_as_3" [style=solid, label="(49, 3, 64, 32)"]; -"317 select_4" -> "326 div_3" [style=solid, label="(49, 3, 64, 32)"]; -"318 select_5" -> "365 matmul_3" [style=solid, label="(49, 3, 64, 32)"]; -"319 linalg_vector_norm_2" -> "320 clamp_min_2" [style=solid, label="(49, 3, 64, 1)"]; -"320 clamp_min_2" -> "321 expand_as_2" [style=solid, label="(49, 3, 64, 1)"]; -"321 expand_as_2" -> "322 div_2" [style=solid, label="(49, 3, 64, 32)"]; -"322 div_2" -> "328 matmul_2" [style=solid, label="(49, 3, 64, 32)"]; -"323 linalg_vector_norm_3" -> "324 clamp_min_3" [style=solid, label="(49, 3, 64, 1)"]; -"324 clamp_min_3" -> "325 expand_as_3" [style=solid, label="(49, 3, 64, 1)"]; -"325 expand_as_3" -> "326 div_3" [style=solid, label="(49, 3, 64, 32)"]; -"326 div_3" -> "327 transpose_2" [style=solid, label="(49, 3, 64, 32)"]; -"327 transpose_2" -> "328 matmul_2" [style=solid, label="(49, 3, 32, 64)"]; -"328 matmul_2" -> "329 quantize_per_tensor_83" [style=solid, label="(49, 3, 64, 64)"]; -"329 quantize_per_tensor_83" -> "330 dequantize_per_tensor_84" [style=solid, label="(49, 3, 64, 64)"]; -"330 dequantize_per_tensor_84" -> "333 mul_3" [style=solid, label="(49, 3, 64, 64)"]; -"331 _frozen_param15" -> "332 dequantize_per_tensor_85" [style=solid, label="(3, 1, 1)"]; -"332 dequantize_per_tensor_85" -> "333 mul_3" [style=solid, label="(3, 1, 1)"]; -"333 mul_3" -> "334 quantize_per_tensor_86" [style=solid, label="(49, 3, 64, 64)"]; -"334 quantize_per_tensor_86" -> "335 dequantize_per_tensor_87" [style=solid, label="(49, 3, 64, 64)"]; -"335 dequantize_per_tensor_87" -> "336 add_3" [style=solid, label="(49, 3, 64, 64)"]; -"336 add_3" -> "337 quantize_per_tensor_88" [style=solid, label="(49, 3, 64, 64)"]; 
-"337 quantize_per_tensor_88" -> "338 dequantize_per_tensor_89" [style=solid, label="(49, 3, 64, 64)"]; -"338 dequantize_per_tensor_89" -> "350 view_8" [style=solid, label="(49, 3, 64, 64)"]; -"339 new_zeros" -> "340 view_7" [style=solid, label="(56, 56)"]; -"340 view_7" -> "341 permute_8" [style=solid, label="(7, 8, 7, 8)"]; -"341 permute_8" -> "342 reshape_6" [style=solid, label="(7, 7, 8, 8)"]; -"342 reshape_6" -> "343 unsqueeze_2" [style=solid, label="(49, 64)"]; -"342 reshape_6" -> "344 unsqueeze_3" [style=solid, label="(49, 64)"]; -"343 unsqueeze_2" -> "345 sub" [style=solid, label="(49, 1, 64)"]; -"344 unsqueeze_3" -> "345 sub" [style=solid, label="(49, 64, 1)"]; -"345 sub" -> "346 ne" [style=solid, label="(49, 64, 64)"]; -"345 sub" -> "347 masked_fill" [style=solid, label="(49, 64, 64)"]; -"345 sub" -> "348 eq" [style=solid, label="(49, 64, 64)"]; -"346 ne" -> "347 masked_fill" [style=solid, label="(49, 64, 64)"]; -"347 masked_fill" -> "349 masked_fill_1" [style=solid, label="(49, 64, 64)"]; -"348 eq" -> "349 masked_fill_1" [style=solid, label="(49, 64, 64)"]; -"349 masked_fill_1" -> "353 unsqueeze_4" [style=solid, label="(49, 64, 64)"]; -"350 view_8" -> "351 quantize_per_tensor_90" [style=solid, label="(1, 49, 3, 64, 64)"]; -"351 quantize_per_tensor_90" -> "352 dequantize_per_tensor_91" [style=solid, label="(1, 49, 3, 64, 64)"]; -"352 dequantize_per_tensor_91" -> "357 add_4" [style=solid, label="(1, 49, 3, 64, 64)"]; -"353 unsqueeze_4" -> "354 unsqueeze_5" [style=solid, label="(49, 1, 64, 64)"]; -"354 unsqueeze_5" -> "355 quantize_per_tensor_92" [style=solid, label="(1, 49, 1, 64, 64)"]; -"355 quantize_per_tensor_92" -> "356 dequantize_per_tensor_93" [style=solid, label="(1, 49, 1, 64, 64)"]; -"356 dequantize_per_tensor_93" -> "357 add_4" [style=solid, label="(1, 49, 1, 64, 64)"]; -"357 add_4" -> "358 quantize_per_tensor_94" [style=solid, label="(1, 49, 3, 64, 64)"]; -"358 quantize_per_tensor_94" -> "359 dequantize_per_tensor_95" [style=solid, label="(1, 
49, 3, 64, 64)"]; -"359 dequantize_per_tensor_95" -> "360 view_9" [style=solid, label="(1, 49, 3, 64, 64)"]; -"360 view_9" -> "361 quantize_per_tensor_96" [style=solid, label="(49, 3, 64, 64)"]; -"361 quantize_per_tensor_96" -> "362 dequantize_per_tensor_97" [style=solid, label="(49, 3, 64, 64)"]; -"362 dequantize_per_tensor_97" -> "363 softmax_1" [style=solid, label="(49, 3, 64, 64)"]; -"363 softmax_1" -> "364 dropout_4" [style=solid, label="(49, 3, 64, 64)"]; -"364 dropout_4" -> "365 matmul_3" [style=solid, label="(49, 3, 64, 64)"]; -"365 matmul_3" -> "366 transpose_3" [style=solid, label="(49, 3, 64, 32)"]; -"366 transpose_3" -> "367 reshape_7" [style=solid, label="(49, 64, 3, 32)"]; -"367 reshape_7" -> "368 reshape_7_0_0_nncf_smooth_quant_0" [style=solid, label="(49, 64, 96)"]; -"368 reshape_7_0_0_nncf_smooth_quant_0" -> "369 quantize_per_tensor_98" [style=solid, label="(49, 64, 96)"]; -"369 quantize_per_tensor_98" -> "370 dequantize_per_tensor_99" [style=solid, label="(49, 64, 96)"]; -"370 dequantize_per_tensor_99" -> "373 linear_9" [style=solid, label="(49, 64, 96)"]; -"371 _frozen_param16" -> "372 dequantize_per_tensor_100" [style=solid, label="(96, 96)"]; -"372 dequantize_per_tensor_100" -> "373 linear_9" [style=solid, label="(96, 96)"]; -"373 linear_9" -> "374 quantize_per_tensor_101" [style=solid, label="(49, 64, 96)"]; -"374 quantize_per_tensor_101" -> "375 dequantize_per_tensor_102" [style=solid, label="(49, 64, 96)"]; -"375 dequantize_per_tensor_102" -> "376 dropout_5" [style=solid, label="(49, 64, 96)"]; -"376 dropout_5" -> "377 view_10" [style=solid, label="(49, 64, 96)"]; -"377 view_10" -> "378 permute_9" [style=solid, label="(1, 7, 7, 8, 8, 96)"]; -"378 permute_9" -> "379 reshape_8" [style=solid, label="(1, 7, 8, 7, 8, 96)"]; -"379 reshape_8" -> "380 roll_1" [style=solid, label="(1, 56, 56, 96)"]; -"380 roll_1" -> "381 slice_23" [style=solid, label="(1, 56, 56, 96)"]; -"381 slice_23" -> "382 slice_24" [style=solid, label="(1, 56, 56, 96)"]; -"382 
slice_24" -> "383 layer_norm_3" [style=solid, label="(1, 56, 56, 96)"]; -"383 layer_norm_3" -> "384 quantize_per_tensor_103" [style=solid, label="(1, 56, 56, 96)"]; -"384 quantize_per_tensor_103" -> "385 dequantize_per_tensor_104" [style=solid, label="(1, 56, 56, 96)"]; -"385 dequantize_per_tensor_104" -> "386 add_5" [style=solid, label="(1, 56, 56, 96)"]; -"386 add_5" -> "387 quantize_per_tensor_105" [style=solid, label="(1, 56, 56, 96)"]; -"387 quantize_per_tensor_105" -> "388 dequantize_per_tensor_106" [style=solid, label="(1, 56, 56, 96)"]; -"387 quantize_per_tensor_105" -> "389 dequantize_per_tensor_107" [style=solid, label="(1, 56, 56, 96)"]; -"388 dequantize_per_tensor_106" -> "412 add_6" [style=solid, label="(1, 56, 56, 96)"]; -"389 dequantize_per_tensor_107" -> "390 add_5_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 56, 56, 96)"]; -"390 add_5_0_0_nncf_smooth_quant_0" -> "391 quantize_per_tensor_108" [style=solid, label="(1, 56, 56, 96)"]; -"391 quantize_per_tensor_108" -> "392 dequantize_per_tensor_109" [style=solid, label="(1, 56, 56, 96)"]; -"392 dequantize_per_tensor_109" -> "395 linear_10" [style=solid, label="(1, 56, 56, 96)"]; -"393 _frozen_param17" -> "394 dequantize_per_tensor_110" [style=solid, label="(384, 96)"]; -"394 dequantize_per_tensor_110" -> "395 linear_10" [style=solid, label="(384, 96)"]; -"395 linear_10" -> "396 quantize_per_tensor_111" [style=solid, label="(1, 56, 56, 384)"]; -"396 quantize_per_tensor_111" -> "397 dequantize_per_tensor_112" [style=solid, label="(1, 56, 56, 384)"]; -"397 dequantize_per_tensor_112" -> "398 gelu_1" [style=solid, label="(1, 56, 56, 384)"]; -"398 gelu_1" -> "399 dropout_6" [style=solid, label="(1, 56, 56, 384)"]; -"399 dropout_6" -> "400 dropout_6_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 56, 56, 384)"]; -"400 dropout_6_0_0_nncf_smooth_quant_0" -> "401 quantize_per_tensor_113" [style=solid, label="(1, 56, 56, 384)"]; -"401 quantize_per_tensor_113" -> "402 dequantize_per_tensor_114" 
[style=solid, label="(1, 56, 56, 384)"]; -"402 dequantize_per_tensor_114" -> "405 linear_11" [style=solid, label="(1, 56, 56, 384)"]; -"403 _frozen_param18" -> "404 dequantize_per_tensor_115" [style=solid, label="(96, 384)"]; -"404 dequantize_per_tensor_115" -> "405 linear_11" [style=solid, label="(96, 384)"]; -"405 linear_11" -> "406 quantize_per_tensor_116" [style=solid, label="(1, 56, 56, 96)"]; -"406 quantize_per_tensor_116" -> "407 dequantize_per_tensor_117" [style=solid, label="(1, 56, 56, 96)"]; -"407 dequantize_per_tensor_117" -> "408 dropout_7" [style=solid, label="(1, 56, 56, 96)"]; -"408 dropout_7" -> "409 layer_norm_4" [style=solid, label="(1, 56, 56, 96)"]; -"409 layer_norm_4" -> "410 quantize_per_tensor_118" [style=solid, label="(1, 56, 56, 96)"]; -"410 quantize_per_tensor_118" -> "411 dequantize_per_tensor_119" [style=solid, label="(1, 56, 56, 96)"]; -"411 dequantize_per_tensor_119" -> "412 add_6" [style=solid, label="(1, 56, 56, 96)"]; -"412 add_6" -> "413 quantize_per_tensor_120" [style=solid, label="(1, 56, 56, 96)"]; -"413 quantize_per_tensor_120" -> "414 dequantize_per_tensor_121" [style=solid, label="(1, 56, 56, 96)"]; -"414 dequantize_per_tensor_121" -> "415 pad_2" [style=solid, label="(1, 56, 56, 96)"]; -"415 pad_2" -> "416 slice_25" [style=solid, label="(1, 56, 56, 96)"]; -"415 pad_2" -> "421 slice_28" [style=solid, label="(1, 56, 56, 96)"]; -"415 pad_2" -> "426 slice_31" [style=solid, label="(1, 56, 56, 96)"]; -"415 pad_2" -> "431 slice_34" [style=solid, label="(1, 56, 56, 96)"]; -"416 slice_25" -> "417 slice_26" [style=solid, label="(1, 28, 56, 96)"]; -"417 slice_26" -> "418 slice_27" [style=solid, label="(1, 28, 28, 96)"]; -"418 slice_27" -> "419 quantize_per_tensor_122" [style=solid, label="(1, 28, 28, 96)"]; -"419 quantize_per_tensor_122" -> "420 dequantize_per_tensor_123" [style=solid, label="(1, 28, 28, 96)"]; -"420 dequantize_per_tensor_123" -> "436 cat" [style=solid, label="(1, 28, 28, 96)"]; -"421 slice_28" -> "422 slice_29" 
[style=solid, label="(1, 28, 56, 96)"]; -"422 slice_29" -> "423 slice_30" [style=solid, label="(1, 28, 28, 96)"]; -"423 slice_30" -> "424 quantize_per_tensor_124" [style=solid, label="(1, 28, 28, 96)"]; -"424 quantize_per_tensor_124" -> "425 dequantize_per_tensor_125" [style=solid, label="(1, 28, 28, 96)"]; -"425 dequantize_per_tensor_125" -> "436 cat" [style=solid, label="(1, 28, 28, 96)"]; -"426 slice_31" -> "427 slice_32" [style=solid, label="(1, 28, 56, 96)"]; -"427 slice_32" -> "428 slice_33" [style=solid, label="(1, 28, 28, 96)"]; -"428 slice_33" -> "429 quantize_per_tensor_126" [style=solid, label="(1, 28, 28, 96)"]; -"429 quantize_per_tensor_126" -> "430 dequantize_per_tensor_127" [style=solid, label="(1, 28, 28, 96)"]; -"430 dequantize_per_tensor_127" -> "436 cat" [style=solid, label="(1, 28, 28, 96)"]; -"431 slice_34" -> "432 slice_35" [style=solid, label="(1, 28, 56, 96)"]; -"432 slice_35" -> "433 slice_36" [style=solid, label="(1, 28, 28, 96)"]; -"433 slice_36" -> "434 quantize_per_tensor_128" [style=solid, label="(1, 28, 28, 96)"]; -"434 quantize_per_tensor_128" -> "435 dequantize_per_tensor_129" [style=solid, label="(1, 28, 28, 96)"]; -"435 dequantize_per_tensor_129" -> "436 cat" [style=solid, label="(1, 28, 28, 96)"]; -"436 cat" -> "437 quantize_per_tensor_130" [style=solid, label="(1, 28, 28, 384)"]; -"437 quantize_per_tensor_130" -> "438 dequantize_per_tensor_131" [style=solid, label="(1, 28, 28, 384)"]; -"438 dequantize_per_tensor_131" -> "439 cat_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 28, 28, 384)"]; -"439 cat_0_0_nncf_smooth_quant_0" -> "440 quantize_per_tensor_132" [style=solid, label="(1, 28, 28, 384)"]; -"440 quantize_per_tensor_132" -> "441 dequantize_per_tensor_133" [style=solid, label="(1, 28, 28, 384)"]; -"441 dequantize_per_tensor_133" -> "444 linear_12" [style=solid, label="(1, 28, 28, 384)"]; -"442 _frozen_param19" -> "443 dequantize_per_tensor_134" [style=solid, label="(192, 384)"]; -"443 dequantize_per_tensor_134" -> "444 
linear_12" [style=solid, label="(192, 384)"]; -"444 linear_12" -> "445 quantize_per_tensor_135" [style=solid, label="(1, 28, 28, 192)"]; -"445 quantize_per_tensor_135" -> "446 dequantize_per_tensor_136" [style=solid, label="(1, 28, 28, 192)"]; -"446 dequantize_per_tensor_136" -> "447 layer_norm_5" [style=solid, label="(1, 28, 28, 192)"]; -"447 layer_norm_5" -> "480 pad_3" [style=solid, label="(1, 28, 28, 192)"]; -"447 layer_norm_5" -> "543 quantize_per_tensor_172" [style=solid, label="(1, 28, 28, 192)"]; -"448 _frozen_param20" -> "449 dequantize_per_tensor_137" [style=solid, label="(1, 15, 15, 2)"]; -"449 dequantize_per_tensor_137" -> "452 linear_13" [style=solid, label="(1, 15, 15, 2)"]; -"450 _frozen_param21" -> "451 dequantize_per_tensor_138" [style=solid, label="(512, 2)"]; -"451 dequantize_per_tensor_138" -> "452 linear_13" [style=solid, label="(512, 2)"]; -"452 linear_13" -> "453 relu__2" [style=solid, label="(1, 15, 15, 512)"]; -"453 relu__2" -> "454 quantize_per_tensor_139" [style=solid, label="(1, 15, 15, 512)"]; -"454 quantize_per_tensor_139" -> "455 dequantize_per_tensor_140" [style=solid, label="(1, 15, 15, 512)"]; -"455 dequantize_per_tensor_140" -> "456 relu__2_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 15, 15, 512)"]; -"456 relu__2_0_0_nncf_smooth_quant_0" -> "457 quantize_per_tensor_141" [style=solid, label="(1, 15, 15, 512)"]; -"457 quantize_per_tensor_141" -> "458 dequantize_per_tensor_142" [style=solid, label="(1, 15, 15, 512)"]; -"458 dequantize_per_tensor_142" -> "461 linear_14" [style=solid, label="(1, 15, 15, 512)"]; -"459 _frozen_param22" -> "460 dequantize_per_tensor_143" [style=solid, label="(6, 512)"]; -"460 dequantize_per_tensor_143" -> "461 linear_14" [style=solid, label="(6, 512)"]; -"461 linear_14" -> "462 quantize_per_tensor_144" [style=solid, label="(1, 15, 15, 6)"]; -"462 quantize_per_tensor_144" -> "463 dequantize_per_tensor_145" [style=solid, label="(1, 15, 15, 6)"]; -"463 dequantize_per_tensor_145" -> "464 view_11" 
[style=solid, label="(1, 15, 15, 6)"]; -"464 view_11" -> "465 quantize_per_tensor_146" [style=solid, label="(225, 6)"]; -"465 quantize_per_tensor_146" -> "466 dequantize_per_tensor_147" [style=solid, label="(225, 6)"]; -"466 dequantize_per_tensor_147" -> "467 index_2" [style=solid, label="(225, 6)"]; -"467 index_2" -> "468 view_12" [style=solid, label="(4096, 6)"]; -"468 view_12" -> "469 permute_10" [style=solid, label="(64, 64, 6)"]; -"469 permute_10" -> "470 contiguous_2" [style=solid, label="(6, 64, 64)"]; -"470 contiguous_2" -> "471 unsqueeze_6" [style=solid, label="(6, 64, 64)"]; -"471 unsqueeze_6" -> "472 sigmoid_2" [style=solid, label="(1, 6, 64, 64)"]; -"472 sigmoid_2" -> "473 quantize_per_tensor_148" [style=solid, label="(1, 6, 64, 64)"]; -"473 quantize_per_tensor_148" -> "474 dequantize_per_tensor_149" [style=solid, label="(1, 6, 64, 64)"]; -"474 dequantize_per_tensor_149" -> "477 mul_4" [style=solid, label="(1, 6, 64, 64)"]; -"475 _frozen_param23" -> "476 dequantize_per_tensor_150" [style=solid, label="()"]; -"476 dequantize_per_tensor_150" -> "477 mul_4" [style=solid, label="()"]; -"477 mul_4" -> "478 quantize_per_tensor_151" [style=solid, label="(1, 6, 64, 64)"]; -"478 quantize_per_tensor_151" -> "479 dequantize_per_tensor_152" [style=solid, label="(1, 6, 64, 64)"]; -"479 dequantize_per_tensor_152" -> "515 add_7" [style=solid, label="(1, 6, 64, 64)"]; -"480 pad_3" -> "481 view_13" [style=solid, label="(1, 32, 32, 192)"]; -"481 view_13" -> "482 permute_11" [style=solid, label="(1, 4, 8, 4, 8, 192)"]; -"482 permute_11" -> "483 reshape_9" [style=solid, label="(1, 4, 4, 8, 8, 192)"]; -"483 reshape_9" -> "485 reshape_9_0_0_nncf_smooth_quant_0" [style=solid, label="(16, 64, 192)"]; -"484 clone_2" -> "490 linear_15" [style=solid, label="(576,)"]; -"485 reshape_9_0_0_nncf_smooth_quant_0" -> "486 quantize_per_tensor_153" [style=solid, label="(16, 64, 192)"]; -"486 quantize_per_tensor_153" -> "487 dequantize_per_tensor_154" [style=solid, label="(16, 64, 192)"]; 
-"487 dequantize_per_tensor_154" -> "490 linear_15" [style=solid, label="(16, 64, 192)"]; -"488 _frozen_param24" -> "489 dequantize_per_tensor_155" [style=solid, label="(576, 192)"]; -"489 dequantize_per_tensor_155" -> "490 linear_15" [style=solid, label="(576, 192)"]; -"490 linear_15" -> "491 quantize_per_tensor_156" [style=solid, label="(16, 64, 576)"]; -"491 quantize_per_tensor_156" -> "492 dequantize_per_tensor_157" [style=solid, label="(16, 64, 576)"]; -"492 dequantize_per_tensor_157" -> "493 reshape_10" [style=solid, label="(16, 64, 576)"]; -"493 reshape_10" -> "494 permute_12" [style=solid, label="(16, 64, 3, 6, 32)"]; -"494 permute_12" -> "495 select_6" [style=solid, label="(3, 16, 6, 64, 32)"]; -"494 permute_12" -> "496 select_7" [style=solid, label="(3, 16, 6, 64, 32)"]; -"494 permute_12" -> "497 select_8" [style=solid, label="(3, 16, 6, 64, 32)"]; -"495 select_6" -> "498 linalg_vector_norm_4" [style=solid, label="(16, 6, 64, 32)"]; -"495 select_6" -> "500 expand_as_4" [style=solid, label="(16, 6, 64, 32)"]; -"495 select_6" -> "501 div_4" [style=solid, label="(16, 6, 64, 32)"]; -"496 select_7" -> "502 linalg_vector_norm_5" [style=solid, label="(16, 6, 64, 32)"]; -"496 select_7" -> "504 expand_as_5" [style=solid, label="(16, 6, 64, 32)"]; -"496 select_7" -> "505 div_5" [style=solid, label="(16, 6, 64, 32)"]; -"497 select_8" -> "520 matmul_5" [style=solid, label="(16, 6, 64, 32)"]; -"498 linalg_vector_norm_4" -> "499 clamp_min_4" [style=solid, label="(16, 6, 64, 1)"]; -"499 clamp_min_4" -> "500 expand_as_4" [style=solid, label="(16, 6, 64, 1)"]; -"500 expand_as_4" -> "501 div_4" [style=solid, label="(16, 6, 64, 32)"]; -"501 div_4" -> "507 matmul_4" [style=solid, label="(16, 6, 64, 32)"]; -"502 linalg_vector_norm_5" -> "503 clamp_min_5" [style=solid, label="(16, 6, 64, 1)"]; -"503 clamp_min_5" -> "504 expand_as_5" [style=solid, label="(16, 6, 64, 1)"]; -"504 expand_as_5" -> "505 div_5" [style=solid, label="(16, 6, 64, 32)"]; -"505 div_5" -> "506 transpose_4" 
[style=solid, label="(16, 6, 64, 32)"]; -"506 transpose_4" -> "507 matmul_4" [style=solid, label="(16, 6, 32, 64)"]; -"507 matmul_4" -> "508 quantize_per_tensor_158" [style=solid, label="(16, 6, 64, 64)"]; -"508 quantize_per_tensor_158" -> "509 dequantize_per_tensor_159" [style=solid, label="(16, 6, 64, 64)"]; -"509 dequantize_per_tensor_159" -> "512 mul_5" [style=solid, label="(16, 6, 64, 64)"]; -"510 _frozen_param25" -> "511 dequantize_per_tensor_160" [style=solid, label="(6, 1, 1)"]; -"511 dequantize_per_tensor_160" -> "512 mul_5" [style=solid, label="(6, 1, 1)"]; -"512 mul_5" -> "513 quantize_per_tensor_161" [style=solid, label="(16, 6, 64, 64)"]; -"513 quantize_per_tensor_161" -> "514 dequantize_per_tensor_162" [style=solid, label="(16, 6, 64, 64)"]; -"514 dequantize_per_tensor_162" -> "515 add_7" [style=solid, label="(16, 6, 64, 64)"]; -"515 add_7" -> "516 quantize_per_tensor_163" [style=solid, label="(16, 6, 64, 64)"]; -"516 quantize_per_tensor_163" -> "517 dequantize_per_tensor_164" [style=solid, label="(16, 6, 64, 64)"]; -"517 dequantize_per_tensor_164" -> "518 softmax_2" [style=solid, label="(16, 6, 64, 64)"]; -"518 softmax_2" -> "519 dropout_8" [style=solid, label="(16, 6, 64, 64)"]; -"519 dropout_8" -> "520 matmul_5" [style=solid, label="(16, 6, 64, 64)"]; -"520 matmul_5" -> "521 transpose_5" [style=solid, label="(16, 6, 64, 32)"]; -"521 transpose_5" -> "522 reshape_11" [style=solid, label="(16, 64, 6, 32)"]; -"522 reshape_11" -> "523 reshape_11_0_0_nncf_smooth_quant_0" [style=solid, label="(16, 64, 192)"]; -"523 reshape_11_0_0_nncf_smooth_quant_0" -> "524 quantize_per_tensor_165" [style=solid, label="(16, 64, 192)"]; -"524 quantize_per_tensor_165" -> "525 dequantize_per_tensor_166" [style=solid, label="(16, 64, 192)"]; -"525 dequantize_per_tensor_166" -> "528 linear_16" [style=solid, label="(16, 64, 192)"]; -"526 _frozen_param26" -> "527 dequantize_per_tensor_167" [style=solid, label="(192, 192)"]; -"527 dequantize_per_tensor_167" -> "528 linear_16" 
[style=solid, label="(192, 192)"]; -"528 linear_16" -> "529 quantize_per_tensor_168" [style=solid, label="(16, 64, 192)"]; -"529 quantize_per_tensor_168" -> "530 dequantize_per_tensor_169" [style=solid, label="(16, 64, 192)"]; -"530 dequantize_per_tensor_169" -> "531 dropout_9" [style=solid, label="(16, 64, 192)"]; -"531 dropout_9" -> "532 view_14" [style=solid, label="(16, 64, 192)"]; -"532 view_14" -> "533 permute_13" [style=solid, label="(1, 4, 4, 8, 8, 192)"]; -"533 permute_13" -> "534 reshape_12" [style=solid, label="(1, 4, 8, 4, 8, 192)"]; -"534 reshape_12" -> "535 slice_38" [style=solid, label="(1, 32, 32, 192)"]; -"535 slice_38" -> "536 slice_39" [style=solid, label="(1, 32, 32, 192)"]; -"536 slice_39" -> "537 slice_40" [style=solid, label="(1, 28, 32, 192)"]; -"537 slice_40" -> "538 slice_41" [style=solid, label="(1, 28, 28, 192)"]; -"538 slice_41" -> "539 contiguous_3" [style=solid, label="(1, 28, 28, 192)"]; -"539 contiguous_3" -> "540 layer_norm_6" [style=solid, label="(1, 28, 28, 192)"]; -"540 layer_norm_6" -> "541 quantize_per_tensor_170" [style=solid, label="(1, 28, 28, 192)"]; -"541 quantize_per_tensor_170" -> "542 dequantize_per_tensor_171" [style=solid, label="(1, 28, 28, 192)"]; -"542 dequantize_per_tensor_171" -> "545 add_8" [style=solid, label="(1, 28, 28, 192)"]; -"543 quantize_per_tensor_172" -> "544 dequantize_per_tensor_173" [style=solid, label="(1, 28, 28, 192)"]; -"544 dequantize_per_tensor_173" -> "545 add_8" [style=solid, label="(1, 28, 28, 192)"]; -"545 add_8" -> "546 quantize_per_tensor_174" [style=solid, label="(1, 28, 28, 192)"]; -"546 quantize_per_tensor_174" -> "547 dequantize_per_tensor_175" [style=solid, label="(1, 28, 28, 192)"]; -"546 quantize_per_tensor_174" -> "548 dequantize_per_tensor_176" [style=solid, label="(1, 28, 28, 192)"]; -"547 dequantize_per_tensor_175" -> "571 add_9" [style=solid, label="(1, 28, 28, 192)"]; -"548 dequantize_per_tensor_176" -> "549 add_8_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 28, 28, 
192)"]; -"549 add_8_0_0_nncf_smooth_quant_0" -> "550 quantize_per_tensor_177" [style=solid, label="(1, 28, 28, 192)"]; -"550 quantize_per_tensor_177" -> "551 dequantize_per_tensor_178" [style=solid, label="(1, 28, 28, 192)"]; -"551 dequantize_per_tensor_178" -> "554 linear_17" [style=solid, label="(1, 28, 28, 192)"]; -"552 _frozen_param27" -> "553 dequantize_per_tensor_179" [style=solid, label="(768, 192)"]; -"553 dequantize_per_tensor_179" -> "554 linear_17" [style=solid, label="(768, 192)"]; -"554 linear_17" -> "555 quantize_per_tensor_180" [style=solid, label="(1, 28, 28, 768)"]; -"555 quantize_per_tensor_180" -> "556 dequantize_per_tensor_181" [style=solid, label="(1, 28, 28, 768)"]; -"556 dequantize_per_tensor_181" -> "557 gelu_2" [style=solid, label="(1, 28, 28, 768)"]; -"557 gelu_2" -> "558 dropout_10" [style=solid, label="(1, 28, 28, 768)"]; -"558 dropout_10" -> "559 dropout_10_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 28, 28, 768)"]; -"559 dropout_10_0_0_nncf_smooth_quant_0" -> "560 quantize_per_tensor_182" [style=solid, label="(1, 28, 28, 768)"]; -"560 quantize_per_tensor_182" -> "561 dequantize_per_tensor_183" [style=solid, label="(1, 28, 28, 768)"]; -"561 dequantize_per_tensor_183" -> "564 linear_18" [style=solid, label="(1, 28, 28, 768)"]; -"562 _frozen_param28" -> "563 dequantize_per_tensor_184" [style=solid, label="(192, 768)"]; -"563 dequantize_per_tensor_184" -> "564 linear_18" [style=solid, label="(192, 768)"]; -"564 linear_18" -> "565 quantize_per_tensor_185" [style=solid, label="(1, 28, 28, 192)"]; -"565 quantize_per_tensor_185" -> "566 dequantize_per_tensor_186" [style=solid, label="(1, 28, 28, 192)"]; -"566 dequantize_per_tensor_186" -> "567 dropout_11" [style=solid, label="(1, 28, 28, 192)"]; -"567 dropout_11" -> "568 layer_norm_7" [style=solid, label="(1, 28, 28, 192)"]; -"568 layer_norm_7" -> "569 quantize_per_tensor_187" [style=solid, label="(1, 28, 28, 192)"]; -"569 quantize_per_tensor_187" -> "570 dequantize_per_tensor_188" 
[style=solid, label="(1, 28, 28, 192)"]; -"570 dequantize_per_tensor_188" -> "571 add_9" [style=solid, label="(1, 28, 28, 192)"]; -"571 add_9" -> "572 quantize_per_tensor_189" [style=solid, label="(1, 28, 28, 192)"]; -"572 quantize_per_tensor_189" -> "573 dequantize_per_tensor_190" [style=solid, label="(1, 28, 28, 192)"]; -"572 quantize_per_tensor_189" -> "574 dequantize_per_tensor_191" [style=solid, label="(1, 28, 28, 192)"]; -"573 dequantize_per_tensor_190" -> "696 add_12" [style=solid, label="(1, 28, 28, 192)"]; -"574 dequantize_per_tensor_191" -> "607 pad_4" [style=solid, label="(1, 28, 28, 192)"]; -"575 _frozen_param29" -> "576 dequantize_per_tensor_192" [style=solid, label="(1, 15, 15, 2)"]; -"576 dequantize_per_tensor_192" -> "579 linear_19" [style=solid, label="(1, 15, 15, 2)"]; -"577 _frozen_param30" -> "578 dequantize_per_tensor_193" [style=solid, label="(512, 2)"]; -"578 dequantize_per_tensor_193" -> "579 linear_19" [style=solid, label="(512, 2)"]; -"579 linear_19" -> "580 relu__3" [style=solid, label="(1, 15, 15, 512)"]; -"580 relu__3" -> "581 quantize_per_tensor_194" [style=solid, label="(1, 15, 15, 512)"]; -"581 quantize_per_tensor_194" -> "582 dequantize_per_tensor_195" [style=solid, label="(1, 15, 15, 512)"]; -"582 dequantize_per_tensor_195" -> "583 relu__3_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 15, 15, 512)"]; -"583 relu__3_0_0_nncf_smooth_quant_0" -> "584 quantize_per_tensor_196" [style=solid, label="(1, 15, 15, 512)"]; -"584 quantize_per_tensor_196" -> "585 dequantize_per_tensor_197" [style=solid, label="(1, 15, 15, 512)"]; -"585 dequantize_per_tensor_197" -> "588 linear_20" [style=solid, label="(1, 15, 15, 512)"]; -"586 _frozen_param31" -> "587 dequantize_per_tensor_198" [style=solid, label="(6, 512)"]; -"587 dequantize_per_tensor_198" -> "588 linear_20" [style=solid, label="(6, 512)"]; -"588 linear_20" -> "589 quantize_per_tensor_199" [style=solid, label="(1, 15, 15, 6)"]; -"589 quantize_per_tensor_199" -> "590 
dequantize_per_tensor_200" [style=solid, label="(1, 15, 15, 6)"]; -"590 dequantize_per_tensor_200" -> "591 view_15" [style=solid, label="(1, 15, 15, 6)"]; -"591 view_15" -> "592 quantize_per_tensor_201" [style=solid, label="(225, 6)"]; -"592 quantize_per_tensor_201" -> "593 dequantize_per_tensor_202" [style=solid, label="(225, 6)"]; -"593 dequantize_per_tensor_202" -> "594 index_3" [style=solid, label="(225, 6)"]; -"594 index_3" -> "595 view_16" [style=solid, label="(4096, 6)"]; -"595 view_16" -> "596 permute_14" [style=solid, label="(64, 64, 6)"]; -"596 permute_14" -> "597 contiguous_4" [style=solid, label="(6, 64, 64)"]; -"597 contiguous_4" -> "598 unsqueeze_7" [style=solid, label="(6, 64, 64)"]; -"598 unsqueeze_7" -> "599 sigmoid_3" [style=solid, label="(1, 6, 64, 64)"]; -"599 sigmoid_3" -> "600 quantize_per_tensor_203" [style=solid, label="(1, 6, 64, 64)"]; -"600 quantize_per_tensor_203" -> "601 dequantize_per_tensor_204" [style=solid, label="(1, 6, 64, 64)"]; -"601 dequantize_per_tensor_204" -> "604 mul_6" [style=solid, label="(1, 6, 64, 64)"]; -"602 _frozen_param32" -> "603 dequantize_per_tensor_205" [style=solid, label="()"]; -"603 dequantize_per_tensor_205" -> "604 mul_6" [style=solid, label="()"]; -"604 mul_6" -> "605 quantize_per_tensor_206" [style=solid, label="(1, 6, 64, 64)"]; -"605 quantize_per_tensor_206" -> "606 dequantize_per_tensor_207" [style=solid, label="(1, 6, 64, 64)"]; -"606 dequantize_per_tensor_207" -> "643 add_10" [style=solid, label="(1, 6, 64, 64)"]; -"607 pad_4" -> "608 roll_2" [style=solid, label="(1, 32, 32, 192)"]; -"608 roll_2" -> "609 view_17" [style=solid, label="(1, 32, 32, 192)"]; -"609 view_17" -> "610 permute_15" [style=solid, label="(1, 4, 8, 4, 8, 192)"]; -"610 permute_15" -> "611 reshape_13" [style=solid, label="(1, 4, 4, 8, 8, 192)"]; -"611 reshape_13" -> "613 reshape_13_0_0_nncf_smooth_quant_0" [style=solid, label="(16, 64, 192)"]; -"611 reshape_13" -> "646 new_zeros_1" [style=solid, label="(16, 64, 192)"]; -"612 
clone_3" -> "618 linear_21" [style=solid, label="(576,)"]; -"613 reshape_13_0_0_nncf_smooth_quant_0" -> "614 quantize_per_tensor_208" [style=solid, label="(16, 64, 192)"]; -"614 quantize_per_tensor_208" -> "615 dequantize_per_tensor_209" [style=solid, label="(16, 64, 192)"]; -"615 dequantize_per_tensor_209" -> "618 linear_21" [style=solid, label="(16, 64, 192)"]; -"616 _frozen_param33" -> "617 dequantize_per_tensor_210" [style=solid, label="(576, 192)"]; -"617 dequantize_per_tensor_210" -> "618 linear_21" [style=solid, label="(576, 192)"]; -"618 linear_21" -> "619 quantize_per_tensor_211" [style=solid, label="(16, 64, 576)"]; -"619 quantize_per_tensor_211" -> "620 dequantize_per_tensor_212" [style=solid, label="(16, 64, 576)"]; -"620 dequantize_per_tensor_212" -> "621 reshape_14" [style=solid, label="(16, 64, 576)"]; -"621 reshape_14" -> "622 permute_16" [style=solid, label="(16, 64, 3, 6, 32)"]; -"622 permute_16" -> "623 select_9" [style=solid, label="(3, 16, 6, 64, 32)"]; -"622 permute_16" -> "624 select_10" [style=solid, label="(3, 16, 6, 64, 32)"]; -"622 permute_16" -> "625 select_11" [style=solid, label="(3, 16, 6, 64, 32)"]; -"623 select_9" -> "626 linalg_vector_norm_6" [style=solid, label="(16, 6, 64, 32)"]; -"623 select_9" -> "628 expand_as_6" [style=solid, label="(16, 6, 64, 32)"]; -"623 select_9" -> "629 div_6" [style=solid, label="(16, 6, 64, 32)"]; -"624 select_10" -> "630 linalg_vector_norm_7" [style=solid, label="(16, 6, 64, 32)"]; -"624 select_10" -> "632 expand_as_7" [style=solid, label="(16, 6, 64, 32)"]; -"624 select_10" -> "633 div_7" [style=solid, label="(16, 6, 64, 32)"]; -"625 select_11" -> "672 matmul_7" [style=solid, label="(16, 6, 64, 32)"]; -"626 linalg_vector_norm_6" -> "627 clamp_min_6" [style=solid, label="(16, 6, 64, 1)"]; -"627 clamp_min_6" -> "628 expand_as_6" [style=solid, label="(16, 6, 64, 1)"]; -"628 expand_as_6" -> "629 div_6" [style=solid, label="(16, 6, 64, 32)"]; -"629 div_6" -> "635 matmul_6" [style=solid, label="(16, 6, 64, 
32)"]; -"630 linalg_vector_norm_7" -> "631 clamp_min_7" [style=solid, label="(16, 6, 64, 1)"]; -"631 clamp_min_7" -> "632 expand_as_7" [style=solid, label="(16, 6, 64, 1)"]; -"632 expand_as_7" -> "633 div_7" [style=solid, label="(16, 6, 64, 32)"]; -"633 div_7" -> "634 transpose_6" [style=solid, label="(16, 6, 64, 32)"]; -"634 transpose_6" -> "635 matmul_6" [style=solid, label="(16, 6, 32, 64)"]; -"635 matmul_6" -> "636 quantize_per_tensor_213" [style=solid, label="(16, 6, 64, 64)"]; -"636 quantize_per_tensor_213" -> "637 dequantize_per_tensor_214" [style=solid, label="(16, 6, 64, 64)"]; -"637 dequantize_per_tensor_214" -> "640 mul_7" [style=solid, label="(16, 6, 64, 64)"]; -"638 _frozen_param34" -> "639 dequantize_per_tensor_215" [style=solid, label="(6, 1, 1)"]; -"639 dequantize_per_tensor_215" -> "640 mul_7" [style=solid, label="(6, 1, 1)"]; -"640 mul_7" -> "641 quantize_per_tensor_216" [style=solid, label="(16, 6, 64, 64)"]; -"641 quantize_per_tensor_216" -> "642 dequantize_per_tensor_217" [style=solid, label="(16, 6, 64, 64)"]; -"642 dequantize_per_tensor_217" -> "643 add_10" [style=solid, label="(16, 6, 64, 64)"]; -"643 add_10" -> "644 quantize_per_tensor_218" [style=solid, label="(16, 6, 64, 64)"]; -"644 quantize_per_tensor_218" -> "645 dequantize_per_tensor_219" [style=solid, label="(16, 6, 64, 64)"]; -"645 dequantize_per_tensor_219" -> "657 view_19" [style=solid, label="(16, 6, 64, 64)"]; -"646 new_zeros_1" -> "647 view_18" [style=solid, label="(32, 32)"]; -"647 view_18" -> "648 permute_17" [style=solid, label="(4, 8, 4, 8)"]; -"648 permute_17" -> "649 reshape_15" [style=solid, label="(4, 4, 8, 8)"]; -"649 reshape_15" -> "650 unsqueeze_8" [style=solid, label="(16, 64)"]; -"649 reshape_15" -> "651 unsqueeze_9" [style=solid, label="(16, 64)"]; -"650 unsqueeze_8" -> "652 sub_1" [style=solid, label="(16, 1, 64)"]; -"651 unsqueeze_9" -> "652 sub_1" [style=solid, label="(16, 64, 1)"]; -"652 sub_1" -> "653 ne_1" [style=solid, label="(16, 64, 64)"]; -"652 sub_1" -> 
"654 masked_fill_2" [style=solid, label="(16, 64, 64)"]; -"652 sub_1" -> "655 eq_1" [style=solid, label="(16, 64, 64)"]; -"653 ne_1" -> "654 masked_fill_2" [style=solid, label="(16, 64, 64)"]; -"654 masked_fill_2" -> "656 masked_fill_3" [style=solid, label="(16, 64, 64)"]; -"655 eq_1" -> "656 masked_fill_3" [style=solid, label="(16, 64, 64)"]; -"656 masked_fill_3" -> "660 unsqueeze_10" [style=solid, label="(16, 64, 64)"]; -"657 view_19" -> "658 quantize_per_tensor_220" [style=solid, label="(1, 16, 6, 64, 64)"]; -"658 quantize_per_tensor_220" -> "659 dequantize_per_tensor_221" [style=solid, label="(1, 16, 6, 64, 64)"]; -"659 dequantize_per_tensor_221" -> "664 add_11" [style=solid, label="(1, 16, 6, 64, 64)"]; -"660 unsqueeze_10" -> "661 unsqueeze_11" [style=solid, label="(16, 1, 64, 64)"]; -"661 unsqueeze_11" -> "662 quantize_per_tensor_222" [style=solid, label="(1, 16, 1, 64, 64)"]; -"662 quantize_per_tensor_222" -> "663 dequantize_per_tensor_223" [style=solid, label="(1, 16, 1, 64, 64)"]; -"663 dequantize_per_tensor_223" -> "664 add_11" [style=solid, label="(1, 16, 1, 64, 64)"]; -"664 add_11" -> "665 quantize_per_tensor_224" [style=solid, label="(1, 16, 6, 64, 64)"]; -"665 quantize_per_tensor_224" -> "666 dequantize_per_tensor_225" [style=solid, label="(1, 16, 6, 64, 64)"]; -"666 dequantize_per_tensor_225" -> "667 view_20" [style=solid, label="(1, 16, 6, 64, 64)"]; -"667 view_20" -> "668 quantize_per_tensor_226" [style=solid, label="(16, 6, 64, 64)"]; -"668 quantize_per_tensor_226" -> "669 dequantize_per_tensor_227" [style=solid, label="(16, 6, 64, 64)"]; -"669 dequantize_per_tensor_227" -> "670 softmax_3" [style=solid, label="(16, 6, 64, 64)"]; -"670 softmax_3" -> "671 dropout_12" [style=solid, label="(16, 6, 64, 64)"]; -"671 dropout_12" -> "672 matmul_7" [style=solid, label="(16, 6, 64, 64)"]; -"672 matmul_7" -> "673 transpose_7" [style=solid, label="(16, 6, 64, 32)"]; -"673 transpose_7" -> "674 reshape_16" [style=solid, label="(16, 64, 6, 32)"]; -"674 
reshape_16" -> "675 reshape_16_0_0_nncf_smooth_quant_0" [style=solid, label="(16, 64, 192)"]; -"675 reshape_16_0_0_nncf_smooth_quant_0" -> "676 quantize_per_tensor_228" [style=solid, label="(16, 64, 192)"]; -"676 quantize_per_tensor_228" -> "677 dequantize_per_tensor_229" [style=solid, label="(16, 64, 192)"]; -"677 dequantize_per_tensor_229" -> "680 linear_22" [style=solid, label="(16, 64, 192)"]; -"678 _frozen_param35" -> "679 dequantize_per_tensor_230" [style=solid, label="(192, 192)"]; -"679 dequantize_per_tensor_230" -> "680 linear_22" [style=solid, label="(192, 192)"]; -"680 linear_22" -> "681 quantize_per_tensor_231" [style=solid, label="(16, 64, 192)"]; -"681 quantize_per_tensor_231" -> "682 dequantize_per_tensor_232" [style=solid, label="(16, 64, 192)"]; -"682 dequantize_per_tensor_232" -> "683 dropout_13" [style=solid, label="(16, 64, 192)"]; -"683 dropout_13" -> "684 view_21" [style=solid, label="(16, 64, 192)"]; -"684 view_21" -> "685 permute_18" [style=solid, label="(1, 4, 4, 8, 8, 192)"]; -"685 permute_18" -> "686 reshape_17" [style=solid, label="(1, 4, 8, 4, 8, 192)"]; -"686 reshape_17" -> "687 roll_3" [style=solid, label="(1, 32, 32, 192)"]; -"687 roll_3" -> "688 slice_61" [style=solid, label="(1, 32, 32, 192)"]; -"688 slice_61" -> "689 slice_62" [style=solid, label="(1, 32, 32, 192)"]; -"689 slice_62" -> "690 slice_63" [style=solid, label="(1, 28, 32, 192)"]; -"690 slice_63" -> "691 slice_64" [style=solid, label="(1, 28, 28, 192)"]; -"691 slice_64" -> "692 contiguous_5" [style=solid, label="(1, 28, 28, 192)"]; -"692 contiguous_5" -> "693 layer_norm_8" [style=solid, label="(1, 28, 28, 192)"]; -"693 layer_norm_8" -> "694 quantize_per_tensor_233" [style=solid, label="(1, 28, 28, 192)"]; -"694 quantize_per_tensor_233" -> "695 dequantize_per_tensor_234" [style=solid, label="(1, 28, 28, 192)"]; -"695 dequantize_per_tensor_234" -> "696 add_12" [style=solid, label="(1, 28, 28, 192)"]; -"696 add_12" -> "697 quantize_per_tensor_235" [style=solid, label="(1, 
28, 28, 192)"]; -"697 quantize_per_tensor_235" -> "698 dequantize_per_tensor_236" [style=solid, label="(1, 28, 28, 192)"]; -"697 quantize_per_tensor_235" -> "699 dequantize_per_tensor_237" [style=solid, label="(1, 28, 28, 192)"]; -"698 dequantize_per_tensor_236" -> "722 add_13" [style=solid, label="(1, 28, 28, 192)"]; -"699 dequantize_per_tensor_237" -> "700 add_12_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 28, 28, 192)"]; -"700 add_12_0_0_nncf_smooth_quant_0" -> "701 quantize_per_tensor_238" [style=solid, label="(1, 28, 28, 192)"]; -"701 quantize_per_tensor_238" -> "702 dequantize_per_tensor_239" [style=solid, label="(1, 28, 28, 192)"]; -"702 dequantize_per_tensor_239" -> "705 linear_23" [style=solid, label="(1, 28, 28, 192)"]; -"703 _frozen_param36" -> "704 dequantize_per_tensor_240" [style=solid, label="(768, 192)"]; -"704 dequantize_per_tensor_240" -> "705 linear_23" [style=solid, label="(768, 192)"]; -"705 linear_23" -> "706 quantize_per_tensor_241" [style=solid, label="(1, 28, 28, 768)"]; -"706 quantize_per_tensor_241" -> "707 dequantize_per_tensor_242" [style=solid, label="(1, 28, 28, 768)"]; -"707 dequantize_per_tensor_242" -> "708 gelu_3" [style=solid, label="(1, 28, 28, 768)"]; -"708 gelu_3" -> "709 dropout_14" [style=solid, label="(1, 28, 28, 768)"]; -"709 dropout_14" -> "710 dropout_14_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 28, 28, 768)"]; -"710 dropout_14_0_0_nncf_smooth_quant_0" -> "711 quantize_per_tensor_243" [style=solid, label="(1, 28, 28, 768)"]; -"711 quantize_per_tensor_243" -> "712 dequantize_per_tensor_244" [style=solid, label="(1, 28, 28, 768)"]; -"712 dequantize_per_tensor_244" -> "715 linear_24" [style=solid, label="(1, 28, 28, 768)"]; -"713 _frozen_param37" -> "714 dequantize_per_tensor_245" [style=solid, label="(192, 768)"]; -"714 dequantize_per_tensor_245" -> "715 linear_24" [style=solid, label="(192, 768)"]; -"715 linear_24" -> "716 quantize_per_tensor_246" [style=solid, label="(1, 28, 28, 192)"]; -"716 
quantize_per_tensor_246" -> "717 dequantize_per_tensor_247" [style=solid, label="(1, 28, 28, 192)"]; -"717 dequantize_per_tensor_247" -> "718 dropout_15" [style=solid, label="(1, 28, 28, 192)"]; -"718 dropout_15" -> "719 layer_norm_9" [style=solid, label="(1, 28, 28, 192)"]; -"719 layer_norm_9" -> "720 quantize_per_tensor_248" [style=solid, label="(1, 28, 28, 192)"]; -"720 quantize_per_tensor_248" -> "721 dequantize_per_tensor_249" [style=solid, label="(1, 28, 28, 192)"]; -"721 dequantize_per_tensor_249" -> "722 add_13" [style=solid, label="(1, 28, 28, 192)"]; -"722 add_13" -> "723 quantize_per_tensor_250" [style=solid, label="(1, 28, 28, 192)"]; -"723 quantize_per_tensor_250" -> "724 dequantize_per_tensor_251" [style=solid, label="(1, 28, 28, 192)"]; -"724 dequantize_per_tensor_251" -> "725 pad_5" [style=solid, label="(1, 28, 28, 192)"]; -"725 pad_5" -> "726 slice_65" [style=solid, label="(1, 28, 28, 192)"]; -"725 pad_5" -> "731 slice_68" [style=solid, label="(1, 28, 28, 192)"]; -"725 pad_5" -> "736 slice_71" [style=solid, label="(1, 28, 28, 192)"]; -"725 pad_5" -> "741 slice_74" [style=solid, label="(1, 28, 28, 192)"]; -"726 slice_65" -> "727 slice_66" [style=solid, label="(1, 14, 28, 192)"]; -"727 slice_66" -> "728 slice_67" [style=solid, label="(1, 14, 14, 192)"]; -"728 slice_67" -> "729 quantize_per_tensor_252" [style=solid, label="(1, 14, 14, 192)"]; -"729 quantize_per_tensor_252" -> "730 dequantize_per_tensor_253" [style=solid, label="(1, 14, 14, 192)"]; -"730 dequantize_per_tensor_253" -> "746 cat_1" [style=solid, label="(1, 14, 14, 192)"]; -"731 slice_68" -> "732 slice_69" [style=solid, label="(1, 14, 28, 192)"]; -"732 slice_69" -> "733 slice_70" [style=solid, label="(1, 14, 14, 192)"]; -"733 slice_70" -> "734 quantize_per_tensor_254" [style=solid, label="(1, 14, 14, 192)"]; -"734 quantize_per_tensor_254" -> "735 dequantize_per_tensor_255" [style=solid, label="(1, 14, 14, 192)"]; -"735 dequantize_per_tensor_255" -> "746 cat_1" [style=solid, label="(1, 14, 
14, 192)"]; -"736 slice_71" -> "737 slice_72" [style=solid, label="(1, 14, 28, 192)"]; -"737 slice_72" -> "738 slice_73" [style=solid, label="(1, 14, 14, 192)"]; -"738 slice_73" -> "739 quantize_per_tensor_256" [style=solid, label="(1, 14, 14, 192)"]; -"739 quantize_per_tensor_256" -> "740 dequantize_per_tensor_257" [style=solid, label="(1, 14, 14, 192)"]; -"740 dequantize_per_tensor_257" -> "746 cat_1" [style=solid, label="(1, 14, 14, 192)"]; -"741 slice_74" -> "742 slice_75" [style=solid, label="(1, 14, 28, 192)"]; -"742 slice_75" -> "743 slice_76" [style=solid, label="(1, 14, 14, 192)"]; -"743 slice_76" -> "744 quantize_per_tensor_258" [style=solid, label="(1, 14, 14, 192)"]; -"744 quantize_per_tensor_258" -> "745 dequantize_per_tensor_259" [style=solid, label="(1, 14, 14, 192)"]; -"745 dequantize_per_tensor_259" -> "746 cat_1" [style=solid, label="(1, 14, 14, 192)"]; -"746 cat_1" -> "747 quantize_per_tensor_260" [style=solid, label="(1, 14, 14, 768)"]; -"747 quantize_per_tensor_260" -> "748 dequantize_per_tensor_261" [style=solid, label="(1, 14, 14, 768)"]; -"748 dequantize_per_tensor_261" -> "749 cat_1_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 768)"]; -"749 cat_1_0_0_nncf_smooth_quant_0" -> "750 quantize_per_tensor_262" [style=solid, label="(1, 14, 14, 768)"]; -"750 quantize_per_tensor_262" -> "751 dequantize_per_tensor_263" [style=solid, label="(1, 14, 14, 768)"]; -"751 dequantize_per_tensor_263" -> "754 linear_25" [style=solid, label="(1, 14, 14, 768)"]; -"752 _frozen_param38" -> "753 dequantize_per_tensor_264" [style=solid, label="(384, 768)"]; -"753 dequantize_per_tensor_264" -> "754 linear_25" [style=solid, label="(384, 768)"]; -"754 linear_25" -> "755 quantize_per_tensor_265" [style=solid, label="(1, 14, 14, 384)"]; -"755 quantize_per_tensor_265" -> "756 dequantize_per_tensor_266" [style=solid, label="(1, 14, 14, 384)"]; -"756 dequantize_per_tensor_266" -> "757 layer_norm_10" [style=solid, label="(1, 14, 14, 384)"]; -"757 layer_norm_10" 
-> "790 pad_6" [style=solid, label="(1, 14, 14, 384)"]; -"757 layer_norm_10" -> "853 quantize_per_tensor_302" [style=solid, label="(1, 14, 14, 384)"]; -"758 _frozen_param39" -> "759 dequantize_per_tensor_267" [style=solid, label="(1, 15, 15, 2)"]; -"759 dequantize_per_tensor_267" -> "762 linear_26" [style=solid, label="(1, 15, 15, 2)"]; -"760 _frozen_param40" -> "761 dequantize_per_tensor_268" [style=solid, label="(512, 2)"]; -"761 dequantize_per_tensor_268" -> "762 linear_26" [style=solid, label="(512, 2)"]; -"762 linear_26" -> "763 relu__4" [style=solid, label="(1, 15, 15, 512)"]; -"763 relu__4" -> "764 quantize_per_tensor_269" [style=solid, label="(1, 15, 15, 512)"]; -"764 quantize_per_tensor_269" -> "765 dequantize_per_tensor_270" [style=solid, label="(1, 15, 15, 512)"]; -"765 dequantize_per_tensor_270" -> "766 relu__4_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 15, 15, 512)"]; -"766 relu__4_0_0_nncf_smooth_quant_0" -> "767 quantize_per_tensor_271" [style=solid, label="(1, 15, 15, 512)"]; -"767 quantize_per_tensor_271" -> "768 dequantize_per_tensor_272" [style=solid, label="(1, 15, 15, 512)"]; -"768 dequantize_per_tensor_272" -> "771 linear_27" [style=solid, label="(1, 15, 15, 512)"]; -"769 _frozen_param41" -> "770 dequantize_per_tensor_273" [style=solid, label="(12, 512)"]; -"770 dequantize_per_tensor_273" -> "771 linear_27" [style=solid, label="(12, 512)"]; -"771 linear_27" -> "772 quantize_per_tensor_274" [style=solid, label="(1, 15, 15, 12)"]; -"772 quantize_per_tensor_274" -> "773 dequantize_per_tensor_275" [style=solid, label="(1, 15, 15, 12)"]; -"773 dequantize_per_tensor_275" -> "774 view_22" [style=solid, label="(1, 15, 15, 12)"]; -"774 view_22" -> "775 quantize_per_tensor_276" [style=solid, label="(225, 12)"]; -"775 quantize_per_tensor_276" -> "776 dequantize_per_tensor_277" [style=solid, label="(225, 12)"]; -"776 dequantize_per_tensor_277" -> "777 index_4" [style=solid, label="(225, 12)"]; -"777 index_4" -> "778 view_23" [style=solid, 
label="(4096, 12)"]; -"778 view_23" -> "779 permute_19" [style=solid, label="(64, 64, 12)"]; -"779 permute_19" -> "780 contiguous_6" [style=solid, label="(12, 64, 64)"]; -"780 contiguous_6" -> "781 unsqueeze_12" [style=solid, label="(12, 64, 64)"]; -"781 unsqueeze_12" -> "782 sigmoid_4" [style=solid, label="(1, 12, 64, 64)"]; -"782 sigmoid_4" -> "783 quantize_per_tensor_278" [style=solid, label="(1, 12, 64, 64)"]; -"783 quantize_per_tensor_278" -> "784 dequantize_per_tensor_279" [style=solid, label="(1, 12, 64, 64)"]; -"784 dequantize_per_tensor_279" -> "787 mul_8" [style=solid, label="(1, 12, 64, 64)"]; -"785 _frozen_param42" -> "786 dequantize_per_tensor_280" [style=solid, label="()"]; -"786 dequantize_per_tensor_280" -> "787 mul_8" [style=solid, label="()"]; -"787 mul_8" -> "788 quantize_per_tensor_281" [style=solid, label="(1, 12, 64, 64)"]; -"788 quantize_per_tensor_281" -> "789 dequantize_per_tensor_282" [style=solid, label="(1, 12, 64, 64)"]; -"789 dequantize_per_tensor_282" -> "825 add_14" [style=solid, label="(1, 12, 64, 64)"]; -"790 pad_6" -> "791 view_24" [style=solid, label="(1, 16, 16, 384)"]; -"791 view_24" -> "792 permute_20" [style=solid, label="(1, 2, 8, 2, 8, 384)"]; -"792 permute_20" -> "793 reshape_18" [style=solid, label="(1, 2, 2, 8, 8, 384)"]; -"793 reshape_18" -> "795 reshape_18_0_0_nncf_smooth_quant_0" [style=solid, label="(4, 64, 384)"]; -"794 clone_4" -> "800 linear_28" [style=solid, label="(1152,)"]; -"795 reshape_18_0_0_nncf_smooth_quant_0" -> "796 quantize_per_tensor_283" [style=solid, label="(4, 64, 384)"]; -"796 quantize_per_tensor_283" -> "797 dequantize_per_tensor_284" [style=solid, label="(4, 64, 384)"]; -"797 dequantize_per_tensor_284" -> "800 linear_28" [style=solid, label="(4, 64, 384)"]; -"798 _frozen_param43" -> "799 dequantize_per_tensor_285" [style=solid, label="(1152, 384)"]; -"799 dequantize_per_tensor_285" -> "800 linear_28" [style=solid, label="(1152, 384)"]; -"800 linear_28" -> "801 quantize_per_tensor_286" 
[style=solid, label="(4, 64, 1152)"]; -"801 quantize_per_tensor_286" -> "802 dequantize_per_tensor_287" [style=solid, label="(4, 64, 1152)"]; -"802 dequantize_per_tensor_287" -> "803 reshape_19" [style=solid, label="(4, 64, 1152)"]; -"803 reshape_19" -> "804 permute_21" [style=solid, label="(4, 64, 3, 12, 32)"]; -"804 permute_21" -> "805 select_12" [style=solid, label="(3, 4, 12, 64, 32)"]; -"804 permute_21" -> "806 select_13" [style=solid, label="(3, 4, 12, 64, 32)"]; -"804 permute_21" -> "807 select_14" [style=solid, label="(3, 4, 12, 64, 32)"]; -"805 select_12" -> "808 linalg_vector_norm_8" [style=solid, label="(4, 12, 64, 32)"]; -"805 select_12" -> "810 expand_as_8" [style=solid, label="(4, 12, 64, 32)"]; -"805 select_12" -> "811 div_8" [style=solid, label="(4, 12, 64, 32)"]; -"806 select_13" -> "812 linalg_vector_norm_9" [style=solid, label="(4, 12, 64, 32)"]; -"806 select_13" -> "814 expand_as_9" [style=solid, label="(4, 12, 64, 32)"]; -"806 select_13" -> "815 div_9" [style=solid, label="(4, 12, 64, 32)"]; -"807 select_14" -> "830 matmul_9" [style=solid, label="(4, 12, 64, 32)"]; -"808 linalg_vector_norm_8" -> "809 clamp_min_8" [style=solid, label="(4, 12, 64, 1)"]; -"809 clamp_min_8" -> "810 expand_as_8" [style=solid, label="(4, 12, 64, 1)"]; -"810 expand_as_8" -> "811 div_8" [style=solid, label="(4, 12, 64, 32)"]; -"811 div_8" -> "817 matmul_8" [style=solid, label="(4, 12, 64, 32)"]; -"812 linalg_vector_norm_9" -> "813 clamp_min_9" [style=solid, label="(4, 12, 64, 1)"]; -"813 clamp_min_9" -> "814 expand_as_9" [style=solid, label="(4, 12, 64, 1)"]; -"814 expand_as_9" -> "815 div_9" [style=solid, label="(4, 12, 64, 32)"]; -"815 div_9" -> "816 transpose_8" [style=solid, label="(4, 12, 64, 32)"]; -"816 transpose_8" -> "817 matmul_8" [style=solid, label="(4, 12, 32, 64)"]; -"817 matmul_8" -> "818 quantize_per_tensor_288" [style=solid, label="(4, 12, 64, 64)"]; -"818 quantize_per_tensor_288" -> "819 dequantize_per_tensor_289" [style=solid, label="(4, 12, 64, 
64)"]; -"819 dequantize_per_tensor_289" -> "822 mul_9" [style=solid, label="(4, 12, 64, 64)"]; -"820 _frozen_param44" -> "821 dequantize_per_tensor_290" [style=solid, label="(12, 1, 1)"]; -"821 dequantize_per_tensor_290" -> "822 mul_9" [style=solid, label="(12, 1, 1)"]; -"822 mul_9" -> "823 quantize_per_tensor_291" [style=solid, label="(4, 12, 64, 64)"]; -"823 quantize_per_tensor_291" -> "824 dequantize_per_tensor_292" [style=solid, label="(4, 12, 64, 64)"]; -"824 dequantize_per_tensor_292" -> "825 add_14" [style=solid, label="(4, 12, 64, 64)"]; -"825 add_14" -> "826 quantize_per_tensor_293" [style=solid, label="(4, 12, 64, 64)"]; -"826 quantize_per_tensor_293" -> "827 dequantize_per_tensor_294" [style=solid, label="(4, 12, 64, 64)"]; -"827 dequantize_per_tensor_294" -> "828 softmax_4" [style=solid, label="(4, 12, 64, 64)"]; -"828 softmax_4" -> "829 dropout_16" [style=solid, label="(4, 12, 64, 64)"]; -"829 dropout_16" -> "830 matmul_9" [style=solid, label="(4, 12, 64, 64)"]; -"830 matmul_9" -> "831 transpose_9" [style=solid, label="(4, 12, 64, 32)"]; -"831 transpose_9" -> "832 reshape_20" [style=solid, label="(4, 64, 12, 32)"]; -"832 reshape_20" -> "833 reshape_20_0_0_nncf_smooth_quant_0" [style=solid, label="(4, 64, 384)"]; -"833 reshape_20_0_0_nncf_smooth_quant_0" -> "834 quantize_per_tensor_295" [style=solid, label="(4, 64, 384)"]; -"834 quantize_per_tensor_295" -> "835 dequantize_per_tensor_296" [style=solid, label="(4, 64, 384)"]; -"835 dequantize_per_tensor_296" -> "838 linear_29" [style=solid, label="(4, 64, 384)"]; -"836 _frozen_param45" -> "837 dequantize_per_tensor_297" [style=solid, label="(384, 384)"]; -"837 dequantize_per_tensor_297" -> "838 linear_29" [style=solid, label="(384, 384)"]; -"838 linear_29" -> "839 quantize_per_tensor_298" [style=solid, label="(4, 64, 384)"]; -"839 quantize_per_tensor_298" -> "840 dequantize_per_tensor_299" [style=solid, label="(4, 64, 384)"]; -"840 dequantize_per_tensor_299" -> "841 dropout_17" [style=solid, label="(4, 
64, 384)"]; -"841 dropout_17" -> "842 view_25" [style=solid, label="(4, 64, 384)"]; -"842 view_25" -> "843 permute_22" [style=solid, label="(1, 2, 2, 8, 8, 384)"]; -"843 permute_22" -> "844 reshape_21" [style=solid, label="(1, 2, 8, 2, 8, 384)"]; -"844 reshape_21" -> "845 slice_78" [style=solid, label="(1, 16, 16, 384)"]; -"845 slice_78" -> "846 slice_79" [style=solid, label="(1, 16, 16, 384)"]; -"846 slice_79" -> "847 slice_80" [style=solid, label="(1, 14, 16, 384)"]; -"847 slice_80" -> "848 slice_81" [style=solid, label="(1, 14, 14, 384)"]; -"848 slice_81" -> "849 contiguous_7" [style=solid, label="(1, 14, 14, 384)"]; -"849 contiguous_7" -> "850 layer_norm_11" [style=solid, label="(1, 14, 14, 384)"]; -"850 layer_norm_11" -> "851 quantize_per_tensor_300" [style=solid, label="(1, 14, 14, 384)"]; -"851 quantize_per_tensor_300" -> "852 dequantize_per_tensor_301" [style=solid, label="(1, 14, 14, 384)"]; -"852 dequantize_per_tensor_301" -> "855 add_15" [style=solid, label="(1, 14, 14, 384)"]; -"853 quantize_per_tensor_302" -> "854 dequantize_per_tensor_303" [style=solid, label="(1, 14, 14, 384)"]; -"854 dequantize_per_tensor_303" -> "855 add_15" [style=solid, label="(1, 14, 14, 384)"]; -"855 add_15" -> "856 quantize_per_tensor_304" [style=solid, label="(1, 14, 14, 384)"]; -"856 quantize_per_tensor_304" -> "857 dequantize_per_tensor_305" [style=solid, label="(1, 14, 14, 384)"]; -"856 quantize_per_tensor_304" -> "858 dequantize_per_tensor_306" [style=solid, label="(1, 14, 14, 384)"]; -"857 dequantize_per_tensor_305" -> "881 add_16" [style=solid, label="(1, 14, 14, 384)"]; -"858 dequantize_per_tensor_306" -> "859 add_15_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 384)"]; -"859 add_15_0_0_nncf_smooth_quant_0" -> "860 quantize_per_tensor_307" [style=solid, label="(1, 14, 14, 384)"]; -"860 quantize_per_tensor_307" -> "861 dequantize_per_tensor_308" [style=solid, label="(1, 14, 14, 384)"]; -"861 dequantize_per_tensor_308" -> "864 linear_30" [style=solid, 
label="(1, 14, 14, 384)"]; -"862 _frozen_param46" -> "863 dequantize_per_tensor_309" [style=solid, label="(1536, 384)"]; -"863 dequantize_per_tensor_309" -> "864 linear_30" [style=solid, label="(1536, 384)"]; -"864 linear_30" -> "865 quantize_per_tensor_310" [style=solid, label="(1, 14, 14, 1536)"]; -"865 quantize_per_tensor_310" -> "866 dequantize_per_tensor_311" [style=solid, label="(1, 14, 14, 1536)"]; -"866 dequantize_per_tensor_311" -> "867 gelu_4" [style=solid, label="(1, 14, 14, 1536)"]; -"867 gelu_4" -> "868 dropout_18" [style=solid, label="(1, 14, 14, 1536)"]; -"868 dropout_18" -> "869 dropout_18_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 1536)"]; -"869 dropout_18_0_0_nncf_smooth_quant_0" -> "870 quantize_per_tensor_312" [style=solid, label="(1, 14, 14, 1536)"]; -"870 quantize_per_tensor_312" -> "871 dequantize_per_tensor_313" [style=solid, label="(1, 14, 14, 1536)"]; -"871 dequantize_per_tensor_313" -> "874 linear_31" [style=solid, label="(1, 14, 14, 1536)"]; -"872 _frozen_param47" -> "873 dequantize_per_tensor_314" [style=solid, label="(384, 1536)"]; -"873 dequantize_per_tensor_314" -> "874 linear_31" [style=solid, label="(384, 1536)"]; -"874 linear_31" -> "875 quantize_per_tensor_315" [style=solid, label="(1, 14, 14, 384)"]; -"875 quantize_per_tensor_315" -> "876 dequantize_per_tensor_316" [style=solid, label="(1, 14, 14, 384)"]; -"876 dequantize_per_tensor_316" -> "877 dropout_19" [style=solid, label="(1, 14, 14, 384)"]; -"877 dropout_19" -> "878 layer_norm_12" [style=solid, label="(1, 14, 14, 384)"]; -"878 layer_norm_12" -> "879 quantize_per_tensor_317" [style=solid, label="(1, 14, 14, 384)"]; -"879 quantize_per_tensor_317" -> "880 dequantize_per_tensor_318" [style=solid, label="(1, 14, 14, 384)"]; -"880 dequantize_per_tensor_318" -> "881 add_16" [style=solid, label="(1, 14, 14, 384)"]; -"881 add_16" -> "882 quantize_per_tensor_319" [style=solid, label="(1, 14, 14, 384)"]; -"882 quantize_per_tensor_319" -> "883 
dequantize_per_tensor_320" [style=solid, label="(1, 14, 14, 384)"]; -"882 quantize_per_tensor_319" -> "884 dequantize_per_tensor_321" [style=solid, label="(1, 14, 14, 384)"]; -"883 dequantize_per_tensor_320" -> "1006 add_19" [style=solid, label="(1, 14, 14, 384)"]; -"884 dequantize_per_tensor_321" -> "917 pad_7" [style=solid, label="(1, 14, 14, 384)"]; -"885 _frozen_param48" -> "886 dequantize_per_tensor_322" [style=solid, label="(1, 15, 15, 2)"]; -"886 dequantize_per_tensor_322" -> "889 linear_32" [style=solid, label="(1, 15, 15, 2)"]; -"887 _frozen_param49" -> "888 dequantize_per_tensor_323" [style=solid, label="(512, 2)"]; -"888 dequantize_per_tensor_323" -> "889 linear_32" [style=solid, label="(512, 2)"]; -"889 linear_32" -> "890 relu__5" [style=solid, label="(1, 15, 15, 512)"]; -"890 relu__5" -> "891 quantize_per_tensor_324" [style=solid, label="(1, 15, 15, 512)"]; -"891 quantize_per_tensor_324" -> "892 dequantize_per_tensor_325" [style=solid, label="(1, 15, 15, 512)"]; -"892 dequantize_per_tensor_325" -> "893 relu__5_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 15, 15, 512)"]; -"893 relu__5_0_0_nncf_smooth_quant_0" -> "894 quantize_per_tensor_326" [style=solid, label="(1, 15, 15, 512)"]; -"894 quantize_per_tensor_326" -> "895 dequantize_per_tensor_327" [style=solid, label="(1, 15, 15, 512)"]; -"895 dequantize_per_tensor_327" -> "898 linear_33" [style=solid, label="(1, 15, 15, 512)"]; -"896 _frozen_param50" -> "897 dequantize_per_tensor_328" [style=solid, label="(12, 512)"]; -"897 dequantize_per_tensor_328" -> "898 linear_33" [style=solid, label="(12, 512)"]; -"898 linear_33" -> "899 quantize_per_tensor_329" [style=solid, label="(1, 15, 15, 12)"]; -"899 quantize_per_tensor_329" -> "900 dequantize_per_tensor_330" [style=solid, label="(1, 15, 15, 12)"]; -"900 dequantize_per_tensor_330" -> "901 view_26" [style=solid, label="(1, 15, 15, 12)"]; -"901 view_26" -> "902 quantize_per_tensor_331" [style=solid, label="(225, 12)"]; -"902 quantize_per_tensor_331" -> 
"903 dequantize_per_tensor_332" [style=solid, label="(225, 12)"]; -"903 dequantize_per_tensor_332" -> "904 index_5" [style=solid, label="(225, 12)"]; -"904 index_5" -> "905 view_27" [style=solid, label="(4096, 12)"]; -"905 view_27" -> "906 permute_23" [style=solid, label="(64, 64, 12)"]; -"906 permute_23" -> "907 contiguous_8" [style=solid, label="(12, 64, 64)"]; -"907 contiguous_8" -> "908 unsqueeze_13" [style=solid, label="(12, 64, 64)"]; -"908 unsqueeze_13" -> "909 sigmoid_5" [style=solid, label="(1, 12, 64, 64)"]; -"909 sigmoid_5" -> "910 quantize_per_tensor_333" [style=solid, label="(1, 12, 64, 64)"]; -"910 quantize_per_tensor_333" -> "911 dequantize_per_tensor_334" [style=solid, label="(1, 12, 64, 64)"]; -"911 dequantize_per_tensor_334" -> "914 mul_10" [style=solid, label="(1, 12, 64, 64)"]; -"912 _frozen_param51" -> "913 dequantize_per_tensor_335" [style=solid, label="()"]; -"913 dequantize_per_tensor_335" -> "914 mul_10" [style=solid, label="()"]; -"914 mul_10" -> "915 quantize_per_tensor_336" [style=solid, label="(1, 12, 64, 64)"]; -"915 quantize_per_tensor_336" -> "916 dequantize_per_tensor_337" [style=solid, label="(1, 12, 64, 64)"]; -"916 dequantize_per_tensor_337" -> "953 add_17" [style=solid, label="(1, 12, 64, 64)"]; -"917 pad_7" -> "918 roll_4" [style=solid, label="(1, 16, 16, 384)"]; -"918 roll_4" -> "919 view_28" [style=solid, label="(1, 16, 16, 384)"]; -"919 view_28" -> "920 permute_24" [style=solid, label="(1, 2, 8, 2, 8, 384)"]; -"920 permute_24" -> "921 reshape_22" [style=solid, label="(1, 2, 2, 8, 8, 384)"]; -"921 reshape_22" -> "923 reshape_22_0_0_nncf_smooth_quant_0" [style=solid, label="(4, 64, 384)"]; -"921 reshape_22" -> "956 new_zeros_2" [style=solid, label="(4, 64, 384)"]; -"922 clone_5" -> "928 linear_34" [style=solid, label="(1152,)"]; -"923 reshape_22_0_0_nncf_smooth_quant_0" -> "924 quantize_per_tensor_338" [style=solid, label="(4, 64, 384)"]; -"924 quantize_per_tensor_338" -> "925 dequantize_per_tensor_339" [style=solid, 
label="(4, 64, 384)"]; -"925 dequantize_per_tensor_339" -> "928 linear_34" [style=solid, label="(4, 64, 384)"]; -"926 _frozen_param52" -> "927 dequantize_per_tensor_340" [style=solid, label="(1152, 384)"]; -"927 dequantize_per_tensor_340" -> "928 linear_34" [style=solid, label="(1152, 384)"]; -"928 linear_34" -> "929 quantize_per_tensor_341" [style=solid, label="(4, 64, 1152)"]; -"929 quantize_per_tensor_341" -> "930 dequantize_per_tensor_342" [style=solid, label="(4, 64, 1152)"]; -"930 dequantize_per_tensor_342" -> "931 reshape_23" [style=solid, label="(4, 64, 1152)"]; -"931 reshape_23" -> "932 permute_25" [style=solid, label="(4, 64, 3, 12, 32)"]; -"932 permute_25" -> "933 select_15" [style=solid, label="(3, 4, 12, 64, 32)"]; -"932 permute_25" -> "934 select_16" [style=solid, label="(3, 4, 12, 64, 32)"]; -"932 permute_25" -> "935 select_17" [style=solid, label="(3, 4, 12, 64, 32)"]; -"933 select_15" -> "936 linalg_vector_norm_10" [style=solid, label="(4, 12, 64, 32)"]; -"933 select_15" -> "938 expand_as_10" [style=solid, label="(4, 12, 64, 32)"]; -"933 select_15" -> "939 div_10" [style=solid, label="(4, 12, 64, 32)"]; -"934 select_16" -> "940 linalg_vector_norm_11" [style=solid, label="(4, 12, 64, 32)"]; -"934 select_16" -> "942 expand_as_11" [style=solid, label="(4, 12, 64, 32)"]; -"934 select_16" -> "943 div_11" [style=solid, label="(4, 12, 64, 32)"]; -"935 select_17" -> "982 matmul_11" [style=solid, label="(4, 12, 64, 32)"]; -"936 linalg_vector_norm_10" -> "937 clamp_min_10" [style=solid, label="(4, 12, 64, 1)"]; -"937 clamp_min_10" -> "938 expand_as_10" [style=solid, label="(4, 12, 64, 1)"]; -"938 expand_as_10" -> "939 div_10" [style=solid, label="(4, 12, 64, 32)"]; -"939 div_10" -> "945 matmul_10" [style=solid, label="(4, 12, 64, 32)"]; -"940 linalg_vector_norm_11" -> "941 clamp_min_11" [style=solid, label="(4, 12, 64, 1)"]; -"941 clamp_min_11" -> "942 expand_as_11" [style=solid, label="(4, 12, 64, 1)"]; -"942 expand_as_11" -> "943 div_11" [style=solid, 
label="(4, 12, 64, 32)"]; -"943 div_11" -> "944 transpose_10" [style=solid, label="(4, 12, 64, 32)"]; -"944 transpose_10" -> "945 matmul_10" [style=solid, label="(4, 12, 32, 64)"]; -"945 matmul_10" -> "946 quantize_per_tensor_343" [style=solid, label="(4, 12, 64, 64)"]; -"946 quantize_per_tensor_343" -> "947 dequantize_per_tensor_344" [style=solid, label="(4, 12, 64, 64)"]; -"947 dequantize_per_tensor_344" -> "950 mul_11" [style=solid, label="(4, 12, 64, 64)"]; -"948 _frozen_param53" -> "949 dequantize_per_tensor_345" [style=solid, label="(12, 1, 1)"]; -"949 dequantize_per_tensor_345" -> "950 mul_11" [style=solid, label="(12, 1, 1)"]; -"950 mul_11" -> "951 quantize_per_tensor_346" [style=solid, label="(4, 12, 64, 64)"]; -"951 quantize_per_tensor_346" -> "952 dequantize_per_tensor_347" [style=solid, label="(4, 12, 64, 64)"]; -"952 dequantize_per_tensor_347" -> "953 add_17" [style=solid, label="(4, 12, 64, 64)"]; -"953 add_17" -> "954 quantize_per_tensor_348" [style=solid, label="(4, 12, 64, 64)"]; -"954 quantize_per_tensor_348" -> "955 dequantize_per_tensor_349" [style=solid, label="(4, 12, 64, 64)"]; -"955 dequantize_per_tensor_349" -> "967 view_30" [style=solid, label="(4, 12, 64, 64)"]; -"956 new_zeros_2" -> "957 view_29" [style=solid, label="(16, 16)"]; -"957 view_29" -> "958 permute_26" [style=solid, label="(2, 8, 2, 8)"]; -"958 permute_26" -> "959 reshape_24" [style=solid, label="(2, 2, 8, 8)"]; -"959 reshape_24" -> "960 unsqueeze_14" [style=solid, label="(4, 64)"]; -"959 reshape_24" -> "961 unsqueeze_15" [style=solid, label="(4, 64)"]; -"960 unsqueeze_14" -> "962 sub_2" [style=solid, label="(4, 1, 64)"]; -"961 unsqueeze_15" -> "962 sub_2" [style=solid, label="(4, 64, 1)"]; -"962 sub_2" -> "963 ne_2" [style=solid, label="(4, 64, 64)"]; -"962 sub_2" -> "964 masked_fill_4" [style=solid, label="(4, 64, 64)"]; -"962 sub_2" -> "965 eq_2" [style=solid, label="(4, 64, 64)"]; -"963 ne_2" -> "964 masked_fill_4" [style=solid, label="(4, 64, 64)"]; -"964 masked_fill_4" 
-> "966 masked_fill_5" [style=solid, label="(4, 64, 64)"]; -"965 eq_2" -> "966 masked_fill_5" [style=solid, label="(4, 64, 64)"]; -"966 masked_fill_5" -> "970 unsqueeze_16" [style=solid, label="(4, 64, 64)"]; -"967 view_30" -> "968 quantize_per_tensor_350" [style=solid, label="(1, 4, 12, 64, 64)"]; -"968 quantize_per_tensor_350" -> "969 dequantize_per_tensor_351" [style=solid, label="(1, 4, 12, 64, 64)"]; -"969 dequantize_per_tensor_351" -> "974 add_18" [style=solid, label="(1, 4, 12, 64, 64)"]; -"970 unsqueeze_16" -> "971 unsqueeze_17" [style=solid, label="(4, 1, 64, 64)"]; -"971 unsqueeze_17" -> "972 quantize_per_tensor_352" [style=solid, label="(1, 4, 1, 64, 64)"]; -"972 quantize_per_tensor_352" -> "973 dequantize_per_tensor_353" [style=solid, label="(1, 4, 1, 64, 64)"]; -"973 dequantize_per_tensor_353" -> "974 add_18" [style=solid, label="(1, 4, 1, 64, 64)"]; -"974 add_18" -> "975 quantize_per_tensor_354" [style=solid, label="(1, 4, 12, 64, 64)"]; -"975 quantize_per_tensor_354" -> "976 dequantize_per_tensor_355" [style=solid, label="(1, 4, 12, 64, 64)"]; -"976 dequantize_per_tensor_355" -> "977 view_31" [style=solid, label="(1, 4, 12, 64, 64)"]; -"977 view_31" -> "978 quantize_per_tensor_356" [style=solid, label="(4, 12, 64, 64)"]; -"978 quantize_per_tensor_356" -> "979 dequantize_per_tensor_357" [style=solid, label="(4, 12, 64, 64)"]; -"979 dequantize_per_tensor_357" -> "980 softmax_5" [style=solid, label="(4, 12, 64, 64)"]; -"980 softmax_5" -> "981 dropout_20" [style=solid, label="(4, 12, 64, 64)"]; -"981 dropout_20" -> "982 matmul_11" [style=solid, label="(4, 12, 64, 64)"]; -"982 matmul_11" -> "983 transpose_11" [style=solid, label="(4, 12, 64, 32)"]; -"983 transpose_11" -> "984 reshape_25" [style=solid, label="(4, 64, 12, 32)"]; -"984 reshape_25" -> "985 reshape_25_0_0_nncf_smooth_quant_0" [style=solid, label="(4, 64, 384)"]; -"985 reshape_25_0_0_nncf_smooth_quant_0" -> "986 quantize_per_tensor_358" [style=solid, label="(4, 64, 384)"]; -"986 
quantize_per_tensor_358" -> "987 dequantize_per_tensor_359" [style=solid, label="(4, 64, 384)"]; -"987 dequantize_per_tensor_359" -> "990 linear_35" [style=solid, label="(4, 64, 384)"]; -"988 _frozen_param54" -> "989 dequantize_per_tensor_360" [style=solid, label="(384, 384)"]; -"989 dequantize_per_tensor_360" -> "990 linear_35" [style=solid, label="(384, 384)"]; -"990 linear_35" -> "991 quantize_per_tensor_361" [style=solid, label="(4, 64, 384)"]; -"991 quantize_per_tensor_361" -> "992 dequantize_per_tensor_362" [style=solid, label="(4, 64, 384)"]; -"992 dequantize_per_tensor_362" -> "993 dropout_21" [style=solid, label="(4, 64, 384)"]; -"993 dropout_21" -> "994 view_32" [style=solid, label="(4, 64, 384)"]; -"994 view_32" -> "995 permute_27" [style=solid, label="(1, 2, 2, 8, 8, 384)"]; -"995 permute_27" -> "996 reshape_26" [style=solid, label="(1, 2, 8, 2, 8, 384)"]; -"996 reshape_26" -> "997 roll_5" [style=solid, label="(1, 16, 16, 384)"]; -"997 roll_5" -> "998 slice_101" [style=solid, label="(1, 16, 16, 384)"]; -"998 slice_101" -> "999 slice_102" [style=solid, label="(1, 16, 16, 384)"]; -"999 slice_102" -> "1000 slice_103" [style=solid, label="(1, 14, 16, 384)"]; -"1000 slice_103" -> "1001 slice_104" [style=solid, label="(1, 14, 14, 384)"]; -"1001 slice_104" -> "1002 contiguous_9" [style=solid, label="(1, 14, 14, 384)"]; -"1002 contiguous_9" -> "1003 layer_norm_13" [style=solid, label="(1, 14, 14, 384)"]; -"1003 layer_norm_13" -> "1004 quantize_per_tensor_363" [style=solid, label="(1, 14, 14, 384)"]; -"1004 quantize_per_tensor_363" -> "1005 dequantize_per_tensor_364" [style=solid, label="(1, 14, 14, 384)"]; -"1005 dequantize_per_tensor_364" -> "1006 add_19" [style=solid, label="(1, 14, 14, 384)"]; -"1006 add_19" -> "1007 quantize_per_tensor_365" [style=solid, label="(1, 14, 14, 384)"]; -"1007 quantize_per_tensor_365" -> "1008 dequantize_per_tensor_366" [style=solid, label="(1, 14, 14, 384)"]; -"1007 quantize_per_tensor_365" -> "1009 dequantize_per_tensor_367" 
[style=solid, label="(1, 14, 14, 384)"]; -"1008 dequantize_per_tensor_366" -> "1032 add_20" [style=solid, label="(1, 14, 14, 384)"]; -"1009 dequantize_per_tensor_367" -> "1010 add_19_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 384)"]; -"1010 add_19_0_0_nncf_smooth_quant_0" -> "1011 quantize_per_tensor_368" [style=solid, label="(1, 14, 14, 384)"]; -"1011 quantize_per_tensor_368" -> "1012 dequantize_per_tensor_369" [style=solid, label="(1, 14, 14, 384)"]; -"1012 dequantize_per_tensor_369" -> "1015 linear_36" [style=solid, label="(1, 14, 14, 384)"]; -"1013 _frozen_param55" -> "1014 dequantize_per_tensor_370" [style=solid, label="(1536, 384)"]; -"1014 dequantize_per_tensor_370" -> "1015 linear_36" [style=solid, label="(1536, 384)"]; -"1015 linear_36" -> "1016 quantize_per_tensor_371" [style=solid, label="(1, 14, 14, 1536)"]; -"1016 quantize_per_tensor_371" -> "1017 dequantize_per_tensor_372" [style=solid, label="(1, 14, 14, 1536)"]; -"1017 dequantize_per_tensor_372" -> "1018 gelu_5" [style=solid, label="(1, 14, 14, 1536)"]; -"1018 gelu_5" -> "1019 dropout_22" [style=solid, label="(1, 14, 14, 1536)"]; -"1019 dropout_22" -> "1020 dropout_22_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 1536)"]; -"1020 dropout_22_0_0_nncf_smooth_quant_0" -> "1021 quantize_per_tensor_373" [style=solid, label="(1, 14, 14, 1536)"]; -"1021 quantize_per_tensor_373" -> "1022 dequantize_per_tensor_374" [style=solid, label="(1, 14, 14, 1536)"]; -"1022 dequantize_per_tensor_374" -> "1025 linear_37" [style=solid, label="(1, 14, 14, 1536)"]; -"1023 _frozen_param56" -> "1024 dequantize_per_tensor_375" [style=solid, label="(384, 1536)"]; -"1024 dequantize_per_tensor_375" -> "1025 linear_37" [style=solid, label="(384, 1536)"]; -"1025 linear_37" -> "1026 quantize_per_tensor_376" [style=solid, label="(1, 14, 14, 384)"]; -"1026 quantize_per_tensor_376" -> "1027 dequantize_per_tensor_377" [style=solid, label="(1, 14, 14, 384)"]; -"1027 dequantize_per_tensor_377" -> "1028 
dropout_23" [style=solid, label="(1, 14, 14, 384)"]; -"1028 dropout_23" -> "1029 layer_norm_14" [style=solid, label="(1, 14, 14, 384)"]; -"1029 layer_norm_14" -> "1030 quantize_per_tensor_378" [style=solid, label="(1, 14, 14, 384)"]; -"1030 quantize_per_tensor_378" -> "1031 dequantize_per_tensor_379" [style=solid, label="(1, 14, 14, 384)"]; -"1031 dequantize_per_tensor_379" -> "1032 add_20" [style=solid, label="(1, 14, 14, 384)"]; -"1032 add_20" -> "1033 quantize_per_tensor_380" [style=solid, label="(1, 14, 14, 384)"]; -"1033 quantize_per_tensor_380" -> "1034 dequantize_per_tensor_381" [style=solid, label="(1, 14, 14, 384)"]; -"1033 quantize_per_tensor_380" -> "1035 dequantize_per_tensor_382" [style=solid, label="(1, 14, 14, 384)"]; -"1034 dequantize_per_tensor_381" -> "1131 add_22" [style=solid, label="(1, 14, 14, 384)"]; -"1035 dequantize_per_tensor_382" -> "1068 pad_8" [style=solid, label="(1, 14, 14, 384)"]; -"1036 _frozen_param57" -> "1037 dequantize_per_tensor_383" [style=solid, label="(1, 15, 15, 2)"]; -"1037 dequantize_per_tensor_383" -> "1040 linear_38" [style=solid, label="(1, 15, 15, 2)"]; -"1038 _frozen_param58" -> "1039 dequantize_per_tensor_384" [style=solid, label="(512, 2)"]; -"1039 dequantize_per_tensor_384" -> "1040 linear_38" [style=solid, label="(512, 2)"]; -"1040 linear_38" -> "1041 relu__6" [style=solid, label="(1, 15, 15, 512)"]; -"1041 relu__6" -> "1042 quantize_per_tensor_385" [style=solid, label="(1, 15, 15, 512)"]; -"1042 quantize_per_tensor_385" -> "1043 dequantize_per_tensor_386" [style=solid, label="(1, 15, 15, 512)"]; -"1043 dequantize_per_tensor_386" -> "1044 relu__6_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 15, 15, 512)"]; -"1044 relu__6_0_0_nncf_smooth_quant_0" -> "1045 quantize_per_tensor_387" [style=solid, label="(1, 15, 15, 512)"]; -"1045 quantize_per_tensor_387" -> "1046 dequantize_per_tensor_388" [style=solid, label="(1, 15, 15, 512)"]; -"1046 dequantize_per_tensor_388" -> "1049 linear_39" [style=solid, label="(1, 15, 
15, 512)"]; -"1047 _frozen_param59" -> "1048 dequantize_per_tensor_389" [style=solid, label="(12, 512)"]; -"1048 dequantize_per_tensor_389" -> "1049 linear_39" [style=solid, label="(12, 512)"]; -"1049 linear_39" -> "1050 quantize_per_tensor_390" [style=solid, label="(1, 15, 15, 12)"]; -"1050 quantize_per_tensor_390" -> "1051 dequantize_per_tensor_391" [style=solid, label="(1, 15, 15, 12)"]; -"1051 dequantize_per_tensor_391" -> "1052 view_33" [style=solid, label="(1, 15, 15, 12)"]; -"1052 view_33" -> "1053 quantize_per_tensor_392" [style=solid, label="(225, 12)"]; -"1053 quantize_per_tensor_392" -> "1054 dequantize_per_tensor_393" [style=solid, label="(225, 12)"]; -"1054 dequantize_per_tensor_393" -> "1055 index_6" [style=solid, label="(225, 12)"]; -"1055 index_6" -> "1056 view_34" [style=solid, label="(4096, 12)"]; -"1056 view_34" -> "1057 permute_28" [style=solid, label="(64, 64, 12)"]; -"1057 permute_28" -> "1058 contiguous_10" [style=solid, label="(12, 64, 64)"]; -"1058 contiguous_10" -> "1059 unsqueeze_18" [style=solid, label="(12, 64, 64)"]; -"1059 unsqueeze_18" -> "1060 sigmoid_6" [style=solid, label="(1, 12, 64, 64)"]; -"1060 sigmoid_6" -> "1061 quantize_per_tensor_394" [style=solid, label="(1, 12, 64, 64)"]; -"1061 quantize_per_tensor_394" -> "1062 dequantize_per_tensor_395" [style=solid, label="(1, 12, 64, 64)"]; -"1062 dequantize_per_tensor_395" -> "1065 mul_12" [style=solid, label="(1, 12, 64, 64)"]; -"1063 _frozen_param60" -> "1064 dequantize_per_tensor_396" [style=solid, label="()"]; -"1064 dequantize_per_tensor_396" -> "1065 mul_12" [style=solid, label="()"]; -"1065 mul_12" -> "1066 quantize_per_tensor_397" [style=solid, label="(1, 12, 64, 64)"]; -"1066 quantize_per_tensor_397" -> "1067 dequantize_per_tensor_398" [style=solid, label="(1, 12, 64, 64)"]; -"1067 dequantize_per_tensor_398" -> "1103 add_21" [style=solid, label="(1, 12, 64, 64)"]; -"1068 pad_8" -> "1069 view_35" [style=solid, label="(1, 16, 16, 384)"]; -"1069 view_35" -> "1070 permute_29" 
[style=solid, label="(1, 2, 8, 2, 8, 384)"]; -"1070 permute_29" -> "1071 reshape_27" [style=solid, label="(1, 2, 2, 8, 8, 384)"]; -"1071 reshape_27" -> "1073 reshape_27_0_0_nncf_smooth_quant_0" [style=solid, label="(4, 64, 384)"]; -"1072 clone_6" -> "1078 linear_40" [style=solid, label="(1152,)"]; -"1073 reshape_27_0_0_nncf_smooth_quant_0" -> "1074 quantize_per_tensor_399" [style=solid, label="(4, 64, 384)"]; -"1074 quantize_per_tensor_399" -> "1075 dequantize_per_tensor_400" [style=solid, label="(4, 64, 384)"]; -"1075 dequantize_per_tensor_400" -> "1078 linear_40" [style=solid, label="(4, 64, 384)"]; -"1076 _frozen_param61" -> "1077 dequantize_per_tensor_401" [style=solid, label="(1152, 384)"]; -"1077 dequantize_per_tensor_401" -> "1078 linear_40" [style=solid, label="(1152, 384)"]; -"1078 linear_40" -> "1079 quantize_per_tensor_402" [style=solid, label="(4, 64, 1152)"]; -"1079 quantize_per_tensor_402" -> "1080 dequantize_per_tensor_403" [style=solid, label="(4, 64, 1152)"]; -"1080 dequantize_per_tensor_403" -> "1081 reshape_28" [style=solid, label="(4, 64, 1152)"]; -"1081 reshape_28" -> "1082 permute_30" [style=solid, label="(4, 64, 3, 12, 32)"]; -"1082 permute_30" -> "1083 select_18" [style=solid, label="(3, 4, 12, 64, 32)"]; -"1082 permute_30" -> "1084 select_19" [style=solid, label="(3, 4, 12, 64, 32)"]; -"1082 permute_30" -> "1085 select_20" [style=solid, label="(3, 4, 12, 64, 32)"]; -"1083 select_18" -> "1086 linalg_vector_norm_12" [style=solid, label="(4, 12, 64, 32)"]; -"1083 select_18" -> "1088 expand_as_12" [style=solid, label="(4, 12, 64, 32)"]; -"1083 select_18" -> "1089 div_12" [style=solid, label="(4, 12, 64, 32)"]; -"1084 select_19" -> "1090 linalg_vector_norm_13" [style=solid, label="(4, 12, 64, 32)"]; -"1084 select_19" -> "1092 expand_as_13" [style=solid, label="(4, 12, 64, 32)"]; -"1084 select_19" -> "1093 div_13" [style=solid, label="(4, 12, 64, 32)"]; -"1085 select_20" -> "1108 matmul_13" [style=solid, label="(4, 12, 64, 32)"]; -"1086 
linalg_vector_norm_12" -> "1087 clamp_min_12" [style=solid, label="(4, 12, 64, 1)"]; -"1087 clamp_min_12" -> "1088 expand_as_12" [style=solid, label="(4, 12, 64, 1)"]; -"1088 expand_as_12" -> "1089 div_12" [style=solid, label="(4, 12, 64, 32)"]; -"1089 div_12" -> "1095 matmul_12" [style=solid, label="(4, 12, 64, 32)"]; -"1090 linalg_vector_norm_13" -> "1091 clamp_min_13" [style=solid, label="(4, 12, 64, 1)"]; -"1091 clamp_min_13" -> "1092 expand_as_13" [style=solid, label="(4, 12, 64, 1)"]; -"1092 expand_as_13" -> "1093 div_13" [style=solid, label="(4, 12, 64, 32)"]; -"1093 div_13" -> "1094 transpose_12" [style=solid, label="(4, 12, 64, 32)"]; -"1094 transpose_12" -> "1095 matmul_12" [style=solid, label="(4, 12, 32, 64)"]; -"1095 matmul_12" -> "1096 quantize_per_tensor_404" [style=solid, label="(4, 12, 64, 64)"]; -"1096 quantize_per_tensor_404" -> "1097 dequantize_per_tensor_405" [style=solid, label="(4, 12, 64, 64)"]; -"1097 dequantize_per_tensor_405" -> "1100 mul_13" [style=solid, label="(4, 12, 64, 64)"]; -"1098 _frozen_param62" -> "1099 dequantize_per_tensor_406" [style=solid, label="(12, 1, 1)"]; -"1099 dequantize_per_tensor_406" -> "1100 mul_13" [style=solid, label="(12, 1, 1)"]; -"1100 mul_13" -> "1101 quantize_per_tensor_407" [style=solid, label="(4, 12, 64, 64)"]; -"1101 quantize_per_tensor_407" -> "1102 dequantize_per_tensor_408" [style=solid, label="(4, 12, 64, 64)"]; -"1102 dequantize_per_tensor_408" -> "1103 add_21" [style=solid, label="(4, 12, 64, 64)"]; -"1103 add_21" -> "1104 quantize_per_tensor_409" [style=solid, label="(4, 12, 64, 64)"]; -"1104 quantize_per_tensor_409" -> "1105 dequantize_per_tensor_410" [style=solid, label="(4, 12, 64, 64)"]; -"1105 dequantize_per_tensor_410" -> "1106 softmax_6" [style=solid, label="(4, 12, 64, 64)"]; -"1106 softmax_6" -> "1107 dropout_24" [style=solid, label="(4, 12, 64, 64)"]; -"1107 dropout_24" -> "1108 matmul_13" [style=solid, label="(4, 12, 64, 64)"]; -"1108 matmul_13" -> "1109 transpose_13" [style=solid, 
label="(4, 12, 64, 32)"]; -"1109 transpose_13" -> "1110 reshape_29" [style=solid, label="(4, 64, 12, 32)"]; -"1110 reshape_29" -> "1111 reshape_29_0_0_nncf_smooth_quant_0" [style=solid, label="(4, 64, 384)"]; -"1111 reshape_29_0_0_nncf_smooth_quant_0" -> "1112 quantize_per_tensor_411" [style=solid, label="(4, 64, 384)"]; -"1112 quantize_per_tensor_411" -> "1113 dequantize_per_tensor_412" [style=solid, label="(4, 64, 384)"]; -"1113 dequantize_per_tensor_412" -> "1116 linear_41" [style=solid, label="(4, 64, 384)"]; -"1114 _frozen_param63" -> "1115 dequantize_per_tensor_413" [style=solid, label="(384, 384)"]; -"1115 dequantize_per_tensor_413" -> "1116 linear_41" [style=solid, label="(384, 384)"]; -"1116 linear_41" -> "1117 quantize_per_tensor_414" [style=solid, label="(4, 64, 384)"]; -"1117 quantize_per_tensor_414" -> "1118 dequantize_per_tensor_415" [style=solid, label="(4, 64, 384)"]; -"1118 dequantize_per_tensor_415" -> "1119 dropout_25" [style=solid, label="(4, 64, 384)"]; -"1119 dropout_25" -> "1120 view_36" [style=solid, label="(4, 64, 384)"]; -"1120 view_36" -> "1121 permute_31" [style=solid, label="(1, 2, 2, 8, 8, 384)"]; -"1121 permute_31" -> "1122 reshape_30" [style=solid, label="(1, 2, 8, 2, 8, 384)"]; -"1122 reshape_30" -> "1123 slice_106" [style=solid, label="(1, 16, 16, 384)"]; -"1123 slice_106" -> "1124 slice_107" [style=solid, label="(1, 16, 16, 384)"]; -"1124 slice_107" -> "1125 slice_108" [style=solid, label="(1, 14, 16, 384)"]; -"1125 slice_108" -> "1126 slice_109" [style=solid, label="(1, 14, 14, 384)"]; -"1126 slice_109" -> "1127 contiguous_11" [style=solid, label="(1, 14, 14, 384)"]; -"1127 contiguous_11" -> "1128 layer_norm_15" [style=solid, label="(1, 14, 14, 384)"]; -"1128 layer_norm_15" -> "1129 quantize_per_tensor_416" [style=solid, label="(1, 14, 14, 384)"]; -"1129 quantize_per_tensor_416" -> "1130 dequantize_per_tensor_417" [style=solid, label="(1, 14, 14, 384)"]; -"1130 dequantize_per_tensor_417" -> "1131 add_22" [style=solid, label="(1, 
14, 14, 384)"]; -"1131 add_22" -> "1132 quantize_per_tensor_418" [style=solid, label="(1, 14, 14, 384)"]; -"1132 quantize_per_tensor_418" -> "1133 dequantize_per_tensor_419" [style=solid, label="(1, 14, 14, 384)"]; -"1132 quantize_per_tensor_418" -> "1134 dequantize_per_tensor_420" [style=solid, label="(1, 14, 14, 384)"]; -"1133 dequantize_per_tensor_419" -> "1157 add_23" [style=solid, label="(1, 14, 14, 384)"]; -"1134 dequantize_per_tensor_420" -> "1135 add_22_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 384)"]; -"1135 add_22_0_0_nncf_smooth_quant_0" -> "1136 quantize_per_tensor_421" [style=solid, label="(1, 14, 14, 384)"]; -"1136 quantize_per_tensor_421" -> "1137 dequantize_per_tensor_422" [style=solid, label="(1, 14, 14, 384)"]; -"1137 dequantize_per_tensor_422" -> "1140 linear_42" [style=solid, label="(1, 14, 14, 384)"]; -"1138 _frozen_param64" -> "1139 dequantize_per_tensor_423" [style=solid, label="(1536, 384)"]; -"1139 dequantize_per_tensor_423" -> "1140 linear_42" [style=solid, label="(1536, 384)"]; -"1140 linear_42" -> "1141 quantize_per_tensor_424" [style=solid, label="(1, 14, 14, 1536)"]; -"1141 quantize_per_tensor_424" -> "1142 dequantize_per_tensor_425" [style=solid, label="(1, 14, 14, 1536)"]; -"1142 dequantize_per_tensor_425" -> "1143 gelu_6" [style=solid, label="(1, 14, 14, 1536)"]; -"1143 gelu_6" -> "1144 dropout_26" [style=solid, label="(1, 14, 14, 1536)"]; -"1144 dropout_26" -> "1145 dropout_26_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 1536)"]; -"1145 dropout_26_0_0_nncf_smooth_quant_0" -> "1146 quantize_per_tensor_426" [style=solid, label="(1, 14, 14, 1536)"]; -"1146 quantize_per_tensor_426" -> "1147 dequantize_per_tensor_427" [style=solid, label="(1, 14, 14, 1536)"]; -"1147 dequantize_per_tensor_427" -> "1150 linear_43" [style=solid, label="(1, 14, 14, 1536)"]; -"1148 _frozen_param65" -> "1149 dequantize_per_tensor_428" [style=solid, label="(384, 1536)"]; -"1149 dequantize_per_tensor_428" -> "1150 linear_43" 
[style=solid, label="(384, 1536)"]; -"1150 linear_43" -> "1151 quantize_per_tensor_429" [style=solid, label="(1, 14, 14, 384)"]; -"1151 quantize_per_tensor_429" -> "1152 dequantize_per_tensor_430" [style=solid, label="(1, 14, 14, 384)"]; -"1152 dequantize_per_tensor_430" -> "1153 dropout_27" [style=solid, label="(1, 14, 14, 384)"]; -"1153 dropout_27" -> "1154 layer_norm_16" [style=solid, label="(1, 14, 14, 384)"]; -"1154 layer_norm_16" -> "1155 quantize_per_tensor_431" [style=solid, label="(1, 14, 14, 384)"]; -"1155 quantize_per_tensor_431" -> "1156 dequantize_per_tensor_432" [style=solid, label="(1, 14, 14, 384)"]; -"1156 dequantize_per_tensor_432" -> "1157 add_23" [style=solid, label="(1, 14, 14, 384)"]; -"1157 add_23" -> "1158 quantize_per_tensor_433" [style=solid, label="(1, 14, 14, 384)"]; -"1158 quantize_per_tensor_433" -> "1159 dequantize_per_tensor_434" [style=solid, label="(1, 14, 14, 384)"]; -"1158 quantize_per_tensor_433" -> "1160 dequantize_per_tensor_435" [style=solid, label="(1, 14, 14, 384)"]; -"1159 dequantize_per_tensor_434" -> "1282 add_26" [style=solid, label="(1, 14, 14, 384)"]; -"1160 dequantize_per_tensor_435" -> "1193 pad_9" [style=solid, label="(1, 14, 14, 384)"]; -"1161 _frozen_param66" -> "1162 dequantize_per_tensor_436" [style=solid, label="(1, 15, 15, 2)"]; -"1162 dequantize_per_tensor_436" -> "1165 linear_44" [style=solid, label="(1, 15, 15, 2)"]; -"1163 _frozen_param67" -> "1164 dequantize_per_tensor_437" [style=solid, label="(512, 2)"]; -"1164 dequantize_per_tensor_437" -> "1165 linear_44" [style=solid, label="(512, 2)"]; -"1165 linear_44" -> "1166 relu__7" [style=solid, label="(1, 15, 15, 512)"]; -"1166 relu__7" -> "1167 quantize_per_tensor_438" [style=solid, label="(1, 15, 15, 512)"]; -"1167 quantize_per_tensor_438" -> "1168 dequantize_per_tensor_439" [style=solid, label="(1, 15, 15, 512)"]; -"1168 dequantize_per_tensor_439" -> "1169 relu__7_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 15, 15, 512)"]; -"1169 
relu__7_0_0_nncf_smooth_quant_0" -> "1170 quantize_per_tensor_440" [style=solid, label="(1, 15, 15, 512)"]; -"1170 quantize_per_tensor_440" -> "1171 dequantize_per_tensor_441" [style=solid, label="(1, 15, 15, 512)"]; -"1171 dequantize_per_tensor_441" -> "1174 linear_45" [style=solid, label="(1, 15, 15, 512)"]; -"1172 _frozen_param68" -> "1173 dequantize_per_tensor_442" [style=solid, label="(12, 512)"]; -"1173 dequantize_per_tensor_442" -> "1174 linear_45" [style=solid, label="(12, 512)"]; -"1174 linear_45" -> "1175 quantize_per_tensor_443" [style=solid, label="(1, 15, 15, 12)"]; -"1175 quantize_per_tensor_443" -> "1176 dequantize_per_tensor_444" [style=solid, label="(1, 15, 15, 12)"]; -"1176 dequantize_per_tensor_444" -> "1177 view_37" [style=solid, label="(1, 15, 15, 12)"]; -"1177 view_37" -> "1178 quantize_per_tensor_445" [style=solid, label="(225, 12)"]; -"1178 quantize_per_tensor_445" -> "1179 dequantize_per_tensor_446" [style=solid, label="(225, 12)"]; -"1179 dequantize_per_tensor_446" -> "1180 index_7" [style=solid, label="(225, 12)"]; -"1180 index_7" -> "1181 view_38" [style=solid, label="(4096, 12)"]; -"1181 view_38" -> "1182 permute_32" [style=solid, label="(64, 64, 12)"]; -"1182 permute_32" -> "1183 contiguous_12" [style=solid, label="(12, 64, 64)"]; -"1183 contiguous_12" -> "1184 unsqueeze_19" [style=solid, label="(12, 64, 64)"]; -"1184 unsqueeze_19" -> "1185 sigmoid_7" [style=solid, label="(1, 12, 64, 64)"]; -"1185 sigmoid_7" -> "1186 quantize_per_tensor_447" [style=solid, label="(1, 12, 64, 64)"]; -"1186 quantize_per_tensor_447" -> "1187 dequantize_per_tensor_448" [style=solid, label="(1, 12, 64, 64)"]; -"1187 dequantize_per_tensor_448" -> "1190 mul_14" [style=solid, label="(1, 12, 64, 64)"]; -"1188 _frozen_param69" -> "1189 dequantize_per_tensor_449" [style=solid, label="()"]; -"1189 dequantize_per_tensor_449" -> "1190 mul_14" [style=solid, label="()"]; -"1190 mul_14" -> "1191 quantize_per_tensor_450" [style=solid, label="(1, 12, 64, 64)"]; -"1191 
quantize_per_tensor_450" -> "1192 dequantize_per_tensor_451" [style=solid, label="(1, 12, 64, 64)"]; -"1192 dequantize_per_tensor_451" -> "1229 add_24" [style=solid, label="(1, 12, 64, 64)"]; -"1193 pad_9" -> "1194 roll_6" [style=solid, label="(1, 16, 16, 384)"]; -"1194 roll_6" -> "1195 view_39" [style=solid, label="(1, 16, 16, 384)"]; -"1195 view_39" -> "1196 permute_33" [style=solid, label="(1, 2, 8, 2, 8, 384)"]; -"1196 permute_33" -> "1197 reshape_31" [style=solid, label="(1, 2, 2, 8, 8, 384)"]; -"1197 reshape_31" -> "1199 reshape_31_0_0_nncf_smooth_quant_0" [style=solid, label="(4, 64, 384)"]; -"1197 reshape_31" -> "1232 new_zeros_3" [style=solid, label="(4, 64, 384)"]; -"1198 clone_7" -> "1204 linear_46" [style=solid, label="(1152,)"]; -"1199 reshape_31_0_0_nncf_smooth_quant_0" -> "1200 quantize_per_tensor_452" [style=solid, label="(4, 64, 384)"]; -"1200 quantize_per_tensor_452" -> "1201 dequantize_per_tensor_453" [style=solid, label="(4, 64, 384)"]; -"1201 dequantize_per_tensor_453" -> "1204 linear_46" [style=solid, label="(4, 64, 384)"]; -"1202 _frozen_param70" -> "1203 dequantize_per_tensor_454" [style=solid, label="(1152, 384)"]; -"1203 dequantize_per_tensor_454" -> "1204 linear_46" [style=solid, label="(1152, 384)"]; -"1204 linear_46" -> "1205 quantize_per_tensor_455" [style=solid, label="(4, 64, 1152)"]; -"1205 quantize_per_tensor_455" -> "1206 dequantize_per_tensor_456" [style=solid, label="(4, 64, 1152)"]; -"1206 dequantize_per_tensor_456" -> "1207 reshape_32" [style=solid, label="(4, 64, 1152)"]; -"1207 reshape_32" -> "1208 permute_34" [style=solid, label="(4, 64, 3, 12, 32)"]; -"1208 permute_34" -> "1209 select_21" [style=solid, label="(3, 4, 12, 64, 32)"]; -"1208 permute_34" -> "1210 select_22" [style=solid, label="(3, 4, 12, 64, 32)"]; -"1208 permute_34" -> "1211 select_23" [style=solid, label="(3, 4, 12, 64, 32)"]; -"1209 select_21" -> "1212 linalg_vector_norm_14" [style=solid, label="(4, 12, 64, 32)"]; -"1209 select_21" -> "1214 expand_as_14" 
[style=solid, label="(4, 12, 64, 32)"]; -"1209 select_21" -> "1215 div_14" [style=solid, label="(4, 12, 64, 32)"]; -"1210 select_22" -> "1216 linalg_vector_norm_15" [style=solid, label="(4, 12, 64, 32)"]; -"1210 select_22" -> "1218 expand_as_15" [style=solid, label="(4, 12, 64, 32)"]; -"1210 select_22" -> "1219 div_15" [style=solid, label="(4, 12, 64, 32)"]; -"1211 select_23" -> "1258 matmul_15" [style=solid, label="(4, 12, 64, 32)"]; -"1212 linalg_vector_norm_14" -> "1213 clamp_min_14" [style=solid, label="(4, 12, 64, 1)"]; -"1213 clamp_min_14" -> "1214 expand_as_14" [style=solid, label="(4, 12, 64, 1)"]; -"1214 expand_as_14" -> "1215 div_14" [style=solid, label="(4, 12, 64, 32)"]; -"1215 div_14" -> "1221 matmul_14" [style=solid, label="(4, 12, 64, 32)"]; -"1216 linalg_vector_norm_15" -> "1217 clamp_min_15" [style=solid, label="(4, 12, 64, 1)"]; -"1217 clamp_min_15" -> "1218 expand_as_15" [style=solid, label="(4, 12, 64, 1)"]; -"1218 expand_as_15" -> "1219 div_15" [style=solid, label="(4, 12, 64, 32)"]; -"1219 div_15" -> "1220 transpose_14" [style=solid, label="(4, 12, 64, 32)"]; -"1220 transpose_14" -> "1221 matmul_14" [style=solid, label="(4, 12, 32, 64)"]; -"1221 matmul_14" -> "1222 quantize_per_tensor_457" [style=solid, label="(4, 12, 64, 64)"]; -"1222 quantize_per_tensor_457" -> "1223 dequantize_per_tensor_458" [style=solid, label="(4, 12, 64, 64)"]; -"1223 dequantize_per_tensor_458" -> "1226 mul_15" [style=solid, label="(4, 12, 64, 64)"]; -"1224 _frozen_param71" -> "1225 dequantize_per_tensor_459" [style=solid, label="(12, 1, 1)"]; -"1225 dequantize_per_tensor_459" -> "1226 mul_15" [style=solid, label="(12, 1, 1)"]; -"1226 mul_15" -> "1227 quantize_per_tensor_460" [style=solid, label="(4, 12, 64, 64)"]; -"1227 quantize_per_tensor_460" -> "1228 dequantize_per_tensor_461" [style=solid, label="(4, 12, 64, 64)"]; -"1228 dequantize_per_tensor_461" -> "1229 add_24" [style=solid, label="(4, 12, 64, 64)"]; -"1229 add_24" -> "1230 quantize_per_tensor_462" 
[style=solid, label="(4, 12, 64, 64)"]; -"1230 quantize_per_tensor_462" -> "1231 dequantize_per_tensor_463" [style=solid, label="(4, 12, 64, 64)"]; -"1231 dequantize_per_tensor_463" -> "1243 view_41" [style=solid, label="(4, 12, 64, 64)"]; -"1232 new_zeros_3" -> "1233 view_40" [style=solid, label="(16, 16)"]; -"1233 view_40" -> "1234 permute_35" [style=solid, label="(2, 8, 2, 8)"]; -"1234 permute_35" -> "1235 reshape_33" [style=solid, label="(2, 2, 8, 8)"]; -"1235 reshape_33" -> "1236 unsqueeze_20" [style=solid, label="(4, 64)"]; -"1235 reshape_33" -> "1237 unsqueeze_21" [style=solid, label="(4, 64)"]; -"1236 unsqueeze_20" -> "1238 sub_3" [style=solid, label="(4, 1, 64)"]; -"1237 unsqueeze_21" -> "1238 sub_3" [style=solid, label="(4, 64, 1)"]; -"1238 sub_3" -> "1239 ne_3" [style=solid, label="(4, 64, 64)"]; -"1238 sub_3" -> "1240 masked_fill_6" [style=solid, label="(4, 64, 64)"]; -"1238 sub_3" -> "1241 eq_3" [style=solid, label="(4, 64, 64)"]; -"1239 ne_3" -> "1240 masked_fill_6" [style=solid, label="(4, 64, 64)"]; -"1240 masked_fill_6" -> "1242 masked_fill_7" [style=solid, label="(4, 64, 64)"]; -"1241 eq_3" -> "1242 masked_fill_7" [style=solid, label="(4, 64, 64)"]; -"1242 masked_fill_7" -> "1246 unsqueeze_22" [style=solid, label="(4, 64, 64)"]; -"1243 view_41" -> "1244 quantize_per_tensor_464" [style=solid, label="(1, 4, 12, 64, 64)"]; -"1244 quantize_per_tensor_464" -> "1245 dequantize_per_tensor_465" [style=solid, label="(1, 4, 12, 64, 64)"]; -"1245 dequantize_per_tensor_465" -> "1250 add_25" [style=solid, label="(1, 4, 12, 64, 64)"]; -"1246 unsqueeze_22" -> "1247 unsqueeze_23" [style=solid, label="(4, 1, 64, 64)"]; -"1247 unsqueeze_23" -> "1248 quantize_per_tensor_466" [style=solid, label="(1, 4, 1, 64, 64)"]; -"1248 quantize_per_tensor_466" -> "1249 dequantize_per_tensor_467" [style=solid, label="(1, 4, 1, 64, 64)"]; -"1249 dequantize_per_tensor_467" -> "1250 add_25" [style=solid, label="(1, 4, 1, 64, 64)"]; -"1250 add_25" -> "1251 quantize_per_tensor_468" 
[style=solid, label="(1, 4, 12, 64, 64)"]; -"1251 quantize_per_tensor_468" -> "1252 dequantize_per_tensor_469" [style=solid, label="(1, 4, 12, 64, 64)"]; -"1252 dequantize_per_tensor_469" -> "1253 view_42" [style=solid, label="(1, 4, 12, 64, 64)"]; -"1253 view_42" -> "1254 quantize_per_tensor_470" [style=solid, label="(4, 12, 64, 64)"]; -"1254 quantize_per_tensor_470" -> "1255 dequantize_per_tensor_471" [style=solid, label="(4, 12, 64, 64)"]; -"1255 dequantize_per_tensor_471" -> "1256 softmax_7" [style=solid, label="(4, 12, 64, 64)"]; -"1256 softmax_7" -> "1257 dropout_28" [style=solid, label="(4, 12, 64, 64)"]; -"1257 dropout_28" -> "1258 matmul_15" [style=solid, label="(4, 12, 64, 64)"]; -"1258 matmul_15" -> "1259 transpose_15" [style=solid, label="(4, 12, 64, 32)"]; -"1259 transpose_15" -> "1260 reshape_34" [style=solid, label="(4, 64, 12, 32)"]; -"1260 reshape_34" -> "1261 reshape_34_0_0_nncf_smooth_quant_0" [style=solid, label="(4, 64, 384)"]; -"1261 reshape_34_0_0_nncf_smooth_quant_0" -> "1262 quantize_per_tensor_472" [style=solid, label="(4, 64, 384)"]; -"1262 quantize_per_tensor_472" -> "1263 dequantize_per_tensor_473" [style=solid, label="(4, 64, 384)"]; -"1263 dequantize_per_tensor_473" -> "1266 linear_47" [style=solid, label="(4, 64, 384)"]; -"1264 _frozen_param72" -> "1265 dequantize_per_tensor_474" [style=solid, label="(384, 384)"]; -"1265 dequantize_per_tensor_474" -> "1266 linear_47" [style=solid, label="(384, 384)"]; -"1266 linear_47" -> "1267 quantize_per_tensor_475" [style=solid, label="(4, 64, 384)"]; -"1267 quantize_per_tensor_475" -> "1268 dequantize_per_tensor_476" [style=solid, label="(4, 64, 384)"]; -"1268 dequantize_per_tensor_476" -> "1269 dropout_29" [style=solid, label="(4, 64, 384)"]; -"1269 dropout_29" -> "1270 view_43" [style=solid, label="(4, 64, 384)"]; -"1270 view_43" -> "1271 permute_36" [style=solid, label="(1, 2, 2, 8, 8, 384)"]; -"1271 permute_36" -> "1272 reshape_35" [style=solid, label="(1, 2, 8, 2, 8, 384)"]; -"1272 
reshape_35" -> "1273 roll_7" [style=solid, label="(1, 16, 16, 384)"]; -"1273 roll_7" -> "1274 slice_129" [style=solid, label="(1, 16, 16, 384)"]; -"1274 slice_129" -> "1275 slice_130" [style=solid, label="(1, 16, 16, 384)"]; -"1275 slice_130" -> "1276 slice_131" [style=solid, label="(1, 14, 16, 384)"]; -"1276 slice_131" -> "1277 slice_132" [style=solid, label="(1, 14, 14, 384)"]; -"1277 slice_132" -> "1278 contiguous_13" [style=solid, label="(1, 14, 14, 384)"]; -"1278 contiguous_13" -> "1279 layer_norm_17" [style=solid, label="(1, 14, 14, 384)"]; -"1279 layer_norm_17" -> "1280 quantize_per_tensor_477" [style=solid, label="(1, 14, 14, 384)"]; -"1280 quantize_per_tensor_477" -> "1281 dequantize_per_tensor_478" [style=solid, label="(1, 14, 14, 384)"]; -"1281 dequantize_per_tensor_478" -> "1282 add_26" [style=solid, label="(1, 14, 14, 384)"]; -"1282 add_26" -> "1283 quantize_per_tensor_479" [style=solid, label="(1, 14, 14, 384)"]; -"1283 quantize_per_tensor_479" -> "1284 dequantize_per_tensor_480" [style=solid, label="(1, 14, 14, 384)"]; -"1283 quantize_per_tensor_479" -> "1285 dequantize_per_tensor_481" [style=solid, label="(1, 14, 14, 384)"]; -"1284 dequantize_per_tensor_480" -> "1308 add_27" [style=solid, label="(1, 14, 14, 384)"]; -"1285 dequantize_per_tensor_481" -> "1286 add_26_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 384)"]; -"1286 add_26_0_0_nncf_smooth_quant_0" -> "1287 quantize_per_tensor_482" [style=solid, label="(1, 14, 14, 384)"]; -"1287 quantize_per_tensor_482" -> "1288 dequantize_per_tensor_483" [style=solid, label="(1, 14, 14, 384)"]; -"1288 dequantize_per_tensor_483" -> "1291 linear_48" [style=solid, label="(1, 14, 14, 384)"]; -"1289 _frozen_param73" -> "1290 dequantize_per_tensor_484" [style=solid, label="(1536, 384)"]; -"1290 dequantize_per_tensor_484" -> "1291 linear_48" [style=solid, label="(1536, 384)"]; -"1291 linear_48" -> "1292 quantize_per_tensor_485" [style=solid, label="(1, 14, 14, 1536)"]; -"1292 quantize_per_tensor_485" -> 
"1293 dequantize_per_tensor_486" [style=solid, label="(1, 14, 14, 1536)"]; -"1293 dequantize_per_tensor_486" -> "1294 gelu_7" [style=solid, label="(1, 14, 14, 1536)"]; -"1294 gelu_7" -> "1295 dropout_30" [style=solid, label="(1, 14, 14, 1536)"]; -"1295 dropout_30" -> "1296 dropout_30_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 1536)"]; -"1296 dropout_30_0_0_nncf_smooth_quant_0" -> "1297 quantize_per_tensor_487" [style=solid, label="(1, 14, 14, 1536)"]; -"1297 quantize_per_tensor_487" -> "1298 dequantize_per_tensor_488" [style=solid, label="(1, 14, 14, 1536)"]; -"1298 dequantize_per_tensor_488" -> "1301 linear_49" [style=solid, label="(1, 14, 14, 1536)"]; -"1299 _frozen_param74" -> "1300 dequantize_per_tensor_489" [style=solid, label="(384, 1536)"]; -"1300 dequantize_per_tensor_489" -> "1301 linear_49" [style=solid, label="(384, 1536)"]; -"1301 linear_49" -> "1302 quantize_per_tensor_490" [style=solid, label="(1, 14, 14, 384)"]; -"1302 quantize_per_tensor_490" -> "1303 dequantize_per_tensor_491" [style=solid, label="(1, 14, 14, 384)"]; -"1303 dequantize_per_tensor_491" -> "1304 dropout_31" [style=solid, label="(1, 14, 14, 384)"]; -"1304 dropout_31" -> "1305 layer_norm_18" [style=solid, label="(1, 14, 14, 384)"]; -"1305 layer_norm_18" -> "1306 quantize_per_tensor_492" [style=solid, label="(1, 14, 14, 384)"]; -"1306 quantize_per_tensor_492" -> "1307 dequantize_per_tensor_493" [style=solid, label="(1, 14, 14, 384)"]; -"1307 dequantize_per_tensor_493" -> "1308 add_27" [style=solid, label="(1, 14, 14, 384)"]; -"1308 add_27" -> "1309 quantize_per_tensor_494" [style=solid, label="(1, 14, 14, 384)"]; -"1309 quantize_per_tensor_494" -> "1310 dequantize_per_tensor_495" [style=solid, label="(1, 14, 14, 384)"]; -"1309 quantize_per_tensor_494" -> "1311 dequantize_per_tensor_496" [style=solid, label="(1, 14, 14, 384)"]; -"1310 dequantize_per_tensor_495" -> "1407 add_29" [style=solid, label="(1, 14, 14, 384)"]; -"1311 dequantize_per_tensor_496" -> "1344 pad_10" 
[style=solid, label="(1, 14, 14, 384)"]; -"1312 _frozen_param75" -> "1313 dequantize_per_tensor_497" [style=solid, label="(1, 15, 15, 2)"]; -"1313 dequantize_per_tensor_497" -> "1316 linear_50" [style=solid, label="(1, 15, 15, 2)"]; -"1314 _frozen_param76" -> "1315 dequantize_per_tensor_498" [style=solid, label="(512, 2)"]; -"1315 dequantize_per_tensor_498" -> "1316 linear_50" [style=solid, label="(512, 2)"]; -"1316 linear_50" -> "1317 relu__8" [style=solid, label="(1, 15, 15, 512)"]; -"1317 relu__8" -> "1318 quantize_per_tensor_499" [style=solid, label="(1, 15, 15, 512)"]; -"1318 quantize_per_tensor_499" -> "1319 dequantize_per_tensor_500" [style=solid, label="(1, 15, 15, 512)"]; -"1319 dequantize_per_tensor_500" -> "1320 relu__8_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 15, 15, 512)"]; -"1320 relu__8_0_0_nncf_smooth_quant_0" -> "1321 quantize_per_tensor_501" [style=solid, label="(1, 15, 15, 512)"]; -"1321 quantize_per_tensor_501" -> "1322 dequantize_per_tensor_502" [style=solid, label="(1, 15, 15, 512)"]; -"1322 dequantize_per_tensor_502" -> "1325 linear_51" [style=solid, label="(1, 15, 15, 512)"]; -"1323 _frozen_param77" -> "1324 dequantize_per_tensor_503" [style=solid, label="(12, 512)"]; -"1324 dequantize_per_tensor_503" -> "1325 linear_51" [style=solid, label="(12, 512)"]; -"1325 linear_51" -> "1326 quantize_per_tensor_504" [style=solid, label="(1, 15, 15, 12)"]; -"1326 quantize_per_tensor_504" -> "1327 dequantize_per_tensor_505" [style=solid, label="(1, 15, 15, 12)"]; -"1327 dequantize_per_tensor_505" -> "1328 view_44" [style=solid, label="(1, 15, 15, 12)"]; -"1328 view_44" -> "1329 quantize_per_tensor_506" [style=solid, label="(225, 12)"]; -"1329 quantize_per_tensor_506" -> "1330 dequantize_per_tensor_507" [style=solid, label="(225, 12)"]; -"1330 dequantize_per_tensor_507" -> "1331 index_8" [style=solid, label="(225, 12)"]; -"1331 index_8" -> "1332 view_45" [style=solid, label="(4096, 12)"]; -"1332 view_45" -> "1333 permute_37" [style=solid, 
label="(64, 64, 12)"]; -"1333 permute_37" -> "1334 contiguous_14" [style=solid, label="(12, 64, 64)"]; -"1334 contiguous_14" -> "1335 unsqueeze_24" [style=solid, label="(12, 64, 64)"]; -"1335 unsqueeze_24" -> "1336 sigmoid_8" [style=solid, label="(1, 12, 64, 64)"]; -"1336 sigmoid_8" -> "1337 quantize_per_tensor_508" [style=solid, label="(1, 12, 64, 64)"]; -"1337 quantize_per_tensor_508" -> "1338 dequantize_per_tensor_509" [style=solid, label="(1, 12, 64, 64)"]; -"1338 dequantize_per_tensor_509" -> "1341 mul_16" [style=solid, label="(1, 12, 64, 64)"]; -"1339 _frozen_param78" -> "1340 dequantize_per_tensor_510" [style=solid, label="()"]; -"1340 dequantize_per_tensor_510" -> "1341 mul_16" [style=solid, label="()"]; -"1341 mul_16" -> "1342 quantize_per_tensor_511" [style=solid, label="(1, 12, 64, 64)"]; -"1342 quantize_per_tensor_511" -> "1343 dequantize_per_tensor_512" [style=solid, label="(1, 12, 64, 64)"]; -"1343 dequantize_per_tensor_512" -> "1379 add_28" [style=solid, label="(1, 12, 64, 64)"]; -"1344 pad_10" -> "1345 view_46" [style=solid, label="(1, 16, 16, 384)"]; -"1345 view_46" -> "1346 permute_38" [style=solid, label="(1, 2, 8, 2, 8, 384)"]; -"1346 permute_38" -> "1347 reshape_36" [style=solid, label="(1, 2, 2, 8, 8, 384)"]; -"1347 reshape_36" -> "1349 reshape_36_0_0_nncf_smooth_quant_0" [style=solid, label="(4, 64, 384)"]; -"1348 clone_8" -> "1354 linear_52" [style=solid, label="(1152,)"]; -"1349 reshape_36_0_0_nncf_smooth_quant_0" -> "1350 quantize_per_tensor_513" [style=solid, label="(4, 64, 384)"]; -"1350 quantize_per_tensor_513" -> "1351 dequantize_per_tensor_514" [style=solid, label="(4, 64, 384)"]; -"1351 dequantize_per_tensor_514" -> "1354 linear_52" [style=solid, label="(4, 64, 384)"]; -"1352 _frozen_param79" -> "1353 dequantize_per_tensor_515" [style=solid, label="(1152, 384)"]; -"1353 dequantize_per_tensor_515" -> "1354 linear_52" [style=solid, label="(1152, 384)"]; -"1354 linear_52" -> "1355 quantize_per_tensor_516" [style=solid, label="(4, 64, 
1152)"]; -"1355 quantize_per_tensor_516" -> "1356 dequantize_per_tensor_517" [style=solid, label="(4, 64, 1152)"]; -"1356 dequantize_per_tensor_517" -> "1357 reshape_37" [style=solid, label="(4, 64, 1152)"]; -"1357 reshape_37" -> "1358 permute_39" [style=solid, label="(4, 64, 3, 12, 32)"]; -"1358 permute_39" -> "1359 select_24" [style=solid, label="(3, 4, 12, 64, 32)"]; -"1358 permute_39" -> "1360 select_25" [style=solid, label="(3, 4, 12, 64, 32)"]; -"1358 permute_39" -> "1361 select_26" [style=solid, label="(3, 4, 12, 64, 32)"]; -"1359 select_24" -> "1362 linalg_vector_norm_16" [style=solid, label="(4, 12, 64, 32)"]; -"1359 select_24" -> "1364 expand_as_16" [style=solid, label="(4, 12, 64, 32)"]; -"1359 select_24" -> "1365 div_16" [style=solid, label="(4, 12, 64, 32)"]; -"1360 select_25" -> "1366 linalg_vector_norm_17" [style=solid, label="(4, 12, 64, 32)"]; -"1360 select_25" -> "1368 expand_as_17" [style=solid, label="(4, 12, 64, 32)"]; -"1360 select_25" -> "1369 div_17" [style=solid, label="(4, 12, 64, 32)"]; -"1361 select_26" -> "1384 matmul_17" [style=solid, label="(4, 12, 64, 32)"]; -"1362 linalg_vector_norm_16" -> "1363 clamp_min_16" [style=solid, label="(4, 12, 64, 1)"]; -"1363 clamp_min_16" -> "1364 expand_as_16" [style=solid, label="(4, 12, 64, 1)"]; -"1364 expand_as_16" -> "1365 div_16" [style=solid, label="(4, 12, 64, 32)"]; -"1365 div_16" -> "1371 matmul_16" [style=solid, label="(4, 12, 64, 32)"]; -"1366 linalg_vector_norm_17" -> "1367 clamp_min_17" [style=solid, label="(4, 12, 64, 1)"]; -"1367 clamp_min_17" -> "1368 expand_as_17" [style=solid, label="(4, 12, 64, 1)"]; -"1368 expand_as_17" -> "1369 div_17" [style=solid, label="(4, 12, 64, 32)"]; -"1369 div_17" -> "1370 transpose_16" [style=solid, label="(4, 12, 64, 32)"]; -"1370 transpose_16" -> "1371 matmul_16" [style=solid, label="(4, 12, 32, 64)"]; -"1371 matmul_16" -> "1372 quantize_per_tensor_518" [style=solid, label="(4, 12, 64, 64)"]; -"1372 quantize_per_tensor_518" -> "1373 
dequantize_per_tensor_519" [style=solid, label="(4, 12, 64, 64)"]; -"1373 dequantize_per_tensor_519" -> "1376 mul_17" [style=solid, label="(4, 12, 64, 64)"]; -"1374 _frozen_param80" -> "1375 dequantize_per_tensor_520" [style=solid, label="(12, 1, 1)"]; -"1375 dequantize_per_tensor_520" -> "1376 mul_17" [style=solid, label="(12, 1, 1)"]; -"1376 mul_17" -> "1377 quantize_per_tensor_521" [style=solid, label="(4, 12, 64, 64)"]; -"1377 quantize_per_tensor_521" -> "1378 dequantize_per_tensor_522" [style=solid, label="(4, 12, 64, 64)"]; -"1378 dequantize_per_tensor_522" -> "1379 add_28" [style=solid, label="(4, 12, 64, 64)"]; -"1379 add_28" -> "1380 quantize_per_tensor_523" [style=solid, label="(4, 12, 64, 64)"]; -"1380 quantize_per_tensor_523" -> "1381 dequantize_per_tensor_524" [style=solid, label="(4, 12, 64, 64)"]; -"1381 dequantize_per_tensor_524" -> "1382 softmax_8" [style=solid, label="(4, 12, 64, 64)"]; -"1382 softmax_8" -> "1383 dropout_32" [style=solid, label="(4, 12, 64, 64)"]; -"1383 dropout_32" -> "1384 matmul_17" [style=solid, label="(4, 12, 64, 64)"]; -"1384 matmul_17" -> "1385 transpose_17" [style=solid, label="(4, 12, 64, 32)"]; -"1385 transpose_17" -> "1386 reshape_38" [style=solid, label="(4, 64, 12, 32)"]; -"1386 reshape_38" -> "1387 reshape_38_0_0_nncf_smooth_quant_0" [style=solid, label="(4, 64, 384)"]; -"1387 reshape_38_0_0_nncf_smooth_quant_0" -> "1388 quantize_per_tensor_525" [style=solid, label="(4, 64, 384)"]; -"1388 quantize_per_tensor_525" -> "1389 dequantize_per_tensor_526" [style=solid, label="(4, 64, 384)"]; -"1389 dequantize_per_tensor_526" -> "1392 linear_53" [style=solid, label="(4, 64, 384)"]; -"1390 _frozen_param81" -> "1391 dequantize_per_tensor_527" [style=solid, label="(384, 384)"]; -"1391 dequantize_per_tensor_527" -> "1392 linear_53" [style=solid, label="(384, 384)"]; -"1392 linear_53" -> "1393 quantize_per_tensor_528" [style=solid, label="(4, 64, 384)"]; -"1393 quantize_per_tensor_528" -> "1394 dequantize_per_tensor_529" 
[style=solid, label="(4, 64, 384)"]; -"1394 dequantize_per_tensor_529" -> "1395 dropout_33" [style=solid, label="(4, 64, 384)"]; -"1395 dropout_33" -> "1396 view_47" [style=solid, label="(4, 64, 384)"]; -"1396 view_47" -> "1397 permute_40" [style=solid, label="(1, 2, 2, 8, 8, 384)"]; -"1397 permute_40" -> "1398 reshape_39" [style=solid, label="(1, 2, 8, 2, 8, 384)"]; -"1398 reshape_39" -> "1399 slice_134" [style=solid, label="(1, 16, 16, 384)"]; -"1399 slice_134" -> "1400 slice_135" [style=solid, label="(1, 16, 16, 384)"]; -"1400 slice_135" -> "1401 slice_136" [style=solid, label="(1, 14, 16, 384)"]; -"1401 slice_136" -> "1402 slice_137" [style=solid, label="(1, 14, 14, 384)"]; -"1402 slice_137" -> "1403 contiguous_15" [style=solid, label="(1, 14, 14, 384)"]; -"1403 contiguous_15" -> "1404 layer_norm_19" [style=solid, label="(1, 14, 14, 384)"]; -"1404 layer_norm_19" -> "1405 quantize_per_tensor_530" [style=solid, label="(1, 14, 14, 384)"]; -"1405 quantize_per_tensor_530" -> "1406 dequantize_per_tensor_531" [style=solid, label="(1, 14, 14, 384)"]; -"1406 dequantize_per_tensor_531" -> "1407 add_29" [style=solid, label="(1, 14, 14, 384)"]; -"1407 add_29" -> "1408 quantize_per_tensor_532" [style=solid, label="(1, 14, 14, 384)"]; -"1408 quantize_per_tensor_532" -> "1409 dequantize_per_tensor_533" [style=solid, label="(1, 14, 14, 384)"]; -"1408 quantize_per_tensor_532" -> "1410 dequantize_per_tensor_534" [style=solid, label="(1, 14, 14, 384)"]; -"1409 dequantize_per_tensor_533" -> "1433 add_30" [style=solid, label="(1, 14, 14, 384)"]; -"1410 dequantize_per_tensor_534" -> "1411 add_29_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 384)"]; -"1411 add_29_0_0_nncf_smooth_quant_0" -> "1412 quantize_per_tensor_535" [style=solid, label="(1, 14, 14, 384)"]; -"1412 quantize_per_tensor_535" -> "1413 dequantize_per_tensor_536" [style=solid, label="(1, 14, 14, 384)"]; -"1413 dequantize_per_tensor_536" -> "1416 linear_54" [style=solid, label="(1, 14, 14, 384)"]; -"1414 
_frozen_param82" -> "1415 dequantize_per_tensor_537" [style=solid, label="(1536, 384)"]; -"1415 dequantize_per_tensor_537" -> "1416 linear_54" [style=solid, label="(1536, 384)"]; -"1416 linear_54" -> "1417 quantize_per_tensor_538" [style=solid, label="(1, 14, 14, 1536)"]; -"1417 quantize_per_tensor_538" -> "1418 dequantize_per_tensor_539" [style=solid, label="(1, 14, 14, 1536)"]; -"1418 dequantize_per_tensor_539" -> "1419 gelu_8" [style=solid, label="(1, 14, 14, 1536)"]; -"1419 gelu_8" -> "1420 dropout_34" [style=solid, label="(1, 14, 14, 1536)"]; -"1420 dropout_34" -> "1421 dropout_34_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 1536)"]; -"1421 dropout_34_0_0_nncf_smooth_quant_0" -> "1422 quantize_per_tensor_540" [style=solid, label="(1, 14, 14, 1536)"]; -"1422 quantize_per_tensor_540" -> "1423 dequantize_per_tensor_541" [style=solid, label="(1, 14, 14, 1536)"]; -"1423 dequantize_per_tensor_541" -> "1426 linear_55" [style=solid, label="(1, 14, 14, 1536)"]; -"1424 _frozen_param83" -> "1425 dequantize_per_tensor_542" [style=solid, label="(384, 1536)"]; -"1425 dequantize_per_tensor_542" -> "1426 linear_55" [style=solid, label="(384, 1536)"]; -"1426 linear_55" -> "1427 quantize_per_tensor_543" [style=solid, label="(1, 14, 14, 384)"]; -"1427 quantize_per_tensor_543" -> "1428 dequantize_per_tensor_544" [style=solid, label="(1, 14, 14, 384)"]; -"1428 dequantize_per_tensor_544" -> "1429 dropout_35" [style=solid, label="(1, 14, 14, 384)"]; -"1429 dropout_35" -> "1430 layer_norm_20" [style=solid, label="(1, 14, 14, 384)"]; -"1430 layer_norm_20" -> "1431 quantize_per_tensor_545" [style=solid, label="(1, 14, 14, 384)"]; -"1431 quantize_per_tensor_545" -> "1432 dequantize_per_tensor_546" [style=solid, label="(1, 14, 14, 384)"]; -"1432 dequantize_per_tensor_546" -> "1433 add_30" [style=solid, label="(1, 14, 14, 384)"]; -"1433 add_30" -> "1434 quantize_per_tensor_547" [style=solid, label="(1, 14, 14, 384)"]; -"1434 quantize_per_tensor_547" -> "1435 
dequantize_per_tensor_548" [style=solid, label="(1, 14, 14, 384)"]; -"1434 quantize_per_tensor_547" -> "1436 dequantize_per_tensor_549" [style=solid, label="(1, 14, 14, 384)"]; -"1435 dequantize_per_tensor_548" -> "1558 add_33" [style=solid, label="(1, 14, 14, 384)"]; -"1436 dequantize_per_tensor_549" -> "1469 pad_11" [style=solid, label="(1, 14, 14, 384)"]; -"1437 _frozen_param84" -> "1438 dequantize_per_tensor_550" [style=solid, label="(1, 15, 15, 2)"]; -"1438 dequantize_per_tensor_550" -> "1441 linear_56" [style=solid, label="(1, 15, 15, 2)"]; -"1439 _frozen_param85" -> "1440 dequantize_per_tensor_551" [style=solid, label="(512, 2)"]; -"1440 dequantize_per_tensor_551" -> "1441 linear_56" [style=solid, label="(512, 2)"]; -"1441 linear_56" -> "1442 relu__9" [style=solid, label="(1, 15, 15, 512)"]; -"1442 relu__9" -> "1443 quantize_per_tensor_552" [style=solid, label="(1, 15, 15, 512)"]; -"1443 quantize_per_tensor_552" -> "1444 dequantize_per_tensor_553" [style=solid, label="(1, 15, 15, 512)"]; -"1444 dequantize_per_tensor_553" -> "1445 relu__9_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 15, 15, 512)"]; -"1445 relu__9_0_0_nncf_smooth_quant_0" -> "1446 quantize_per_tensor_554" [style=solid, label="(1, 15, 15, 512)"]; -"1446 quantize_per_tensor_554" -> "1447 dequantize_per_tensor_555" [style=solid, label="(1, 15, 15, 512)"]; -"1447 dequantize_per_tensor_555" -> "1450 linear_57" [style=solid, label="(1, 15, 15, 512)"]; -"1448 _frozen_param86" -> "1449 dequantize_per_tensor_556" [style=solid, label="(12, 512)"]; -"1449 dequantize_per_tensor_556" -> "1450 linear_57" [style=solid, label="(12, 512)"]; -"1450 linear_57" -> "1451 quantize_per_tensor_557" [style=solid, label="(1, 15, 15, 12)"]; -"1451 quantize_per_tensor_557" -> "1452 dequantize_per_tensor_558" [style=solid, label="(1, 15, 15, 12)"]; -"1452 dequantize_per_tensor_558" -> "1453 view_48" [style=solid, label="(1, 15, 15, 12)"]; -"1453 view_48" -> "1454 quantize_per_tensor_559" [style=solid, label="(225, 
12)"]; -"1454 quantize_per_tensor_559" -> "1455 dequantize_per_tensor_560" [style=solid, label="(225, 12)"]; -"1455 dequantize_per_tensor_560" -> "1456 index_9" [style=solid, label="(225, 12)"]; -"1456 index_9" -> "1457 view_49" [style=solid, label="(4096, 12)"]; -"1457 view_49" -> "1458 permute_41" [style=solid, label="(64, 64, 12)"]; -"1458 permute_41" -> "1459 contiguous_16" [style=solid, label="(12, 64, 64)"]; -"1459 contiguous_16" -> "1460 unsqueeze_25" [style=solid, label="(12, 64, 64)"]; -"1460 unsqueeze_25" -> "1461 sigmoid_9" [style=solid, label="(1, 12, 64, 64)"]; -"1461 sigmoid_9" -> "1462 quantize_per_tensor_561" [style=solid, label="(1, 12, 64, 64)"]; -"1462 quantize_per_tensor_561" -> "1463 dequantize_per_tensor_562" [style=solid, label="(1, 12, 64, 64)"]; -"1463 dequantize_per_tensor_562" -> "1466 mul_18" [style=solid, label="(1, 12, 64, 64)"]; -"1464 _frozen_param87" -> "1465 dequantize_per_tensor_563" [style=solid, label="()"]; -"1465 dequantize_per_tensor_563" -> "1466 mul_18" [style=solid, label="()"]; -"1466 mul_18" -> "1467 quantize_per_tensor_564" [style=solid, label="(1, 12, 64, 64)"]; -"1467 quantize_per_tensor_564" -> "1468 dequantize_per_tensor_565" [style=solid, label="(1, 12, 64, 64)"]; -"1468 dequantize_per_tensor_565" -> "1505 add_31" [style=solid, label="(1, 12, 64, 64)"]; -"1469 pad_11" -> "1470 roll_8" [style=solid, label="(1, 16, 16, 384)"]; -"1470 roll_8" -> "1471 view_50" [style=solid, label="(1, 16, 16, 384)"]; -"1471 view_50" -> "1472 permute_42" [style=solid, label="(1, 2, 8, 2, 8, 384)"]; -"1472 permute_42" -> "1473 reshape_40" [style=solid, label="(1, 2, 2, 8, 8, 384)"]; -"1473 reshape_40" -> "1475 reshape_40_0_0_nncf_smooth_quant_0" [style=solid, label="(4, 64, 384)"]; -"1473 reshape_40" -> "1508 new_zeros_4" [style=solid, label="(4, 64, 384)"]; -"1474 clone_9" -> "1480 linear_58" [style=solid, label="(1152,)"]; -"1475 reshape_40_0_0_nncf_smooth_quant_0" -> "1476 quantize_per_tensor_566" [style=solid, label="(4, 64, 384)"]; 
-"1476 quantize_per_tensor_566" -> "1477 dequantize_per_tensor_567" [style=solid, label="(4, 64, 384)"]; -"1477 dequantize_per_tensor_567" -> "1480 linear_58" [style=solid, label="(4, 64, 384)"]; -"1478 _frozen_param88" -> "1479 dequantize_per_tensor_568" [style=solid, label="(1152, 384)"]; -"1479 dequantize_per_tensor_568" -> "1480 linear_58" [style=solid, label="(1152, 384)"]; -"1480 linear_58" -> "1481 quantize_per_tensor_569" [style=solid, label="(4, 64, 1152)"]; -"1481 quantize_per_tensor_569" -> "1482 dequantize_per_tensor_570" [style=solid, label="(4, 64, 1152)"]; -"1482 dequantize_per_tensor_570" -> "1483 reshape_41" [style=solid, label="(4, 64, 1152)"]; -"1483 reshape_41" -> "1484 permute_43" [style=solid, label="(4, 64, 3, 12, 32)"]; -"1484 permute_43" -> "1485 select_27" [style=solid, label="(3, 4, 12, 64, 32)"]; -"1484 permute_43" -> "1486 select_28" [style=solid, label="(3, 4, 12, 64, 32)"]; -"1484 permute_43" -> "1487 select_29" [style=solid, label="(3, 4, 12, 64, 32)"]; -"1485 select_27" -> "1488 linalg_vector_norm_18" [style=solid, label="(4, 12, 64, 32)"]; -"1485 select_27" -> "1490 expand_as_18" [style=solid, label="(4, 12, 64, 32)"]; -"1485 select_27" -> "1491 div_18" [style=solid, label="(4, 12, 64, 32)"]; -"1486 select_28" -> "1492 linalg_vector_norm_19" [style=solid, label="(4, 12, 64, 32)"]; -"1486 select_28" -> "1494 expand_as_19" [style=solid, label="(4, 12, 64, 32)"]; -"1486 select_28" -> "1495 div_19" [style=solid, label="(4, 12, 64, 32)"]; -"1487 select_29" -> "1534 matmul_19" [style=solid, label="(4, 12, 64, 32)"]; -"1488 linalg_vector_norm_18" -> "1489 clamp_min_18" [style=solid, label="(4, 12, 64, 1)"]; -"1489 clamp_min_18" -> "1490 expand_as_18" [style=solid, label="(4, 12, 64, 1)"]; -"1490 expand_as_18" -> "1491 div_18" [style=solid, label="(4, 12, 64, 32)"]; -"1491 div_18" -> "1497 matmul_18" [style=solid, label="(4, 12, 64, 32)"]; -"1492 linalg_vector_norm_19" -> "1493 clamp_min_19" [style=solid, label="(4, 12, 64, 1)"]; -"1493 
clamp_min_19" -> "1494 expand_as_19" [style=solid, label="(4, 12, 64, 1)"]; -"1494 expand_as_19" -> "1495 div_19" [style=solid, label="(4, 12, 64, 32)"]; -"1495 div_19" -> "1496 transpose_18" [style=solid, label="(4, 12, 64, 32)"]; -"1496 transpose_18" -> "1497 matmul_18" [style=solid, label="(4, 12, 32, 64)"]; -"1497 matmul_18" -> "1498 quantize_per_tensor_571" [style=solid, label="(4, 12, 64, 64)"]; -"1498 quantize_per_tensor_571" -> "1499 dequantize_per_tensor_572" [style=solid, label="(4, 12, 64, 64)"]; -"1499 dequantize_per_tensor_572" -> "1502 mul_19" [style=solid, label="(4, 12, 64, 64)"]; -"1500 _frozen_param89" -> "1501 dequantize_per_tensor_573" [style=solid, label="(12, 1, 1)"]; -"1501 dequantize_per_tensor_573" -> "1502 mul_19" [style=solid, label="(12, 1, 1)"]; -"1502 mul_19" -> "1503 quantize_per_tensor_574" [style=solid, label="(4, 12, 64, 64)"]; -"1503 quantize_per_tensor_574" -> "1504 dequantize_per_tensor_575" [style=solid, label="(4, 12, 64, 64)"]; -"1504 dequantize_per_tensor_575" -> "1505 add_31" [style=solid, label="(4, 12, 64, 64)"]; -"1505 add_31" -> "1506 quantize_per_tensor_576" [style=solid, label="(4, 12, 64, 64)"]; -"1506 quantize_per_tensor_576" -> "1507 dequantize_per_tensor_577" [style=solid, label="(4, 12, 64, 64)"]; -"1507 dequantize_per_tensor_577" -> "1519 view_52" [style=solid, label="(4, 12, 64, 64)"]; -"1508 new_zeros_4" -> "1509 view_51" [style=solid, label="(16, 16)"]; -"1509 view_51" -> "1510 permute_44" [style=solid, label="(2, 8, 2, 8)"]; -"1510 permute_44" -> "1511 reshape_42" [style=solid, label="(2, 2, 8, 8)"]; -"1511 reshape_42" -> "1512 unsqueeze_26" [style=solid, label="(4, 64)"]; -"1511 reshape_42" -> "1513 unsqueeze_27" [style=solid, label="(4, 64)"]; -"1512 unsqueeze_26" -> "1514 sub_4" [style=solid, label="(4, 1, 64)"]; -"1513 unsqueeze_27" -> "1514 sub_4" [style=solid, label="(4, 64, 1)"]; -"1514 sub_4" -> "1515 ne_4" [style=solid, label="(4, 64, 64)"]; -"1514 sub_4" -> "1516 masked_fill_8" [style=solid, 
label="(4, 64, 64)"]; -"1514 sub_4" -> "1517 eq_4" [style=solid, label="(4, 64, 64)"]; -"1515 ne_4" -> "1516 masked_fill_8" [style=solid, label="(4, 64, 64)"]; -"1516 masked_fill_8" -> "1518 masked_fill_9" [style=solid, label="(4, 64, 64)"]; -"1517 eq_4" -> "1518 masked_fill_9" [style=solid, label="(4, 64, 64)"]; -"1518 masked_fill_9" -> "1522 unsqueeze_28" [style=solid, label="(4, 64, 64)"]; -"1519 view_52" -> "1520 quantize_per_tensor_578" [style=solid, label="(1, 4, 12, 64, 64)"]; -"1520 quantize_per_tensor_578" -> "1521 dequantize_per_tensor_579" [style=solid, label="(1, 4, 12, 64, 64)"]; -"1521 dequantize_per_tensor_579" -> "1526 add_32" [style=solid, label="(1, 4, 12, 64, 64)"]; -"1522 unsqueeze_28" -> "1523 unsqueeze_29" [style=solid, label="(4, 1, 64, 64)"]; -"1523 unsqueeze_29" -> "1524 quantize_per_tensor_580" [style=solid, label="(1, 4, 1, 64, 64)"]; -"1524 quantize_per_tensor_580" -> "1525 dequantize_per_tensor_581" [style=solid, label="(1, 4, 1, 64, 64)"]; -"1525 dequantize_per_tensor_581" -> "1526 add_32" [style=solid, label="(1, 4, 1, 64, 64)"]; -"1526 add_32" -> "1527 quantize_per_tensor_582" [style=solid, label="(1, 4, 12, 64, 64)"]; -"1527 quantize_per_tensor_582" -> "1528 dequantize_per_tensor_583" [style=solid, label="(1, 4, 12, 64, 64)"]; -"1528 dequantize_per_tensor_583" -> "1529 view_53" [style=solid, label="(1, 4, 12, 64, 64)"]; -"1529 view_53" -> "1530 quantize_per_tensor_584" [style=solid, label="(4, 12, 64, 64)"]; -"1530 quantize_per_tensor_584" -> "1531 dequantize_per_tensor_585" [style=solid, label="(4, 12, 64, 64)"]; -"1531 dequantize_per_tensor_585" -> "1532 softmax_9" [style=solid, label="(4, 12, 64, 64)"]; -"1532 softmax_9" -> "1533 dropout_36" [style=solid, label="(4, 12, 64, 64)"]; -"1533 dropout_36" -> "1534 matmul_19" [style=solid, label="(4, 12, 64, 64)"]; -"1534 matmul_19" -> "1535 transpose_19" [style=solid, label="(4, 12, 64, 32)"]; -"1535 transpose_19" -> "1536 reshape_43" [style=solid, label="(4, 64, 12, 32)"]; -"1536 
reshape_43" -> "1537 reshape_43_0_0_nncf_smooth_quant_0" [style=solid, label="(4, 64, 384)"]; -"1537 reshape_43_0_0_nncf_smooth_quant_0" -> "1538 quantize_per_tensor_586" [style=solid, label="(4, 64, 384)"]; -"1538 quantize_per_tensor_586" -> "1539 dequantize_per_tensor_587" [style=solid, label="(4, 64, 384)"]; -"1539 dequantize_per_tensor_587" -> "1542 linear_59" [style=solid, label="(4, 64, 384)"]; -"1540 _frozen_param90" -> "1541 dequantize_per_tensor_588" [style=solid, label="(384, 384)"]; -"1541 dequantize_per_tensor_588" -> "1542 linear_59" [style=solid, label="(384, 384)"]; -"1542 linear_59" -> "1543 quantize_per_tensor_589" [style=solid, label="(4, 64, 384)"]; -"1543 quantize_per_tensor_589" -> "1544 dequantize_per_tensor_590" [style=solid, label="(4, 64, 384)"]; -"1544 dequantize_per_tensor_590" -> "1545 dropout_37" [style=solid, label="(4, 64, 384)"]; -"1545 dropout_37" -> "1546 view_54" [style=solid, label="(4, 64, 384)"]; -"1546 view_54" -> "1547 permute_45" [style=solid, label="(1, 2, 2, 8, 8, 384)"]; -"1547 permute_45" -> "1548 reshape_44" [style=solid, label="(1, 2, 8, 2, 8, 384)"]; -"1548 reshape_44" -> "1549 roll_9" [style=solid, label="(1, 16, 16, 384)"]; -"1549 roll_9" -> "1550 slice_157" [style=solid, label="(1, 16, 16, 384)"]; -"1550 slice_157" -> "1551 slice_158" [style=solid, label="(1, 16, 16, 384)"]; -"1551 slice_158" -> "1552 slice_159" [style=solid, label="(1, 14, 16, 384)"]; -"1552 slice_159" -> "1553 slice_160" [style=solid, label="(1, 14, 14, 384)"]; -"1553 slice_160" -> "1554 contiguous_17" [style=solid, label="(1, 14, 14, 384)"]; -"1554 contiguous_17" -> "1555 layer_norm_21" [style=solid, label="(1, 14, 14, 384)"]; -"1555 layer_norm_21" -> "1556 quantize_per_tensor_591" [style=solid, label="(1, 14, 14, 384)"]; -"1556 quantize_per_tensor_591" -> "1557 dequantize_per_tensor_592" [style=solid, label="(1, 14, 14, 384)"]; -"1557 dequantize_per_tensor_592" -> "1558 add_33" [style=solid, label="(1, 14, 14, 384)"]; -"1558 add_33" -> "1559 
quantize_per_tensor_593" [style=solid, label="(1, 14, 14, 384)"]; -"1559 quantize_per_tensor_593" -> "1560 dequantize_per_tensor_594" [style=solid, label="(1, 14, 14, 384)"]; -"1559 quantize_per_tensor_593" -> "1561 dequantize_per_tensor_595" [style=solid, label="(1, 14, 14, 384)"]; -"1560 dequantize_per_tensor_594" -> "1584 add_34" [style=solid, label="(1, 14, 14, 384)"]; -"1561 dequantize_per_tensor_595" -> "1562 add_33_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 384)"]; -"1562 add_33_0_0_nncf_smooth_quant_0" -> "1563 quantize_per_tensor_596" [style=solid, label="(1, 14, 14, 384)"]; -"1563 quantize_per_tensor_596" -> "1564 dequantize_per_tensor_597" [style=solid, label="(1, 14, 14, 384)"]; -"1564 dequantize_per_tensor_597" -> "1567 linear_60" [style=solid, label="(1, 14, 14, 384)"]; -"1565 _frozen_param91" -> "1566 dequantize_per_tensor_598" [style=solid, label="(1536, 384)"]; -"1566 dequantize_per_tensor_598" -> "1567 linear_60" [style=solid, label="(1536, 384)"]; -"1567 linear_60" -> "1568 quantize_per_tensor_599" [style=solid, label="(1, 14, 14, 1536)"]; -"1568 quantize_per_tensor_599" -> "1569 dequantize_per_tensor_600" [style=solid, label="(1, 14, 14, 1536)"]; -"1569 dequantize_per_tensor_600" -> "1570 gelu_9" [style=solid, label="(1, 14, 14, 1536)"]; -"1570 gelu_9" -> "1571 dropout_38" [style=solid, label="(1, 14, 14, 1536)"]; -"1571 dropout_38" -> "1572 dropout_38_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 14, 14, 1536)"]; -"1572 dropout_38_0_0_nncf_smooth_quant_0" -> "1573 quantize_per_tensor_601" [style=solid, label="(1, 14, 14, 1536)"]; -"1573 quantize_per_tensor_601" -> "1574 dequantize_per_tensor_602" [style=solid, label="(1, 14, 14, 1536)"]; -"1574 dequantize_per_tensor_602" -> "1577 linear_61" [style=solid, label="(1, 14, 14, 1536)"]; -"1575 _frozen_param92" -> "1576 dequantize_per_tensor_603" [style=solid, label="(384, 1536)"]; -"1576 dequantize_per_tensor_603" -> "1577 linear_61" [style=solid, label="(384, 1536)"]; -"1577 
linear_61" -> "1578 quantize_per_tensor_604" [style=solid, label="(1, 14, 14, 384)"]; -"1578 quantize_per_tensor_604" -> "1579 dequantize_per_tensor_605" [style=solid, label="(1, 14, 14, 384)"]; -"1579 dequantize_per_tensor_605" -> "1580 dropout_39" [style=solid, label="(1, 14, 14, 384)"]; -"1580 dropout_39" -> "1581 layer_norm_22" [style=solid, label="(1, 14, 14, 384)"]; -"1581 layer_norm_22" -> "1582 quantize_per_tensor_606" [style=solid, label="(1, 14, 14, 384)"]; -"1582 quantize_per_tensor_606" -> "1583 dequantize_per_tensor_607" [style=solid, label="(1, 14, 14, 384)"]; -"1583 dequantize_per_tensor_607" -> "1584 add_34" [style=solid, label="(1, 14, 14, 384)"]; -"1584 add_34" -> "1585 quantize_per_tensor_608" [style=solid, label="(1, 14, 14, 384)"]; -"1585 quantize_per_tensor_608" -> "1586 dequantize_per_tensor_609" [style=solid, label="(1, 14, 14, 384)"]; -"1586 dequantize_per_tensor_609" -> "1587 pad_12" [style=solid, label="(1, 14, 14, 384)"]; -"1587 pad_12" -> "1588 slice_161" [style=solid, label="(1, 14, 14, 384)"]; -"1587 pad_12" -> "1593 slice_164" [style=solid, label="(1, 14, 14, 384)"]; -"1587 pad_12" -> "1598 slice_167" [style=solid, label="(1, 14, 14, 384)"]; -"1587 pad_12" -> "1603 slice_170" [style=solid, label="(1, 14, 14, 384)"]; -"1588 slice_161" -> "1589 slice_162" [style=solid, label="(1, 7, 14, 384)"]; -"1589 slice_162" -> "1590 slice_163" [style=solid, label="(1, 7, 7, 384)"]; -"1590 slice_163" -> "1591 quantize_per_tensor_610" [style=solid, label="(1, 7, 7, 384)"]; -"1591 quantize_per_tensor_610" -> "1592 dequantize_per_tensor_611" [style=solid, label="(1, 7, 7, 384)"]; -"1592 dequantize_per_tensor_611" -> "1608 cat_2" [style=solid, label="(1, 7, 7, 384)"]; -"1593 slice_164" -> "1594 slice_165" [style=solid, label="(1, 7, 14, 384)"]; -"1594 slice_165" -> "1595 slice_166" [style=solid, label="(1, 7, 7, 384)"]; -"1595 slice_166" -> "1596 quantize_per_tensor_612" [style=solid, label="(1, 7, 7, 384)"]; -"1596 quantize_per_tensor_612" -> "1597 
dequantize_per_tensor_613" [style=solid, label="(1, 7, 7, 384)"]; -"1597 dequantize_per_tensor_613" -> "1608 cat_2" [style=solid, label="(1, 7, 7, 384)"]; -"1598 slice_167" -> "1599 slice_168" [style=solid, label="(1, 7, 14, 384)"]; -"1599 slice_168" -> "1600 slice_169" [style=solid, label="(1, 7, 7, 384)"]; -"1600 slice_169" -> "1601 quantize_per_tensor_614" [style=solid, label="(1, 7, 7, 384)"]; -"1601 quantize_per_tensor_614" -> "1602 dequantize_per_tensor_615" [style=solid, label="(1, 7, 7, 384)"]; -"1602 dequantize_per_tensor_615" -> "1608 cat_2" [style=solid, label="(1, 7, 7, 384)"]; -"1603 slice_170" -> "1604 slice_171" [style=solid, label="(1, 7, 14, 384)"]; -"1604 slice_171" -> "1605 slice_172" [style=solid, label="(1, 7, 7, 384)"]; -"1605 slice_172" -> "1606 quantize_per_tensor_616" [style=solid, label="(1, 7, 7, 384)"]; -"1606 quantize_per_tensor_616" -> "1607 dequantize_per_tensor_617" [style=solid, label="(1, 7, 7, 384)"]; -"1607 dequantize_per_tensor_617" -> "1608 cat_2" [style=solid, label="(1, 7, 7, 384)"]; -"1608 cat_2" -> "1609 quantize_per_tensor_618" [style=solid, label="(1, 7, 7, 1536)"]; -"1609 quantize_per_tensor_618" -> "1610 dequantize_per_tensor_619" [style=solid, label="(1, 7, 7, 1536)"]; -"1610 dequantize_per_tensor_619" -> "1611 cat_2_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 7, 7, 1536)"]; -"1611 cat_2_0_0_nncf_smooth_quant_0" -> "1612 quantize_per_tensor_620" [style=solid, label="(1, 7, 7, 1536)"]; -"1612 quantize_per_tensor_620" -> "1613 dequantize_per_tensor_621" [style=solid, label="(1, 7, 7, 1536)"]; -"1613 dequantize_per_tensor_621" -> "1616 linear_62" [style=solid, label="(1, 7, 7, 1536)"]; -"1614 _frozen_param93" -> "1615 dequantize_per_tensor_622" [style=solid, label="(768, 1536)"]; -"1615 dequantize_per_tensor_622" -> "1616 linear_62" [style=solid, label="(768, 1536)"]; -"1616 linear_62" -> "1617 quantize_per_tensor_623" [style=solid, label="(1, 7, 7, 768)"]; -"1617 quantize_per_tensor_623" -> "1618 
dequantize_per_tensor_624" [style=solid, label="(1, 7, 7, 768)"]; -"1618 dequantize_per_tensor_624" -> "1619 layer_norm_23" [style=solid, label="(1, 7, 7, 768)"]; -"1619 layer_norm_23" -> "1652 pad_13" [style=solid, label="(1, 7, 7, 768)"]; -"1619 layer_norm_23" -> "1715 quantize_per_tensor_660" [style=solid, label="(1, 7, 7, 768)"]; -"1620 _frozen_param94" -> "1621 dequantize_per_tensor_625" [style=solid, label="(1, 15, 15, 2)"]; -"1621 dequantize_per_tensor_625" -> "1624 linear_63" [style=solid, label="(1, 15, 15, 2)"]; -"1622 _frozen_param95" -> "1623 dequantize_per_tensor_626" [style=solid, label="(512, 2)"]; -"1623 dequantize_per_tensor_626" -> "1624 linear_63" [style=solid, label="(512, 2)"]; -"1624 linear_63" -> "1625 relu__10" [style=solid, label="(1, 15, 15, 512)"]; -"1625 relu__10" -> "1626 quantize_per_tensor_627" [style=solid, label="(1, 15, 15, 512)"]; -"1626 quantize_per_tensor_627" -> "1627 dequantize_per_tensor_628" [style=solid, label="(1, 15, 15, 512)"]; -"1627 dequantize_per_tensor_628" -> "1628 relu__10_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 15, 15, 512)"]; -"1628 relu__10_0_0_nncf_smooth_quant_0" -> "1629 quantize_per_tensor_629" [style=solid, label="(1, 15, 15, 512)"]; -"1629 quantize_per_tensor_629" -> "1630 dequantize_per_tensor_630" [style=solid, label="(1, 15, 15, 512)"]; -"1630 dequantize_per_tensor_630" -> "1633 linear_64" [style=solid, label="(1, 15, 15, 512)"]; -"1631 _frozen_param96" -> "1632 dequantize_per_tensor_631" [style=solid, label="(24, 512)"]; -"1632 dequantize_per_tensor_631" -> "1633 linear_64" [style=solid, label="(24, 512)"]; -"1633 linear_64" -> "1634 quantize_per_tensor_632" [style=solid, label="(1, 15, 15, 24)"]; -"1634 quantize_per_tensor_632" -> "1635 dequantize_per_tensor_633" [style=solid, label="(1, 15, 15, 24)"]; -"1635 dequantize_per_tensor_633" -> "1636 view_55" [style=solid, label="(1, 15, 15, 24)"]; -"1636 view_55" -> "1637 quantize_per_tensor_634" [style=solid, label="(225, 24)"]; -"1637 
quantize_per_tensor_634" -> "1638 dequantize_per_tensor_635" [style=solid, label="(225, 24)"]; -"1638 dequantize_per_tensor_635" -> "1639 index_10" [style=solid, label="(225, 24)"]; -"1639 index_10" -> "1640 view_56" [style=solid, label="(4096, 24)"]; -"1640 view_56" -> "1641 permute_46" [style=solid, label="(64, 64, 24)"]; -"1641 permute_46" -> "1642 contiguous_18" [style=solid, label="(24, 64, 64)"]; -"1642 contiguous_18" -> "1643 unsqueeze_30" [style=solid, label="(24, 64, 64)"]; -"1643 unsqueeze_30" -> "1644 sigmoid_10" [style=solid, label="(1, 24, 64, 64)"]; -"1644 sigmoid_10" -> "1645 quantize_per_tensor_636" [style=solid, label="(1, 24, 64, 64)"]; -"1645 quantize_per_tensor_636" -> "1646 dequantize_per_tensor_637" [style=solid, label="(1, 24, 64, 64)"]; -"1646 dequantize_per_tensor_637" -> "1649 mul_20" [style=solid, label="(1, 24, 64, 64)"]; -"1647 _frozen_param97" -> "1648 dequantize_per_tensor_638" [style=solid, label="()"]; -"1648 dequantize_per_tensor_638" -> "1649 mul_20" [style=solid, label="()"]; -"1649 mul_20" -> "1650 quantize_per_tensor_639" [style=solid, label="(1, 24, 64, 64)"]; -"1650 quantize_per_tensor_639" -> "1651 dequantize_per_tensor_640" [style=solid, label="(1, 24, 64, 64)"]; -"1651 dequantize_per_tensor_640" -> "1687 add_35" [style=solid, label="(1, 24, 64, 64)"]; -"1652 pad_13" -> "1653 view_57" [style=solid, label="(1, 8, 8, 768)"]; -"1653 view_57" -> "1654 permute_47" [style=solid, label="(1, 1, 8, 1, 8, 768)"]; -"1654 permute_47" -> "1655 reshape_45" [style=solid, label="(1, 1, 1, 8, 8, 768)"]; -"1655 reshape_45" -> "1657 reshape_45_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 64, 768)"]; -"1656 clone_10" -> "1662 linear_65" [style=solid, label="(2304,)"]; -"1657 reshape_45_0_0_nncf_smooth_quant_0" -> "1658 quantize_per_tensor_641" [style=solid, label="(1, 64, 768)"]; -"1658 quantize_per_tensor_641" -> "1659 dequantize_per_tensor_642" [style=solid, label="(1, 64, 768)"]; -"1659 dequantize_per_tensor_642" -> "1662 linear_65" 
[style=solid, label="(1, 64, 768)"]; -"1660 _frozen_param98" -> "1661 dequantize_per_tensor_643" [style=solid, label="(2304, 768)"]; -"1661 dequantize_per_tensor_643" -> "1662 linear_65" [style=solid, label="(2304, 768)"]; -"1662 linear_65" -> "1663 quantize_per_tensor_644" [style=solid, label="(1, 64, 2304)"]; -"1663 quantize_per_tensor_644" -> "1664 dequantize_per_tensor_645" [style=solid, label="(1, 64, 2304)"]; -"1664 dequantize_per_tensor_645" -> "1665 reshape_46" [style=solid, label="(1, 64, 2304)"]; -"1665 reshape_46" -> "1666 permute_48" [style=solid, label="(1, 64, 3, 24, 32)"]; -"1666 permute_48" -> "1667 select_30" [style=solid, label="(3, 1, 24, 64, 32)"]; -"1666 permute_48" -> "1668 select_31" [style=solid, label="(3, 1, 24, 64, 32)"]; -"1666 permute_48" -> "1669 select_32" [style=solid, label="(3, 1, 24, 64, 32)"]; -"1667 select_30" -> "1670 linalg_vector_norm_20" [style=solid, label="(1, 24, 64, 32)"]; -"1667 select_30" -> "1672 expand_as_20" [style=solid, label="(1, 24, 64, 32)"]; -"1667 select_30" -> "1673 div_20" [style=solid, label="(1, 24, 64, 32)"]; -"1668 select_31" -> "1674 linalg_vector_norm_21" [style=solid, label="(1, 24, 64, 32)"]; -"1668 select_31" -> "1676 expand_as_21" [style=solid, label="(1, 24, 64, 32)"]; -"1668 select_31" -> "1677 div_21" [style=solid, label="(1, 24, 64, 32)"]; -"1669 select_32" -> "1692 matmul_21" [style=solid, label="(1, 24, 64, 32)"]; -"1670 linalg_vector_norm_20" -> "1671 clamp_min_20" [style=solid, label="(1, 24, 64, 1)"]; -"1671 clamp_min_20" -> "1672 expand_as_20" [style=solid, label="(1, 24, 64, 1)"]; -"1672 expand_as_20" -> "1673 div_20" [style=solid, label="(1, 24, 64, 32)"]; -"1673 div_20" -> "1679 matmul_20" [style=solid, label="(1, 24, 64, 32)"]; -"1674 linalg_vector_norm_21" -> "1675 clamp_min_21" [style=solid, label="(1, 24, 64, 1)"]; -"1675 clamp_min_21" -> "1676 expand_as_21" [style=solid, label="(1, 24, 64, 1)"]; -"1676 expand_as_21" -> "1677 div_21" [style=solid, label="(1, 24, 64, 32)"]; -"1677 
div_21" -> "1678 transpose_20" [style=solid, label="(1, 24, 64, 32)"]; -"1678 transpose_20" -> "1679 matmul_20" [style=solid, label="(1, 24, 32, 64)"]; -"1679 matmul_20" -> "1680 quantize_per_tensor_646" [style=solid, label="(1, 24, 64, 64)"]; -"1680 quantize_per_tensor_646" -> "1681 dequantize_per_tensor_647" [style=solid, label="(1, 24, 64, 64)"]; -"1681 dequantize_per_tensor_647" -> "1684 mul_21" [style=solid, label="(1, 24, 64, 64)"]; -"1682 _frozen_param99" -> "1683 dequantize_per_tensor_648" [style=solid, label="(24, 1, 1)"]; -"1683 dequantize_per_tensor_648" -> "1684 mul_21" [style=solid, label="(24, 1, 1)"]; -"1684 mul_21" -> "1685 quantize_per_tensor_649" [style=solid, label="(1, 24, 64, 64)"]; -"1685 quantize_per_tensor_649" -> "1686 dequantize_per_tensor_650" [style=solid, label="(1, 24, 64, 64)"]; -"1686 dequantize_per_tensor_650" -> "1687 add_35" [style=solid, label="(1, 24, 64, 64)"]; -"1687 add_35" -> "1688 quantize_per_tensor_651" [style=solid, label="(1, 24, 64, 64)"]; -"1688 quantize_per_tensor_651" -> "1689 dequantize_per_tensor_652" [style=solid, label="(1, 24, 64, 64)"]; -"1689 dequantize_per_tensor_652" -> "1690 softmax_10" [style=solid, label="(1, 24, 64, 64)"]; -"1690 softmax_10" -> "1691 dropout_40" [style=solid, label="(1, 24, 64, 64)"]; -"1691 dropout_40" -> "1692 matmul_21" [style=solid, label="(1, 24, 64, 64)"]; -"1692 matmul_21" -> "1693 transpose_21" [style=solid, label="(1, 24, 64, 32)"]; -"1693 transpose_21" -> "1694 reshape_47" [style=solid, label="(1, 64, 24, 32)"]; -"1694 reshape_47" -> "1695 reshape_47_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 64, 768)"]; -"1695 reshape_47_0_0_nncf_smooth_quant_0" -> "1696 quantize_per_tensor_653" [style=solid, label="(1, 64, 768)"]; -"1696 quantize_per_tensor_653" -> "1697 dequantize_per_tensor_654" [style=solid, label="(1, 64, 768)"]; -"1697 dequantize_per_tensor_654" -> "1700 linear_66" [style=solid, label="(1, 64, 768)"]; -"1698 _frozen_param100" -> "1699 dequantize_per_tensor_655" 
[style=solid, label="(768, 768)"]; -"1699 dequantize_per_tensor_655" -> "1700 linear_66" [style=solid, label="(768, 768)"]; -"1700 linear_66" -> "1701 quantize_per_tensor_656" [style=solid, label="(1, 64, 768)"]; -"1701 quantize_per_tensor_656" -> "1702 dequantize_per_tensor_657" [style=solid, label="(1, 64, 768)"]; -"1702 dequantize_per_tensor_657" -> "1703 dropout_41" [style=solid, label="(1, 64, 768)"]; -"1703 dropout_41" -> "1704 view_58" [style=solid, label="(1, 64, 768)"]; -"1704 view_58" -> "1705 permute_49" [style=solid, label="(1, 1, 1, 8, 8, 768)"]; -"1705 permute_49" -> "1706 reshape_48" [style=solid, label="(1, 1, 8, 1, 8, 768)"]; -"1706 reshape_48" -> "1707 slice_174" [style=solid, label="(1, 8, 8, 768)"]; -"1707 slice_174" -> "1708 slice_175" [style=solid, label="(1, 8, 8, 768)"]; -"1708 slice_175" -> "1709 slice_176" [style=solid, label="(1, 7, 8, 768)"]; -"1709 slice_176" -> "1710 slice_177" [style=solid, label="(1, 7, 7, 768)"]; -"1710 slice_177" -> "1711 contiguous_19" [style=solid, label="(1, 7, 7, 768)"]; -"1711 contiguous_19" -> "1712 layer_norm_24" [style=solid, label="(1, 7, 7, 768)"]; -"1712 layer_norm_24" -> "1713 quantize_per_tensor_658" [style=solid, label="(1, 7, 7, 768)"]; -"1713 quantize_per_tensor_658" -> "1714 dequantize_per_tensor_659" [style=solid, label="(1, 7, 7, 768)"]; -"1714 dequantize_per_tensor_659" -> "1717 add_36" [style=solid, label="(1, 7, 7, 768)"]; -"1715 quantize_per_tensor_660" -> "1716 dequantize_per_tensor_661" [style=solid, label="(1, 7, 7, 768)"]; -"1716 dequantize_per_tensor_661" -> "1717 add_36" [style=solid, label="(1, 7, 7, 768)"]; -"1717 add_36" -> "1718 quantize_per_tensor_662" [style=solid, label="(1, 7, 7, 768)"]; -"1718 quantize_per_tensor_662" -> "1719 dequantize_per_tensor_663" [style=solid, label="(1, 7, 7, 768)"]; -"1718 quantize_per_tensor_662" -> "1720 dequantize_per_tensor_664" [style=solid, label="(1, 7, 7, 768)"]; -"1719 dequantize_per_tensor_663" -> "1743 add_37" [style=solid, label="(1, 7, 7, 
768)"]; -"1720 dequantize_per_tensor_664" -> "1721 add_36_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 7, 7, 768)"]; -"1721 add_36_0_0_nncf_smooth_quant_0" -> "1722 quantize_per_tensor_665" [style=solid, label="(1, 7, 7, 768)"]; -"1722 quantize_per_tensor_665" -> "1723 dequantize_per_tensor_666" [style=solid, label="(1, 7, 7, 768)"]; -"1723 dequantize_per_tensor_666" -> "1726 linear_67" [style=solid, label="(1, 7, 7, 768)"]; -"1724 _frozen_param101" -> "1725 dequantize_per_tensor_667" [style=solid, label="(3072, 768)"]; -"1725 dequantize_per_tensor_667" -> "1726 linear_67" [style=solid, label="(3072, 768)"]; -"1726 linear_67" -> "1727 quantize_per_tensor_668" [style=solid, label="(1, 7, 7, 3072)"]; -"1727 quantize_per_tensor_668" -> "1728 dequantize_per_tensor_669" [style=solid, label="(1, 7, 7, 3072)"]; -"1728 dequantize_per_tensor_669" -> "1729 gelu_10" [style=solid, label="(1, 7, 7, 3072)"]; -"1729 gelu_10" -> "1730 dropout_42" [style=solid, label="(1, 7, 7, 3072)"]; -"1730 dropout_42" -> "1731 dropout_42_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 7, 7, 3072)"]; -"1731 dropout_42_0_0_nncf_smooth_quant_0" -> "1732 quantize_per_tensor_670" [style=solid, label="(1, 7, 7, 3072)"]; -"1732 quantize_per_tensor_670" -> "1733 dequantize_per_tensor_671" [style=solid, label="(1, 7, 7, 3072)"]; -"1733 dequantize_per_tensor_671" -> "1736 linear_68" [style=solid, label="(1, 7, 7, 3072)"]; -"1734 _frozen_param102" -> "1735 dequantize_per_tensor_672" [style=solid, label="(768, 3072)"]; -"1735 dequantize_per_tensor_672" -> "1736 linear_68" [style=solid, label="(768, 3072)"]; -"1736 linear_68" -> "1737 quantize_per_tensor_673" [style=solid, label="(1, 7, 7, 768)"]; -"1737 quantize_per_tensor_673" -> "1738 dequantize_per_tensor_674" [style=solid, label="(1, 7, 7, 768)"]; -"1738 dequantize_per_tensor_674" -> "1739 dropout_43" [style=solid, label="(1, 7, 7, 768)"]; -"1739 dropout_43" -> "1740 layer_norm_25" [style=solid, label="(1, 7, 7, 768)"]; -"1740 layer_norm_25" -> 
"1741 quantize_per_tensor_675" [style=solid, label="(1, 7, 7, 768)"]; -"1741 quantize_per_tensor_675" -> "1742 dequantize_per_tensor_676" [style=solid, label="(1, 7, 7, 768)"]; -"1742 dequantize_per_tensor_676" -> "1743 add_37" [style=solid, label="(1, 7, 7, 768)"]; -"1743 add_37" -> "1744 quantize_per_tensor_677" [style=solid, label="(1, 7, 7, 768)"]; -"1744 quantize_per_tensor_677" -> "1745 dequantize_per_tensor_678" [style=solid, label="(1, 7, 7, 768)"]; -"1744 quantize_per_tensor_677" -> "1746 dequantize_per_tensor_679" [style=solid, label="(1, 7, 7, 768)"]; -"1745 dequantize_per_tensor_678" -> "1842 add_39" [style=solid, label="(1, 7, 7, 768)"]; -"1746 dequantize_per_tensor_679" -> "1779 pad_14" [style=solid, label="(1, 7, 7, 768)"]; -"1747 _frozen_param103" -> "1748 dequantize_per_tensor_680" [style=solid, label="(1, 15, 15, 2)"]; -"1748 dequantize_per_tensor_680" -> "1751 linear_69" [style=solid, label="(1, 15, 15, 2)"]; -"1749 _frozen_param104" -> "1750 dequantize_per_tensor_681" [style=solid, label="(512, 2)"]; -"1750 dequantize_per_tensor_681" -> "1751 linear_69" [style=solid, label="(512, 2)"]; -"1751 linear_69" -> "1752 relu__11" [style=solid, label="(1, 15, 15, 512)"]; -"1752 relu__11" -> "1753 quantize_per_tensor_682" [style=solid, label="(1, 15, 15, 512)"]; -"1753 quantize_per_tensor_682" -> "1754 dequantize_per_tensor_683" [style=solid, label="(1, 15, 15, 512)"]; -"1754 dequantize_per_tensor_683" -> "1755 relu__11_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 15, 15, 512)"]; -"1755 relu__11_0_0_nncf_smooth_quant_0" -> "1756 quantize_per_tensor_684" [style=solid, label="(1, 15, 15, 512)"]; -"1756 quantize_per_tensor_684" -> "1757 dequantize_per_tensor_685" [style=solid, label="(1, 15, 15, 512)"]; -"1757 dequantize_per_tensor_685" -> "1760 linear_70" [style=solid, label="(1, 15, 15, 512)"]; -"1758 _frozen_param105" -> "1759 dequantize_per_tensor_686" [style=solid, label="(24, 512)"]; -"1759 dequantize_per_tensor_686" -> "1760 linear_70" 
[style=solid, label="(24, 512)"]; -"1760 linear_70" -> "1761 quantize_per_tensor_687" [style=solid, label="(1, 15, 15, 24)"]; -"1761 quantize_per_tensor_687" -> "1762 dequantize_per_tensor_688" [style=solid, label="(1, 15, 15, 24)"]; -"1762 dequantize_per_tensor_688" -> "1763 view_59" [style=solid, label="(1, 15, 15, 24)"]; -"1763 view_59" -> "1764 quantize_per_tensor_689" [style=solid, label="(225, 24)"]; -"1764 quantize_per_tensor_689" -> "1765 dequantize_per_tensor_690" [style=solid, label="(225, 24)"]; -"1765 dequantize_per_tensor_690" -> "1766 index_11" [style=solid, label="(225, 24)"]; -"1766 index_11" -> "1767 view_60" [style=solid, label="(4096, 24)"]; -"1767 view_60" -> "1768 permute_50" [style=solid, label="(64, 64, 24)"]; -"1768 permute_50" -> "1769 contiguous_20" [style=solid, label="(24, 64, 64)"]; -"1769 contiguous_20" -> "1770 unsqueeze_31" [style=solid, label="(24, 64, 64)"]; -"1770 unsqueeze_31" -> "1771 sigmoid_11" [style=solid, label="(1, 24, 64, 64)"]; -"1771 sigmoid_11" -> "1772 quantize_per_tensor_691" [style=solid, label="(1, 24, 64, 64)"]; -"1772 quantize_per_tensor_691" -> "1773 dequantize_per_tensor_692" [style=solid, label="(1, 24, 64, 64)"]; -"1773 dequantize_per_tensor_692" -> "1776 mul_22" [style=solid, label="(1, 24, 64, 64)"]; -"1774 _frozen_param106" -> "1775 dequantize_per_tensor_693" [style=solid, label="()"]; -"1775 dequantize_per_tensor_693" -> "1776 mul_22" [style=solid, label="()"]; -"1776 mul_22" -> "1777 quantize_per_tensor_694" [style=solid, label="(1, 24, 64, 64)"]; -"1777 quantize_per_tensor_694" -> "1778 dequantize_per_tensor_695" [style=solid, label="(1, 24, 64, 64)"]; -"1778 dequantize_per_tensor_695" -> "1814 add_38" [style=solid, label="(1, 24, 64, 64)"]; -"1779 pad_14" -> "1780 view_61" [style=solid, label="(1, 8, 8, 768)"]; -"1780 view_61" -> "1781 permute_51" [style=solid, label="(1, 1, 8, 1, 8, 768)"]; -"1781 permute_51" -> "1782 reshape_49" [style=solid, label="(1, 1, 1, 8, 8, 768)"]; -"1782 reshape_49" -> "1784 
reshape_49_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 64, 768)"]; -"1783 clone_11" -> "1789 linear_71" [style=solid, label="(2304,)"]; -"1784 reshape_49_0_0_nncf_smooth_quant_0" -> "1785 quantize_per_tensor_696" [style=solid, label="(1, 64, 768)"]; -"1785 quantize_per_tensor_696" -> "1786 dequantize_per_tensor_697" [style=solid, label="(1, 64, 768)"]; -"1786 dequantize_per_tensor_697" -> "1789 linear_71" [style=solid, label="(1, 64, 768)"]; -"1787 _frozen_param107" -> "1788 dequantize_per_tensor_698" [style=solid, label="(2304, 768)"]; -"1788 dequantize_per_tensor_698" -> "1789 linear_71" [style=solid, label="(2304, 768)"]; -"1789 linear_71" -> "1790 quantize_per_tensor_699" [style=solid, label="(1, 64, 2304)"]; -"1790 quantize_per_tensor_699" -> "1791 dequantize_per_tensor_700" [style=solid, label="(1, 64, 2304)"]; -"1791 dequantize_per_tensor_700" -> "1792 reshape_50" [style=solid, label="(1, 64, 2304)"]; -"1792 reshape_50" -> "1793 permute_52" [style=solid, label="(1, 64, 3, 24, 32)"]; -"1793 permute_52" -> "1794 select_33" [style=solid, label="(3, 1, 24, 64, 32)"]; -"1793 permute_52" -> "1795 select_34" [style=solid, label="(3, 1, 24, 64, 32)"]; -"1793 permute_52" -> "1796 select_35" [style=solid, label="(3, 1, 24, 64, 32)"]; -"1794 select_33" -> "1797 linalg_vector_norm_22" [style=solid, label="(1, 24, 64, 32)"]; -"1794 select_33" -> "1799 expand_as_22" [style=solid, label="(1, 24, 64, 32)"]; -"1794 select_33" -> "1800 div_22" [style=solid, label="(1, 24, 64, 32)"]; -"1795 select_34" -> "1801 linalg_vector_norm_23" [style=solid, label="(1, 24, 64, 32)"]; -"1795 select_34" -> "1803 expand_as_23" [style=solid, label="(1, 24, 64, 32)"]; -"1795 select_34" -> "1804 div_23" [style=solid, label="(1, 24, 64, 32)"]; -"1796 select_35" -> "1819 matmul_23" [style=solid, label="(1, 24, 64, 32)"]; -"1797 linalg_vector_norm_22" -> "1798 clamp_min_22" [style=solid, label="(1, 24, 64, 1)"]; -"1798 clamp_min_22" -> "1799 expand_as_22" [style=solid, label="(1, 24, 64, 
1)"]; -"1799 expand_as_22" -> "1800 div_22" [style=solid, label="(1, 24, 64, 32)"]; -"1800 div_22" -> "1806 matmul_22" [style=solid, label="(1, 24, 64, 32)"]; -"1801 linalg_vector_norm_23" -> "1802 clamp_min_23" [style=solid, label="(1, 24, 64, 1)"]; -"1802 clamp_min_23" -> "1803 expand_as_23" [style=solid, label="(1, 24, 64, 1)"]; -"1803 expand_as_23" -> "1804 div_23" [style=solid, label="(1, 24, 64, 32)"]; -"1804 div_23" -> "1805 transpose_22" [style=solid, label="(1, 24, 64, 32)"]; -"1805 transpose_22" -> "1806 matmul_22" [style=solid, label="(1, 24, 32, 64)"]; -"1806 matmul_22" -> "1807 quantize_per_tensor_701" [style=solid, label="(1, 24, 64, 64)"]; -"1807 quantize_per_tensor_701" -> "1808 dequantize_per_tensor_702" [style=solid, label="(1, 24, 64, 64)"]; -"1808 dequantize_per_tensor_702" -> "1811 mul_23" [style=solid, label="(1, 24, 64, 64)"]; -"1809 _frozen_param108" -> "1810 dequantize_per_tensor_703" [style=solid, label="(24, 1, 1)"]; -"1810 dequantize_per_tensor_703" -> "1811 mul_23" [style=solid, label="(24, 1, 1)"]; -"1811 mul_23" -> "1812 quantize_per_tensor_704" [style=solid, label="(1, 24, 64, 64)"]; -"1812 quantize_per_tensor_704" -> "1813 dequantize_per_tensor_705" [style=solid, label="(1, 24, 64, 64)"]; -"1813 dequantize_per_tensor_705" -> "1814 add_38" [style=solid, label="(1, 24, 64, 64)"]; -"1814 add_38" -> "1815 quantize_per_tensor_706" [style=solid, label="(1, 24, 64, 64)"]; -"1815 quantize_per_tensor_706" -> "1816 dequantize_per_tensor_707" [style=solid, label="(1, 24, 64, 64)"]; -"1816 dequantize_per_tensor_707" -> "1817 softmax_11" [style=solid, label="(1, 24, 64, 64)"]; -"1817 softmax_11" -> "1818 dropout_44" [style=solid, label="(1, 24, 64, 64)"]; -"1818 dropout_44" -> "1819 matmul_23" [style=solid, label="(1, 24, 64, 64)"]; -"1819 matmul_23" -> "1820 transpose_23" [style=solid, label="(1, 24, 64, 32)"]; -"1820 transpose_23" -> "1821 reshape_51" [style=solid, label="(1, 64, 24, 32)"]; -"1821 reshape_51" -> "1822 
reshape_51_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 64, 768)"]; -"1822 reshape_51_0_0_nncf_smooth_quant_0" -> "1823 quantize_per_tensor_708" [style=solid, label="(1, 64, 768)"]; -"1823 quantize_per_tensor_708" -> "1824 dequantize_per_tensor_709" [style=solid, label="(1, 64, 768)"]; -"1824 dequantize_per_tensor_709" -> "1827 linear_72" [style=solid, label="(1, 64, 768)"]; -"1825 _frozen_param109" -> "1826 dequantize_per_tensor_710" [style=solid, label="(768, 768)"]; -"1826 dequantize_per_tensor_710" -> "1827 linear_72" [style=solid, label="(768, 768)"]; -"1827 linear_72" -> "1828 quantize_per_tensor_711" [style=solid, label="(1, 64, 768)"]; -"1828 quantize_per_tensor_711" -> "1829 dequantize_per_tensor_712" [style=solid, label="(1, 64, 768)"]; -"1829 dequantize_per_tensor_712" -> "1830 dropout_45" [style=solid, label="(1, 64, 768)"]; -"1830 dropout_45" -> "1831 view_62" [style=solid, label="(1, 64, 768)"]; -"1831 view_62" -> "1832 permute_53" [style=solid, label="(1, 1, 1, 8, 8, 768)"]; -"1832 permute_53" -> "1833 reshape_52" [style=solid, label="(1, 1, 8, 1, 8, 768)"]; -"1833 reshape_52" -> "1834 slice_179" [style=solid, label="(1, 8, 8, 768)"]; -"1834 slice_179" -> "1835 slice_180" [style=solid, label="(1, 8, 8, 768)"]; -"1835 slice_180" -> "1836 slice_181" [style=solid, label="(1, 7, 8, 768)"]; -"1836 slice_181" -> "1837 slice_182" [style=solid, label="(1, 7, 7, 768)"]; -"1837 slice_182" -> "1838 contiguous_21" [style=solid, label="(1, 7, 7, 768)"]; -"1838 contiguous_21" -> "1839 layer_norm_26" [style=solid, label="(1, 7, 7, 768)"]; -"1839 layer_norm_26" -> "1840 quantize_per_tensor_713" [style=solid, label="(1, 7, 7, 768)"]; -"1840 quantize_per_tensor_713" -> "1841 dequantize_per_tensor_714" [style=solid, label="(1, 7, 7, 768)"]; -"1841 dequantize_per_tensor_714" -> "1842 add_39" [style=solid, label="(1, 7, 7, 768)"]; -"1842 add_39" -> "1843 quantize_per_tensor_715" [style=solid, label="(1, 7, 7, 768)"]; -"1843 quantize_per_tensor_715" -> "1844 
dequantize_per_tensor_716" [style=solid, label="(1, 7, 7, 768)"]; -"1843 quantize_per_tensor_715" -> "1845 dequantize_per_tensor_717" [style=solid, label="(1, 7, 7, 768)"]; -"1844 dequantize_per_tensor_716" -> "1868 add_40" [style=solid, label="(1, 7, 7, 768)"]; -"1845 dequantize_per_tensor_717" -> "1846 add_39_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 7, 7, 768)"]; -"1846 add_39_0_0_nncf_smooth_quant_0" -> "1847 quantize_per_tensor_718" [style=solid, label="(1, 7, 7, 768)"]; -"1847 quantize_per_tensor_718" -> "1848 dequantize_per_tensor_719" [style=solid, label="(1, 7, 7, 768)"]; -"1848 dequantize_per_tensor_719" -> "1851 linear_73" [style=solid, label="(1, 7, 7, 768)"]; -"1849 _frozen_param110" -> "1850 dequantize_per_tensor_720" [style=solid, label="(3072, 768)"]; -"1850 dequantize_per_tensor_720" -> "1851 linear_73" [style=solid, label="(3072, 768)"]; -"1851 linear_73" -> "1852 quantize_per_tensor_721" [style=solid, label="(1, 7, 7, 3072)"]; -"1852 quantize_per_tensor_721" -> "1853 dequantize_per_tensor_722" [style=solid, label="(1, 7, 7, 3072)"]; -"1853 dequantize_per_tensor_722" -> "1854 gelu_11" [style=solid, label="(1, 7, 7, 3072)"]; -"1854 gelu_11" -> "1855 dropout_46" [style=solid, label="(1, 7, 7, 3072)"]; -"1855 dropout_46" -> "1856 dropout_46_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 7, 7, 3072)"]; -"1856 dropout_46_0_0_nncf_smooth_quant_0" -> "1857 quantize_per_tensor_723" [style=solid, label="(1, 7, 7, 3072)"]; -"1857 quantize_per_tensor_723" -> "1858 dequantize_per_tensor_724" [style=solid, label="(1, 7, 7, 3072)"]; -"1858 dequantize_per_tensor_724" -> "1861 linear_74" [style=solid, label="(1, 7, 7, 3072)"]; -"1859 _frozen_param111" -> "1860 dequantize_per_tensor_725" [style=solid, label="(768, 3072)"]; -"1860 dequantize_per_tensor_725" -> "1861 linear_74" [style=solid, label="(768, 3072)"]; -"1861 linear_74" -> "1862 quantize_per_tensor_726" [style=solid, label="(1, 7, 7, 768)"]; -"1862 quantize_per_tensor_726" -> "1863 
dequantize_per_tensor_727" [style=solid, label="(1, 7, 7, 768)"]; -"1863 dequantize_per_tensor_727" -> "1864 dropout_47" [style=solid, label="(1, 7, 7, 768)"]; -"1864 dropout_47" -> "1865 layer_norm_27" [style=solid, label="(1, 7, 7, 768)"]; -"1865 layer_norm_27" -> "1866 quantize_per_tensor_728" [style=solid, label="(1, 7, 7, 768)"]; -"1866 quantize_per_tensor_728" -> "1867 dequantize_per_tensor_729" [style=solid, label="(1, 7, 7, 768)"]; -"1867 dequantize_per_tensor_729" -> "1868 add_40" [style=solid, label="(1, 7, 7, 768)"]; -"1868 add_40" -> "1869 quantize_per_tensor_730" [style=solid, label="(1, 7, 7, 768)"]; -"1869 quantize_per_tensor_730" -> "1870 dequantize_per_tensor_731" [style=solid, label="(1, 7, 7, 768)"]; -"1870 dequantize_per_tensor_731" -> "1871 layer_norm_28" [style=solid, label="(1, 7, 7, 768)"]; -"1871 layer_norm_28" -> "1872 permute_54" [style=solid, label="(1, 7, 7, 768)"]; -"1872 permute_54" -> "1873 quantize_per_tensor_732" [style=solid, label="(1, 768, 7, 7)"]; -"1873 quantize_per_tensor_732" -> "1874 dequantize_per_tensor_733" [style=solid, label="(1, 768, 7, 7)"]; -"1874 dequantize_per_tensor_733" -> "1875 adaptive_avg_pool2d" [style=solid, label="(1, 768, 7, 7)"]; -"1875 adaptive_avg_pool2d" -> "1876 quantize_per_tensor_734" [style=solid, label="(1, 768, 1, 1)"]; -"1876 quantize_per_tensor_734" -> "1877 dequantize_per_tensor_735" [style=solid, label="(1, 768, 1, 1)"]; -"1877 dequantize_per_tensor_735" -> "1878 flatten" [style=solid, label="(1, 768, 1, 1)"]; -"1878 flatten" -> "1879 quantize_per_tensor_736" [style=solid, label="(1, 768)"]; -"1879 quantize_per_tensor_736" -> "1880 dequantize_per_tensor_737" [style=solid, label="(1, 768)"]; -"1880 dequantize_per_tensor_737" -> "1881 flatten_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 768)"]; -"1881 flatten_0_0_nncf_smooth_quant_0" -> "1882 quantize_per_tensor_738" [style=solid, label="(1, 768)"]; -"1882 quantize_per_tensor_738" -> "1883 dequantize_per_tensor_739" [style=solid, 
label="(1, 768)"]; -"1883 dequantize_per_tensor_739" -> "1886 linear_75" [style=solid, label="(1, 768)"]; -"1884 _frozen_param112" -> "1885 dequantize_per_tensor_740" [style=solid, label="(1000, 768)"]; -"1885 dequantize_per_tensor_740" -> "1886 linear_75" [style=solid, label="(1000, 768)"]; -"1886 linear_75" -> "1887 quantize_per_tensor_741" [style=solid, label="(1, 1000)"]; -"1887 quantize_per_tensor_741" -> "1888 dequantize_per_tensor_742" [style=solid, label="(1, 1000)"]; -"1888 dequantize_per_tensor_742" -> "1889 output" [style=solid, label="(1, 1000)"]; -} diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/swin_v2_t_ref_qconfig.json b/tests/torch2/data/fx/XNNPACKQuantizer/swin_v2_t_ref_qconfig.json deleted file mode 100644 index 949d019ed4c..00000000000 --- a/tests/torch2/data/fx/XNNPACKQuantizer/swin_v2_t_ref_qconfig.json +++ /dev/null @@ -1,2813 +0,0 @@ -{ - "quantization_points": { - "('conv2d',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('permute',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('layer_norm',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear',)_WeightQuantizationInsertionPoint": { - "num_bits": 
8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_1',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('index',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_2',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('mul_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('softmax',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_3',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_2', 'linear_4')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_4',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - 
"per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_5',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_5', 'pad_1')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_6',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_7',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('index_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_4',)_ActivationQuantizationInsertionPoint": { - 
"num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_8',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('softmax_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - 
}, - "('view_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_9',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_6', 'linear_10')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_10',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_11',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - 
"per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('pad_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('cat',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_12',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_12',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('layer_norm_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_13',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_13',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_14',)_ActivationQuantizationInsertionPoint": { - 
"num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_14',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('index_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_15',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_15',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - 
}, - "('softmax_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_16',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_16',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_9', 'linear_17')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_17',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_18',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_18',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, 
- "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_12', 'pad_4')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_19',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_19',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_20',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_20',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_15',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('index_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_6',)_ActivationQuantizationInsertionPoint": { - 
"num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_21',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_21',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape_14',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_19',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('softmax_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_20',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": 
"INT8" - }, - "('linear_22',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_22',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_13',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_12',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_13', 'linear_23')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_23',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_24',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_24',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_15',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_13',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('pad_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_25',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('cat_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_25',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('layer_norm_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_26',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_26',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_27',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('linear_27',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('index_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_22',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_14',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_28',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_28',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape_19',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('softmax_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - 
"per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_29',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_29',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_17',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_15',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_16', 'linear_30')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_30',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_31',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_31',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_19',)_ActivationQuantizationInsertionPoint": 
{ - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_16',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_19', 'pad_7')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_32',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_32',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_33',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_33',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_26',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('index_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - 
"dest_dtype": "INT8" - }, - "('add_17',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_34',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_34',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape_23',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_18',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_30',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_31',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('softmax_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_35',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_35',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_21',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_19',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_20', 'linear_36')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_36',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_37',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_37',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_23',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('add_20',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_22', 'pad_8')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_38',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_38',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_39',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_39',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_33',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('index_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_12',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_21',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - 
"per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_40',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_40',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape_28',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_13',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('softmax_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_41',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_41',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_25',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_22',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_23', 
'linear_42')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_42',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_43',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_43',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_27',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_23',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_26', 'pad_9')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_44',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_44',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - 
"per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_45',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_45',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('index_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_37',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_14',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_24',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_46',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_46',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape_32',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_15',)_ActivationQuantizationInsertionPoint": { - 
"num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_25',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_41',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('softmax_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_42',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_47',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_47',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_29',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_26',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_27', 'linear_48')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - 
"dest_dtype": "INT8" - }, - "('linear_48',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_49',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_49',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_31',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_27',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_29', 'pad_10')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_50',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_50',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_51',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_51',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('index_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_44',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_16',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_28',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_52',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_52',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape_37',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_17',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('softmax_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_53',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_53',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_33',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_29',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_30', 'linear_54')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_54',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_55',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_55',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - 
"per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_35',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_30',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_33', 'pad_11')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_56',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_56',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_57',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_57',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_48',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('index_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_18',)_ActivationQuantizationInsertionPoint": { 
- "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_31',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_58',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_58',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape_41',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_19',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_32',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_52',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_53',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('softmax_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - 
"dest_dtype": "INT8" - }, - "('linear_59',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_59',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_37',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_33',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_34', 'linear_60')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_60',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_61',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_61',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_39',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_34',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('pad_12',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('cat_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_62',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_62',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('layer_norm_23',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_63',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_63',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_64',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('linear_64',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('index_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_55',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_20',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_35',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_65',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_65',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape_46',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_21',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('softmax_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - 
"per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_66',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_66',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_41',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_36',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_37', 'linear_67')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_67',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_68',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_68',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - 
"('dropout_43',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_37',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_39', 'pad_14')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_69',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_69',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_70',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_70',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('index_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_59',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_22',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - 
"per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_38',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_71',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_71',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape_50',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('mul_23',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('softmax_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_72',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_72',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_45',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_39',)_ActivationQuantizationInsertionPoint": { - 
"num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_40', 'linear_73')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_73',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_74',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_74',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_47',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_40',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('layer_norm_28',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('flatten',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - 
"dest_dtype": "INT8" - }, - "('adaptive_avg_pool2d',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_75',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_75',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('output',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - } - }, - "unified_scale_groups": { - "0": [ - 2, - 3 - ], - "1": [ - 8, - 9 - ], - "2": [ - 37, - 38 - ], - "3": [ - 48, - 49 - ], - "4": [ - 51, - 52 - ], - "5": [ - 65, - 66, - 67, - 68, - 69 - ], - "6": [ - 76, - 77 - ], - "7": [ - 105, - 106 - ], - "8": [ - 116, - 117 - ], - "9": [ - 119, - 120 - ], - "10": [ - 133, - 134, - 135, - 136, - 137 - ], - "11": [ - 144, - 145 - ], - "12": [ - 173, - 174 - ], - "13": [ - 184, - 185 - ], - "14": [ - 187, - 188 - ], - "15": [ - 205, - 206 - ], - "16": [ - 233, - 234 - ], - "17": [ - 244, - 245 - ], - "18": [ - 247, - 248 - ], - "19": [ - 265, - 266 - ], - "20": [ - 293, - 294 - ], - "21": [ - 304, - 305 - ], - "22": [ - 307, - 308 - ], - "23": [ - 321, - 322, - 323, - 324, - 325 - ], - "24": [ - 332, - 333 - ], - "25": [ - 361, - 362 - ], - "26": [ - 385, - 386, - 387 - ] - }, - "shared_input_operation_set_groups": {} -} \ No newline at end of file diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/synthetic_transformer.dot b/tests/torch2/data/fx/XNNPACKQuantizer/synthetic_transformer.dot deleted file mode 100644 index 74c4d1d924f..00000000000 --- 
a/tests/torch2/data/fx/XNNPACKQuantizer/synthetic_transformer.dot +++ /dev/null @@ -1,45 +0,0 @@ -strict digraph { -"0 wte_weight" [id=0, type="get_attr"]; -"1 linear_bias" [id=1, type="get_attr"]; -"2 lm_head_bias" [id=2, type="get_attr"]; -"3 input_ids" [id=3, type=input]; -"4 embedding" [id=4, type=embedding]; -"5 embedding_0_0_nncf_smooth_quant_0" [id=5, type="call_module"]; -"6 quantize_per_tensor_0" [id=6, type="quantize_per_tensor"]; -"7 dequantize_per_tensor_1" [id=7, type="dequantize_per_tensor"]; -"8 _frozen_param0" [id=8, type="get_attr"]; -"9 dequantize_per_tensor_2" [id=9, type="dequantize_per_tensor"]; -"10 linear" [id=10, type=linear]; -"11 quantize_per_tensor_3" [id=11, type="quantize_per_tensor"]; -"12 dequantize_per_tensor_4" [id=12, type="dequantize_per_tensor"]; -"13 linear_0_0_nncf_smooth_quant_0" [id=13, type="call_module"]; -"14 quantize_per_tensor_5" [id=14, type="quantize_per_tensor"]; -"15 dequantize_per_tensor_6" [id=15, type="dequantize_per_tensor"]; -"16 _frozen_param1" [id=16, type="get_attr"]; -"17 dequantize_per_tensor_7" [id=17, type="dequantize_per_tensor"]; -"18 linear_1" [id=18, type=linear]; -"19 quantize_per_tensor_8" [id=19, type="quantize_per_tensor"]; -"20 dequantize_per_tensor_9" [id=20, type="dequantize_per_tensor"]; -"21 output" [id=21, type=output]; -"0 wte_weight" -> "4 embedding" [style=solid, label="(10, 5)"]; -"1 linear_bias" -> "10 linear" [style=solid, label="(5,)"]; -"2 lm_head_bias" -> "18 linear_1" [style=solid, label="(10,)"]; -"3 input_ids" -> "4 embedding" [style=solid, label="(5,)"]; -"4 embedding" -> "5 embedding_0_0_nncf_smooth_quant_0" [style=solid, label="(5, 5)"]; -"5 embedding_0_0_nncf_smooth_quant_0" -> "6 quantize_per_tensor_0" [style=solid, label="(5, 5)"]; -"6 quantize_per_tensor_0" -> "7 dequantize_per_tensor_1" [style=solid, label="(5, 5)"]; -"7 dequantize_per_tensor_1" -> "10 linear" [style=solid, label="(5, 5)"]; -"8 _frozen_param0" -> "9 dequantize_per_tensor_2" [style=solid, label="(5, 5)"]; 
-"9 dequantize_per_tensor_2" -> "10 linear" [style=solid, label="(5, 5)"]; -"10 linear" -> "11 quantize_per_tensor_3" [style=solid, label="(5, 5)"]; -"11 quantize_per_tensor_3" -> "12 dequantize_per_tensor_4" [style=solid, label="(5, 5)"]; -"12 dequantize_per_tensor_4" -> "13 linear_0_0_nncf_smooth_quant_0" [style=solid, label="(5, 5)"]; -"13 linear_0_0_nncf_smooth_quant_0" -> "14 quantize_per_tensor_5" [style=solid, label="(5, 5)"]; -"14 quantize_per_tensor_5" -> "15 dequantize_per_tensor_6" [style=solid, label="(5, 5)"]; -"15 dequantize_per_tensor_6" -> "18 linear_1" [style=solid, label="(5, 5)"]; -"16 _frozen_param1" -> "17 dequantize_per_tensor_7" [style=solid, label="(10, 5)"]; -"17 dequantize_per_tensor_7" -> "18 linear_1" [style=solid, label="(10, 5)"]; -"18 linear_1" -> "19 quantize_per_tensor_8" [style=solid, label="(5, 10)"]; -"19 quantize_per_tensor_8" -> "20 dequantize_per_tensor_9" [style=solid, label="(5, 10)"]; -"20 dequantize_per_tensor_9" -> "21 output" [style=solid, label="(5, 10)"]; -} diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/synthetic_transformer_ref_qconfig.json b/tests/torch2/data/fx/XNNPACKQuantizer/synthetic_transformer_ref_qconfig.json deleted file mode 100644 index 44834aa7270..00000000000 --- a/tests/torch2/data/fx/XNNPACKQuantizer/synthetic_transformer_ref_qconfig.json +++ /dev/null @@ -1,46 +0,0 @@ -{ - "quantization_points": { - "('linear',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('linear_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - 
}, - "('linear_1',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('output',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - } - }, - "unified_scale_groups": {}, - "shared_input_operation_set_groups": {} -} \ No newline at end of file diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/unet.dot b/tests/torch2/data/fx/XNNPACKQuantizer/unet.dot deleted file mode 100644 index 29115539b56..00000000000 --- a/tests/torch2/data/fx/XNNPACKQuantizer/unet.dot +++ /dev/null @@ -1,421 +0,0 @@ -strict digraph { -"0 down_path_0_block_0_bias" [id=0, type="get_attr"]; -"1 down_path_0_block_3_bias" [id=1, type="get_attr"]; -"2 down_path_1_block_0_bias" [id=2, type="get_attr"]; -"3 down_path_1_block_3_bias" [id=3, type="get_attr"]; -"4 down_path_2_block_0_bias" [id=4, type="get_attr"]; -"5 down_path_2_block_3_bias" [id=5, type="get_attr"]; -"6 down_path_3_block_0_bias" [id=6, type="get_attr"]; -"7 down_path_3_block_3_bias" [id=7, type="get_attr"]; -"8 down_path_4_block_0_bias" [id=8, type="get_attr"]; -"9 down_path_4_block_3_bias" [id=9, type="get_attr"]; -"10 up_path_0_up_weight" [id=10, type="get_attr"]; -"11 up_path_0_up_bias" [id=11, type="get_attr"]; -"12 up_path_0_conv_block_block_0_bias" [id=12, type="get_attr"]; -"13 up_path_0_conv_block_block_3_bias" [id=13, type="get_attr"]; -"14 up_path_1_up_weight" [id=14, type="get_attr"]; -"15 up_path_1_up_bias" [id=15, type="get_attr"]; -"16 up_path_1_conv_block_block_0_bias" [id=16, type="get_attr"]; -"17 up_path_1_conv_block_block_3_bias" [id=17, type="get_attr"]; -"18 up_path_2_up_weight" [id=18, type="get_attr"]; -"19 up_path_2_up_bias" [id=19, type="get_attr"]; -"20 up_path_2_conv_block_block_0_bias" [id=20, type="get_attr"]; -"21 
up_path_2_conv_block_block_3_bias" [id=21, type="get_attr"]; -"22 up_path_3_up_weight" [id=22, type="get_attr"]; -"23 up_path_3_up_bias" [id=23, type="get_attr"]; -"24 up_path_3_conv_block_block_0_bias" [id=24, type="get_attr"]; -"25 up_path_3_conv_block_block_3_bias" [id=25, type="get_attr"]; -"26 last_bias" [id=26, type="get_attr"]; -"27 x" [id=27, type=input]; -"28 quantize_per_tensor_0" [id=28, type="quantize_per_tensor"]; -"29 dequantize_per_tensor_1" [id=29, type="dequantize_per_tensor"]; -"30 _frozen_param0" [id=30, type="get_attr"]; -"31 dequantize_per_tensor_2" [id=31, type="dequantize_per_tensor"]; -"32 conv2d" [id=32, type=conv2d]; -"33 relu" [id=33, type=relu]; -"34 quantize_per_tensor_3" [id=34, type="quantize_per_tensor"]; -"35 dequantize_per_tensor_4" [id=35, type="dequantize_per_tensor"]; -"36 _frozen_param1" [id=36, type="get_attr"]; -"37 dequantize_per_tensor_5" [id=37, type="dequantize_per_tensor"]; -"38 conv2d_1" [id=38, type=conv2d]; -"39 relu_1" [id=39, type=relu]; -"40 quantize_per_tensor_6" [id=40, type="quantize_per_tensor"]; -"41 dequantize_per_tensor_7" [id=41, type="dequantize_per_tensor"]; -"42 dequantize_per_tensor_8" [id=42, type="dequantize_per_tensor"]; -"43 max_pool2d" [id=43, type="max_pool2d"]; -"44 quantize_per_tensor_9" [id=44, type="quantize_per_tensor"]; -"45 dequantize_per_tensor_10" [id=45, type="dequantize_per_tensor"]; -"46 _frozen_param2" [id=46, type="get_attr"]; -"47 dequantize_per_tensor_11" [id=47, type="dequantize_per_tensor"]; -"48 conv2d_2" [id=48, type=conv2d]; -"49 relu_2" [id=49, type=relu]; -"50 quantize_per_tensor_12" [id=50, type="quantize_per_tensor"]; -"51 dequantize_per_tensor_13" [id=51, type="dequantize_per_tensor"]; -"52 _frozen_param3" [id=52, type="get_attr"]; -"53 dequantize_per_tensor_14" [id=53, type="dequantize_per_tensor"]; -"54 conv2d_3" [id=54, type=conv2d]; -"55 relu_3" [id=55, type=relu]; -"56 quantize_per_tensor_15" [id=56, type="quantize_per_tensor"]; -"57 dequantize_per_tensor_16" [id=57, 
type="dequantize_per_tensor"]; -"58 dequantize_per_tensor_17" [id=58, type="dequantize_per_tensor"]; -"59 max_pool2d_1" [id=59, type="max_pool2d"]; -"60 quantize_per_tensor_18" [id=60, type="quantize_per_tensor"]; -"61 dequantize_per_tensor_19" [id=61, type="dequantize_per_tensor"]; -"62 _frozen_param4" [id=62, type="get_attr"]; -"63 dequantize_per_tensor_20" [id=63, type="dequantize_per_tensor"]; -"64 conv2d_4" [id=64, type=conv2d]; -"65 relu_4" [id=65, type=relu]; -"66 quantize_per_tensor_21" [id=66, type="quantize_per_tensor"]; -"67 dequantize_per_tensor_22" [id=67, type="dequantize_per_tensor"]; -"68 _frozen_param5" [id=68, type="get_attr"]; -"69 dequantize_per_tensor_23" [id=69, type="dequantize_per_tensor"]; -"70 conv2d_5" [id=70, type=conv2d]; -"71 relu_5" [id=71, type=relu]; -"72 quantize_per_tensor_24" [id=72, type="quantize_per_tensor"]; -"73 dequantize_per_tensor_25" [id=73, type="dequantize_per_tensor"]; -"74 dequantize_per_tensor_26" [id=74, type="dequantize_per_tensor"]; -"75 max_pool2d_2" [id=75, type="max_pool2d"]; -"76 quantize_per_tensor_27" [id=76, type="quantize_per_tensor"]; -"77 dequantize_per_tensor_28" [id=77, type="dequantize_per_tensor"]; -"78 _frozen_param6" [id=78, type="get_attr"]; -"79 dequantize_per_tensor_29" [id=79, type="dequantize_per_tensor"]; -"80 conv2d_6" [id=80, type=conv2d]; -"81 relu_6" [id=81, type=relu]; -"82 quantize_per_tensor_30" [id=82, type="quantize_per_tensor"]; -"83 dequantize_per_tensor_31" [id=83, type="dequantize_per_tensor"]; -"84 _frozen_param7" [id=84, type="get_attr"]; -"85 dequantize_per_tensor_32" [id=85, type="dequantize_per_tensor"]; -"86 conv2d_7" [id=86, type=conv2d]; -"87 relu_7" [id=87, type=relu]; -"88 quantize_per_tensor_33" [id=88, type="quantize_per_tensor"]; -"89 dequantize_per_tensor_34" [id=89, type="dequantize_per_tensor"]; -"90 dequantize_per_tensor_35" [id=90, type="dequantize_per_tensor"]; -"91 max_pool2d_3" [id=91, type="max_pool2d"]; -"92 quantize_per_tensor_36" [id=92, 
type="quantize_per_tensor"]; -"93 dequantize_per_tensor_37" [id=93, type="dequantize_per_tensor"]; -"94 _frozen_param8" [id=94, type="get_attr"]; -"95 dequantize_per_tensor_38" [id=95, type="dequantize_per_tensor"]; -"96 conv2d_8" [id=96, type=conv2d]; -"97 relu_8" [id=97, type=relu]; -"98 quantize_per_tensor_39" [id=98, type="quantize_per_tensor"]; -"99 dequantize_per_tensor_40" [id=99, type="dequantize_per_tensor"]; -"100 _frozen_param9" [id=100, type="get_attr"]; -"101 dequantize_per_tensor_41" [id=101, type="dequantize_per_tensor"]; -"102 conv2d_9" [id=102, type=conv2d]; -"103 relu_9" [id=103, type=relu]; -"104 quantize_per_tensor_42" [id=104, type="quantize_per_tensor"]; -"105 dequantize_per_tensor_43" [id=105, type="dequantize_per_tensor"]; -"106 conv_transpose2d" [id=106, type="conv_transpose2d"]; -"107 quantize_per_tensor_44" [id=107, type="quantize_per_tensor"]; -"108 dequantize_per_tensor_45" [id=108, type="dequantize_per_tensor"]; -"109 slice_1" [id=109, type=slice]; -"110 slice_2" [id=110, type=slice]; -"111 slice_3" [id=111, type=slice]; -"112 slice_4" [id=112, type=slice]; -"113 quantize_per_tensor_46" [id=113, type="quantize_per_tensor"]; -"114 dequantize_per_tensor_47" [id=114, type="dequantize_per_tensor"]; -"115 cat" [id=115, type=cat]; -"116 quantize_per_tensor_48" [id=116, type="quantize_per_tensor"]; -"117 dequantize_per_tensor_49" [id=117, type="dequantize_per_tensor"]; -"118 _frozen_param10" [id=118, type="get_attr"]; -"119 dequantize_per_tensor_50" [id=119, type="dequantize_per_tensor"]; -"120 conv2d_10" [id=120, type=conv2d]; -"121 relu_10" [id=121, type=relu]; -"122 quantize_per_tensor_51" [id=122, type="quantize_per_tensor"]; -"123 dequantize_per_tensor_52" [id=123, type="dequantize_per_tensor"]; -"124 _frozen_param11" [id=124, type="get_attr"]; -"125 dequantize_per_tensor_53" [id=125, type="dequantize_per_tensor"]; -"126 conv2d_11" [id=126, type=conv2d]; -"127 relu_11" [id=127, type=relu]; -"128 quantize_per_tensor_54" [id=128, 
type="quantize_per_tensor"]; -"129 dequantize_per_tensor_55" [id=129, type="dequantize_per_tensor"]; -"130 conv_transpose2d_1" [id=130, type="conv_transpose2d"]; -"131 quantize_per_tensor_56" [id=131, type="quantize_per_tensor"]; -"132 dequantize_per_tensor_57" [id=132, type="dequantize_per_tensor"]; -"133 slice_5" [id=133, type=slice]; -"134 slice_6" [id=134, type=slice]; -"135 slice_7" [id=135, type=slice]; -"136 slice_8" [id=136, type=slice]; -"137 quantize_per_tensor_58" [id=137, type="quantize_per_tensor"]; -"138 dequantize_per_tensor_59" [id=138, type="dequantize_per_tensor"]; -"139 cat_1" [id=139, type=cat]; -"140 quantize_per_tensor_60" [id=140, type="quantize_per_tensor"]; -"141 dequantize_per_tensor_61" [id=141, type="dequantize_per_tensor"]; -"142 _frozen_param12" [id=142, type="get_attr"]; -"143 dequantize_per_tensor_62" [id=143, type="dequantize_per_tensor"]; -"144 conv2d_12" [id=144, type=conv2d]; -"145 relu_12" [id=145, type=relu]; -"146 quantize_per_tensor_63" [id=146, type="quantize_per_tensor"]; -"147 dequantize_per_tensor_64" [id=147, type="dequantize_per_tensor"]; -"148 _frozen_param13" [id=148, type="get_attr"]; -"149 dequantize_per_tensor_65" [id=149, type="dequantize_per_tensor"]; -"150 conv2d_13" [id=150, type=conv2d]; -"151 relu_13" [id=151, type=relu]; -"152 quantize_per_tensor_66" [id=152, type="quantize_per_tensor"]; -"153 dequantize_per_tensor_67" [id=153, type="dequantize_per_tensor"]; -"154 conv_transpose2d_2" [id=154, type="conv_transpose2d"]; -"155 quantize_per_tensor_68" [id=155, type="quantize_per_tensor"]; -"156 dequantize_per_tensor_69" [id=156, type="dequantize_per_tensor"]; -"157 slice_9" [id=157, type=slice]; -"158 slice_10" [id=158, type=slice]; -"159 slice_11" [id=159, type=slice]; -"160 slice_12" [id=160, type=slice]; -"161 quantize_per_tensor_70" [id=161, type="quantize_per_tensor"]; -"162 dequantize_per_tensor_71" [id=162, type="dequantize_per_tensor"]; -"163 cat_2" [id=163, type=cat]; -"164 quantize_per_tensor_72" 
[id=164, type="quantize_per_tensor"]; -"165 dequantize_per_tensor_73" [id=165, type="dequantize_per_tensor"]; -"166 _frozen_param14" [id=166, type="get_attr"]; -"167 dequantize_per_tensor_74" [id=167, type="dequantize_per_tensor"]; -"168 conv2d_14" [id=168, type=conv2d]; -"169 relu_14" [id=169, type=relu]; -"170 quantize_per_tensor_75" [id=170, type="quantize_per_tensor"]; -"171 dequantize_per_tensor_76" [id=171, type="dequantize_per_tensor"]; -"172 _frozen_param15" [id=172, type="get_attr"]; -"173 dequantize_per_tensor_77" [id=173, type="dequantize_per_tensor"]; -"174 conv2d_15" [id=174, type=conv2d]; -"175 relu_15" [id=175, type=relu]; -"176 quantize_per_tensor_78" [id=176, type="quantize_per_tensor"]; -"177 dequantize_per_tensor_79" [id=177, type="dequantize_per_tensor"]; -"178 conv_transpose2d_3" [id=178, type="conv_transpose2d"]; -"179 quantize_per_tensor_80" [id=179, type="quantize_per_tensor"]; -"180 dequantize_per_tensor_81" [id=180, type="dequantize_per_tensor"]; -"181 slice_13" [id=181, type=slice]; -"182 slice_14" [id=182, type=slice]; -"183 slice_15" [id=183, type=slice]; -"184 slice_16" [id=184, type=slice]; -"185 quantize_per_tensor_82" [id=185, type="quantize_per_tensor"]; -"186 dequantize_per_tensor_83" [id=186, type="dequantize_per_tensor"]; -"187 cat_3" [id=187, type=cat]; -"188 quantize_per_tensor_84" [id=188, type="quantize_per_tensor"]; -"189 dequantize_per_tensor_85" [id=189, type="dequantize_per_tensor"]; -"190 _frozen_param16" [id=190, type="get_attr"]; -"191 dequantize_per_tensor_86" [id=191, type="dequantize_per_tensor"]; -"192 conv2d_16" [id=192, type=conv2d]; -"193 relu_16" [id=193, type=relu]; -"194 quantize_per_tensor_87" [id=194, type="quantize_per_tensor"]; -"195 dequantize_per_tensor_88" [id=195, type="dequantize_per_tensor"]; -"196 _frozen_param17" [id=196, type="get_attr"]; -"197 dequantize_per_tensor_89" [id=197, type="dequantize_per_tensor"]; -"198 conv2d_17" [id=198, type=conv2d]; -"199 relu_17" [id=199, type=relu]; -"200 
quantize_per_tensor_90" [id=200, type="quantize_per_tensor"]; -"201 dequantize_per_tensor_91" [id=201, type="dequantize_per_tensor"]; -"202 _frozen_param18" [id=202, type="get_attr"]; -"203 dequantize_per_tensor_92" [id=203, type="dequantize_per_tensor"]; -"204 conv2d_18" [id=204, type=conv2d]; -"205 quantize_per_tensor_93" [id=205, type="quantize_per_tensor"]; -"206 dequantize_per_tensor_94" [id=206, type="dequantize_per_tensor"]; -"207 output" [id=207, type=output]; -"0 down_path_0_block_0_bias" -> "32 conv2d" [style=solid, label="(64,)"]; -"1 down_path_0_block_3_bias" -> "38 conv2d_1" [style=solid, label="(64,)"]; -"2 down_path_1_block_0_bias" -> "48 conv2d_2" [style=solid, label="(128,)"]; -"3 down_path_1_block_3_bias" -> "54 conv2d_3" [style=solid, label="(128,)"]; -"4 down_path_2_block_0_bias" -> "64 conv2d_4" [style=solid, label="(256,)"]; -"5 down_path_2_block_3_bias" -> "70 conv2d_5" [style=solid, label="(256,)"]; -"6 down_path_3_block_0_bias" -> "80 conv2d_6" [style=solid, label="(512,)"]; -"7 down_path_3_block_3_bias" -> "86 conv2d_7" [style=solid, label="(512,)"]; -"8 down_path_4_block_0_bias" -> "96 conv2d_8" [style=solid, label="(1024,)"]; -"9 down_path_4_block_3_bias" -> "102 conv2d_9" [style=solid, label="(1024,)"]; -"10 up_path_0_up_weight" -> "106 conv_transpose2d" [style=solid, label="(1024, 512, 2, 2)"]; -"11 up_path_0_up_bias" -> "106 conv_transpose2d" [style=solid, label="(512,)"]; -"12 up_path_0_conv_block_block_0_bias" -> "120 conv2d_10" [style=solid, label="(512,)"]; -"13 up_path_0_conv_block_block_3_bias" -> "126 conv2d_11" [style=solid, label="(512,)"]; -"14 up_path_1_up_weight" -> "130 conv_transpose2d_1" [style=solid, label="(512, 256, 2, 2)"]; -"15 up_path_1_up_bias" -> "130 conv_transpose2d_1" [style=solid, label="(256,)"]; -"16 up_path_1_conv_block_block_0_bias" -> "144 conv2d_12" [style=solid, label="(256,)"]; -"17 up_path_1_conv_block_block_3_bias" -> "150 conv2d_13" [style=solid, label="(256,)"]; -"18 up_path_2_up_weight" -> "154 
conv_transpose2d_2" [style=solid, label="(256, 128, 2, 2)"]; -"19 up_path_2_up_bias" -> "154 conv_transpose2d_2" [style=solid, label="(128,)"]; -"20 up_path_2_conv_block_block_0_bias" -> "168 conv2d_14" [style=solid, label="(128,)"]; -"21 up_path_2_conv_block_block_3_bias" -> "174 conv2d_15" [style=solid, label="(128,)"]; -"22 up_path_3_up_weight" -> "178 conv_transpose2d_3" [style=solid, label="(128, 64, 2, 2)"]; -"23 up_path_3_up_bias" -> "178 conv_transpose2d_3" [style=solid, label="(64,)"]; -"24 up_path_3_conv_block_block_0_bias" -> "192 conv2d_16" [style=solid, label="(64,)"]; -"25 up_path_3_conv_block_block_3_bias" -> "198 conv2d_17" [style=solid, label="(64,)"]; -"26 last_bias" -> "204 conv2d_18" [style=solid, label="(12,)"]; -"27 x" -> "28 quantize_per_tensor_0" [style=solid, label="(1, 3, 224, 224)"]; -"28 quantize_per_tensor_0" -> "29 dequantize_per_tensor_1" [style=solid, label="(1, 3, 224, 224)"]; -"29 dequantize_per_tensor_1" -> "32 conv2d" [style=solid, label="(1, 3, 224, 224)"]; -"30 _frozen_param0" -> "31 dequantize_per_tensor_2" [style=solid, label="(64, 3, 3, 3)"]; -"31 dequantize_per_tensor_2" -> "32 conv2d" [style=solid, label="(64, 3, 3, 3)"]; -"32 conv2d" -> "33 relu" [style=solid, label="(1, 64, 222, 222)"]; -"33 relu" -> "34 quantize_per_tensor_3" [style=solid, label="(1, 64, 222, 222)"]; -"34 quantize_per_tensor_3" -> "35 dequantize_per_tensor_4" [style=solid, label="(1, 64, 222, 222)"]; -"35 dequantize_per_tensor_4" -> "38 conv2d_1" [style=solid, label="(1, 64, 222, 222)"]; -"36 _frozen_param1" -> "37 dequantize_per_tensor_5" [style=solid, label="(64, 64, 3, 3)"]; -"37 dequantize_per_tensor_5" -> "38 conv2d_1" [style=solid, label="(64, 64, 3, 3)"]; -"38 conv2d_1" -> "39 relu_1" [style=solid, label="(1, 64, 220, 220)"]; -"39 relu_1" -> "40 quantize_per_tensor_6" [style=solid, label="(1, 64, 220, 220)"]; -"40 quantize_per_tensor_6" -> "41 dequantize_per_tensor_7" [style=solid, label="(1, 64, 220, 220)"]; -"40 quantize_per_tensor_6" -> "42 
dequantize_per_tensor_8" [style=solid, label="(1, 64, 220, 220)"]; -"41 dequantize_per_tensor_7" -> "181 slice_13" [style=solid, label="(1, 64, 220, 220)"]; -"42 dequantize_per_tensor_8" -> "43 max_pool2d" [style=solid, label="(1, 64, 220, 220)"]; -"43 max_pool2d" -> "44 quantize_per_tensor_9" [style=solid, label="(1, 64, 110, 110)"]; -"44 quantize_per_tensor_9" -> "45 dequantize_per_tensor_10" [style=solid, label="(1, 64, 110, 110)"]; -"45 dequantize_per_tensor_10" -> "48 conv2d_2" [style=solid, label="(1, 64, 110, 110)"]; -"46 _frozen_param2" -> "47 dequantize_per_tensor_11" [style=solid, label="(128, 64, 3, 3)"]; -"47 dequantize_per_tensor_11" -> "48 conv2d_2" [style=solid, label="(128, 64, 3, 3)"]; -"48 conv2d_2" -> "49 relu_2" [style=solid, label="(1, 128, 108, 108)"]; -"49 relu_2" -> "50 quantize_per_tensor_12" [style=solid, label="(1, 128, 108, 108)"]; -"50 quantize_per_tensor_12" -> "51 dequantize_per_tensor_13" [style=solid, label="(1, 128, 108, 108)"]; -"51 dequantize_per_tensor_13" -> "54 conv2d_3" [style=solid, label="(1, 128, 108, 108)"]; -"52 _frozen_param3" -> "53 dequantize_per_tensor_14" [style=solid, label="(128, 128, 3, 3)"]; -"53 dequantize_per_tensor_14" -> "54 conv2d_3" [style=solid, label="(128, 128, 3, 3)"]; -"54 conv2d_3" -> "55 relu_3" [style=solid, label="(1, 128, 106, 106)"]; -"55 relu_3" -> "56 quantize_per_tensor_15" [style=solid, label="(1, 128, 106, 106)"]; -"56 quantize_per_tensor_15" -> "57 dequantize_per_tensor_16" [style=solid, label="(1, 128, 106, 106)"]; -"56 quantize_per_tensor_15" -> "58 dequantize_per_tensor_17" [style=solid, label="(1, 128, 106, 106)"]; -"57 dequantize_per_tensor_16" -> "157 slice_9" [style=solid, label="(1, 128, 106, 106)"]; -"58 dequantize_per_tensor_17" -> "59 max_pool2d_1" [style=solid, label="(1, 128, 106, 106)"]; -"59 max_pool2d_1" -> "60 quantize_per_tensor_18" [style=solid, label="(1, 128, 53, 53)"]; -"60 quantize_per_tensor_18" -> "61 dequantize_per_tensor_19" [style=solid, label="(1, 128, 53, 
53)"]; -"61 dequantize_per_tensor_19" -> "64 conv2d_4" [style=solid, label="(1, 128, 53, 53)"]; -"62 _frozen_param4" -> "63 dequantize_per_tensor_20" [style=solid, label="(256, 128, 3, 3)"]; -"63 dequantize_per_tensor_20" -> "64 conv2d_4" [style=solid, label="(256, 128, 3, 3)"]; -"64 conv2d_4" -> "65 relu_4" [style=solid, label="(1, 256, 51, 51)"]; -"65 relu_4" -> "66 quantize_per_tensor_21" [style=solid, label="(1, 256, 51, 51)"]; -"66 quantize_per_tensor_21" -> "67 dequantize_per_tensor_22" [style=solid, label="(1, 256, 51, 51)"]; -"67 dequantize_per_tensor_22" -> "70 conv2d_5" [style=solid, label="(1, 256, 51, 51)"]; -"68 _frozen_param5" -> "69 dequantize_per_tensor_23" [style=solid, label="(256, 256, 3, 3)"]; -"69 dequantize_per_tensor_23" -> "70 conv2d_5" [style=solid, label="(256, 256, 3, 3)"]; -"70 conv2d_5" -> "71 relu_5" [style=solid, label="(1, 256, 49, 49)"]; -"71 relu_5" -> "72 quantize_per_tensor_24" [style=solid, label="(1, 256, 49, 49)"]; -"72 quantize_per_tensor_24" -> "73 dequantize_per_tensor_25" [style=solid, label="(1, 256, 49, 49)"]; -"72 quantize_per_tensor_24" -> "74 dequantize_per_tensor_26" [style=solid, label="(1, 256, 49, 49)"]; -"73 dequantize_per_tensor_25" -> "133 slice_5" [style=solid, label="(1, 256, 49, 49)"]; -"74 dequantize_per_tensor_26" -> "75 max_pool2d_2" [style=solid, label="(1, 256, 49, 49)"]; -"75 max_pool2d_2" -> "76 quantize_per_tensor_27" [style=solid, label="(1, 256, 24, 24)"]; -"76 quantize_per_tensor_27" -> "77 dequantize_per_tensor_28" [style=solid, label="(1, 256, 24, 24)"]; -"77 dequantize_per_tensor_28" -> "80 conv2d_6" [style=solid, label="(1, 256, 24, 24)"]; -"78 _frozen_param6" -> "79 dequantize_per_tensor_29" [style=solid, label="(512, 256, 3, 3)"]; -"79 dequantize_per_tensor_29" -> "80 conv2d_6" [style=solid, label="(512, 256, 3, 3)"]; -"80 conv2d_6" -> "81 relu_6" [style=solid, label="(1, 512, 22, 22)"]; -"81 relu_6" -> "82 quantize_per_tensor_30" [style=solid, label="(1, 512, 22, 22)"]; -"82 
quantize_per_tensor_30" -> "83 dequantize_per_tensor_31" [style=solid, label="(1, 512, 22, 22)"]; -"83 dequantize_per_tensor_31" -> "86 conv2d_7" [style=solid, label="(1, 512, 22, 22)"]; -"84 _frozen_param7" -> "85 dequantize_per_tensor_32" [style=solid, label="(512, 512, 3, 3)"]; -"85 dequantize_per_tensor_32" -> "86 conv2d_7" [style=solid, label="(512, 512, 3, 3)"]; -"86 conv2d_7" -> "87 relu_7" [style=solid, label="(1, 512, 20, 20)"]; -"87 relu_7" -> "88 quantize_per_tensor_33" [style=solid, label="(1, 512, 20, 20)"]; -"88 quantize_per_tensor_33" -> "89 dequantize_per_tensor_34" [style=solid, label="(1, 512, 20, 20)"]; -"88 quantize_per_tensor_33" -> "90 dequantize_per_tensor_35" [style=solid, label="(1, 512, 20, 20)"]; -"89 dequantize_per_tensor_34" -> "109 slice_1" [style=solid, label="(1, 512, 20, 20)"]; -"90 dequantize_per_tensor_35" -> "91 max_pool2d_3" [style=solid, label="(1, 512, 20, 20)"]; -"91 max_pool2d_3" -> "92 quantize_per_tensor_36" [style=solid, label="(1, 512, 10, 10)"]; -"92 quantize_per_tensor_36" -> "93 dequantize_per_tensor_37" [style=solid, label="(1, 512, 10, 10)"]; -"93 dequantize_per_tensor_37" -> "96 conv2d_8" [style=solid, label="(1, 512, 10, 10)"]; -"94 _frozen_param8" -> "95 dequantize_per_tensor_38" [style=solid, label="(1024, 512, 3, 3)"]; -"95 dequantize_per_tensor_38" -> "96 conv2d_8" [style=solid, label="(1024, 512, 3, 3)"]; -"96 conv2d_8" -> "97 relu_8" [style=solid, label="(1, 1024, 8, 8)"]; -"97 relu_8" -> "98 quantize_per_tensor_39" [style=solid, label="(1, 1024, 8, 8)"]; -"98 quantize_per_tensor_39" -> "99 dequantize_per_tensor_40" [style=solid, label="(1, 1024, 8, 8)"]; -"99 dequantize_per_tensor_40" -> "102 conv2d_9" [style=solid, label="(1, 1024, 8, 8)"]; -"100 _frozen_param9" -> "101 dequantize_per_tensor_41" [style=solid, label="(1024, 1024, 3, 3)"]; -"101 dequantize_per_tensor_41" -> "102 conv2d_9" [style=solid, label="(1024, 1024, 3, 3)"]; -"102 conv2d_9" -> "103 relu_9" [style=solid, label="(1, 1024, 6, 6)"]; -"103 
relu_9" -> "104 quantize_per_tensor_42" [style=solid, label="(1, 1024, 6, 6)"]; -"104 quantize_per_tensor_42" -> "105 dequantize_per_tensor_43" [style=solid, label="(1, 1024, 6, 6)"]; -"105 dequantize_per_tensor_43" -> "106 conv_transpose2d" [style=solid, label="(1, 1024, 6, 6)"]; -"106 conv_transpose2d" -> "107 quantize_per_tensor_44" [style=solid, label="(1, 512, 12, 12)"]; -"107 quantize_per_tensor_44" -> "108 dequantize_per_tensor_45" [style=solid, label="(1, 512, 12, 12)"]; -"108 dequantize_per_tensor_45" -> "115 cat" [style=solid, label="(1, 512, 12, 12)"]; -"109 slice_1" -> "110 slice_2" [style=solid, label="(1, 512, 20, 20)"]; -"110 slice_2" -> "111 slice_3" [style=solid, label="(1, 512, 20, 20)"]; -"111 slice_3" -> "112 slice_4" [style=solid, label="(1, 512, 12, 20)"]; -"112 slice_4" -> "113 quantize_per_tensor_46" [style=solid, label="(1, 512, 12, 12)"]; -"113 quantize_per_tensor_46" -> "114 dequantize_per_tensor_47" [style=solid, label="(1, 512, 12, 12)"]; -"114 dequantize_per_tensor_47" -> "115 cat" [style=solid, label="(1, 512, 12, 12)"]; -"115 cat" -> "116 quantize_per_tensor_48" [style=solid, label="(1, 1024, 12, 12)"]; -"116 quantize_per_tensor_48" -> "117 dequantize_per_tensor_49" [style=solid, label="(1, 1024, 12, 12)"]; -"117 dequantize_per_tensor_49" -> "120 conv2d_10" [style=solid, label="(1, 1024, 12, 12)"]; -"118 _frozen_param10" -> "119 dequantize_per_tensor_50" [style=solid, label="(512, 1024, 3, 3)"]; -"119 dequantize_per_tensor_50" -> "120 conv2d_10" [style=solid, label="(512, 1024, 3, 3)"]; -"120 conv2d_10" -> "121 relu_10" [style=solid, label="(1, 512, 10, 10)"]; -"121 relu_10" -> "122 quantize_per_tensor_51" [style=solid, label="(1, 512, 10, 10)"]; -"122 quantize_per_tensor_51" -> "123 dequantize_per_tensor_52" [style=solid, label="(1, 512, 10, 10)"]; -"123 dequantize_per_tensor_52" -> "126 conv2d_11" [style=solid, label="(1, 512, 10, 10)"]; -"124 _frozen_param11" -> "125 dequantize_per_tensor_53" [style=solid, label="(512, 512, 3, 
3)"]; -"125 dequantize_per_tensor_53" -> "126 conv2d_11" [style=solid, label="(512, 512, 3, 3)"]; -"126 conv2d_11" -> "127 relu_11" [style=solid, label="(1, 512, 8, 8)"]; -"127 relu_11" -> "128 quantize_per_tensor_54" [style=solid, label="(1, 512, 8, 8)"]; -"128 quantize_per_tensor_54" -> "129 dequantize_per_tensor_55" [style=solid, label="(1, 512, 8, 8)"]; -"129 dequantize_per_tensor_55" -> "130 conv_transpose2d_1" [style=solid, label="(1, 512, 8, 8)"]; -"130 conv_transpose2d_1" -> "131 quantize_per_tensor_56" [style=solid, label="(1, 256, 16, 16)"]; -"131 quantize_per_tensor_56" -> "132 dequantize_per_tensor_57" [style=solid, label="(1, 256, 16, 16)"]; -"132 dequantize_per_tensor_57" -> "139 cat_1" [style=solid, label="(1, 256, 16, 16)"]; -"133 slice_5" -> "134 slice_6" [style=solid, label="(1, 256, 49, 49)"]; -"134 slice_6" -> "135 slice_7" [style=solid, label="(1, 256, 49, 49)"]; -"135 slice_7" -> "136 slice_8" [style=solid, label="(1, 256, 16, 49)"]; -"136 slice_8" -> "137 quantize_per_tensor_58" [style=solid, label="(1, 256, 16, 16)"]; -"137 quantize_per_tensor_58" -> "138 dequantize_per_tensor_59" [style=solid, label="(1, 256, 16, 16)"]; -"138 dequantize_per_tensor_59" -> "139 cat_1" [style=solid, label="(1, 256, 16, 16)"]; -"139 cat_1" -> "140 quantize_per_tensor_60" [style=solid, label="(1, 512, 16, 16)"]; -"140 quantize_per_tensor_60" -> "141 dequantize_per_tensor_61" [style=solid, label="(1, 512, 16, 16)"]; -"141 dequantize_per_tensor_61" -> "144 conv2d_12" [style=solid, label="(1, 512, 16, 16)"]; -"142 _frozen_param12" -> "143 dequantize_per_tensor_62" [style=solid, label="(256, 512, 3, 3)"]; -"143 dequantize_per_tensor_62" -> "144 conv2d_12" [style=solid, label="(256, 512, 3, 3)"]; -"144 conv2d_12" -> "145 relu_12" [style=solid, label="(1, 256, 14, 14)"]; -"145 relu_12" -> "146 quantize_per_tensor_63" [style=solid, label="(1, 256, 14, 14)"]; -"146 quantize_per_tensor_63" -> "147 dequantize_per_tensor_64" [style=solid, label="(1, 256, 14, 14)"]; -"147 
dequantize_per_tensor_64" -> "150 conv2d_13" [style=solid, label="(1, 256, 14, 14)"]; -"148 _frozen_param13" -> "149 dequantize_per_tensor_65" [style=solid, label="(256, 256, 3, 3)"]; -"149 dequantize_per_tensor_65" -> "150 conv2d_13" [style=solid, label="(256, 256, 3, 3)"]; -"150 conv2d_13" -> "151 relu_13" [style=solid, label="(1, 256, 12, 12)"]; -"151 relu_13" -> "152 quantize_per_tensor_66" [style=solid, label="(1, 256, 12, 12)"]; -"152 quantize_per_tensor_66" -> "153 dequantize_per_tensor_67" [style=solid, label="(1, 256, 12, 12)"]; -"153 dequantize_per_tensor_67" -> "154 conv_transpose2d_2" [style=solid, label="(1, 256, 12, 12)"]; -"154 conv_transpose2d_2" -> "155 quantize_per_tensor_68" [style=solid, label="(1, 128, 24, 24)"]; -"155 quantize_per_tensor_68" -> "156 dequantize_per_tensor_69" [style=solid, label="(1, 128, 24, 24)"]; -"156 dequantize_per_tensor_69" -> "163 cat_2" [style=solid, label="(1, 128, 24, 24)"]; -"157 slice_9" -> "158 slice_10" [style=solid, label="(1, 128, 106, 106)"]; -"158 slice_10" -> "159 slice_11" [style=solid, label="(1, 128, 106, 106)"]; -"159 slice_11" -> "160 slice_12" [style=solid, label="(1, 128, 24, 106)"]; -"160 slice_12" -> "161 quantize_per_tensor_70" [style=solid, label="(1, 128, 24, 24)"]; -"161 quantize_per_tensor_70" -> "162 dequantize_per_tensor_71" [style=solid, label="(1, 128, 24, 24)"]; -"162 dequantize_per_tensor_71" -> "163 cat_2" [style=solid, label="(1, 128, 24, 24)"]; -"163 cat_2" -> "164 quantize_per_tensor_72" [style=solid, label="(1, 256, 24, 24)"]; -"164 quantize_per_tensor_72" -> "165 dequantize_per_tensor_73" [style=solid, label="(1, 256, 24, 24)"]; -"165 dequantize_per_tensor_73" -> "168 conv2d_14" [style=solid, label="(1, 256, 24, 24)"]; -"166 _frozen_param14" -> "167 dequantize_per_tensor_74" [style=solid, label="(128, 256, 3, 3)"]; -"167 dequantize_per_tensor_74" -> "168 conv2d_14" [style=solid, label="(128, 256, 3, 3)"]; -"168 conv2d_14" -> "169 relu_14" [style=solid, label="(1, 128, 22, 22)"]; 
-"169 relu_14" -> "170 quantize_per_tensor_75" [style=solid, label="(1, 128, 22, 22)"]; -"170 quantize_per_tensor_75" -> "171 dequantize_per_tensor_76" [style=solid, label="(1, 128, 22, 22)"]; -"171 dequantize_per_tensor_76" -> "174 conv2d_15" [style=solid, label="(1, 128, 22, 22)"]; -"172 _frozen_param15" -> "173 dequantize_per_tensor_77" [style=solid, label="(128, 128, 3, 3)"]; -"173 dequantize_per_tensor_77" -> "174 conv2d_15" [style=solid, label="(128, 128, 3, 3)"]; -"174 conv2d_15" -> "175 relu_15" [style=solid, label="(1, 128, 20, 20)"]; -"175 relu_15" -> "176 quantize_per_tensor_78" [style=solid, label="(1, 128, 20, 20)"]; -"176 quantize_per_tensor_78" -> "177 dequantize_per_tensor_79" [style=solid, label="(1, 128, 20, 20)"]; -"177 dequantize_per_tensor_79" -> "178 conv_transpose2d_3" [style=solid, label="(1, 128, 20, 20)"]; -"178 conv_transpose2d_3" -> "179 quantize_per_tensor_80" [style=solid, label="(1, 64, 40, 40)"]; -"179 quantize_per_tensor_80" -> "180 dequantize_per_tensor_81" [style=solid, label="(1, 64, 40, 40)"]; -"180 dequantize_per_tensor_81" -> "187 cat_3" [style=solid, label="(1, 64, 40, 40)"]; -"181 slice_13" -> "182 slice_14" [style=solid, label="(1, 64, 220, 220)"]; -"182 slice_14" -> "183 slice_15" [style=solid, label="(1, 64, 220, 220)"]; -"183 slice_15" -> "184 slice_16" [style=solid, label="(1, 64, 40, 220)"]; -"184 slice_16" -> "185 quantize_per_tensor_82" [style=solid, label="(1, 64, 40, 40)"]; -"185 quantize_per_tensor_82" -> "186 dequantize_per_tensor_83" [style=solid, label="(1, 64, 40, 40)"]; -"186 dequantize_per_tensor_83" -> "187 cat_3" [style=solid, label="(1, 64, 40, 40)"]; -"187 cat_3" -> "188 quantize_per_tensor_84" [style=solid, label="(1, 128, 40, 40)"]; -"188 quantize_per_tensor_84" -> "189 dequantize_per_tensor_85" [style=solid, label="(1, 128, 40, 40)"]; -"189 dequantize_per_tensor_85" -> "192 conv2d_16" [style=solid, label="(1, 128, 40, 40)"]; -"190 _frozen_param16" -> "191 dequantize_per_tensor_86" [style=solid, 
label="(64, 128, 3, 3)"]; -"191 dequantize_per_tensor_86" -> "192 conv2d_16" [style=solid, label="(64, 128, 3, 3)"]; -"192 conv2d_16" -> "193 relu_16" [style=solid, label="(1, 64, 38, 38)"]; -"193 relu_16" -> "194 quantize_per_tensor_87" [style=solid, label="(1, 64, 38, 38)"]; -"194 quantize_per_tensor_87" -> "195 dequantize_per_tensor_88" [style=solid, label="(1, 64, 38, 38)"]; -"195 dequantize_per_tensor_88" -> "198 conv2d_17" [style=solid, label="(1, 64, 38, 38)"]; -"196 _frozen_param17" -> "197 dequantize_per_tensor_89" [style=solid, label="(64, 64, 3, 3)"]; -"197 dequantize_per_tensor_89" -> "198 conv2d_17" [style=solid, label="(64, 64, 3, 3)"]; -"198 conv2d_17" -> "199 relu_17" [style=solid, label="(1, 64, 36, 36)"]; -"199 relu_17" -> "200 quantize_per_tensor_90" [style=solid, label="(1, 64, 36, 36)"]; -"200 quantize_per_tensor_90" -> "201 dequantize_per_tensor_91" [style=solid, label="(1, 64, 36, 36)"]; -"201 dequantize_per_tensor_91" -> "204 conv2d_18" [style=solid, label="(1, 64, 36, 36)"]; -"202 _frozen_param18" -> "203 dequantize_per_tensor_92" [style=solid, label="(12, 64, 1, 1)"]; -"203 dequantize_per_tensor_92" -> "204 conv2d_18" [style=solid, label="(12, 64, 1, 1)"]; -"204 conv2d_18" -> "205 quantize_per_tensor_93" [style=solid, label="(1, 12, 36, 36)"]; -"205 quantize_per_tensor_93" -> "206 dequantize_per_tensor_94" [style=solid, label="(1, 12, 36, 36)"]; -"206 dequantize_per_tensor_94" -> "207 output" [style=solid, label="(1, 12, 36, 36)"]; -} diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/unet_ref_qconfig.json b/tests/torch2/data/fx/XNNPACKQuantizer/unet_ref_qconfig.json deleted file mode 100644 index b9c9e41e3af..00000000000 --- a/tests/torch2/data/fx/XNNPACKQuantizer/unet_ref_qconfig.json +++ /dev/null @@ -1,451 +0,0 @@ -{ - "quantization_points": { - "('conv2d',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": 
"INT8" - }, - "('conv2d',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_1',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('max_pool2d', 'slice_13')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_2',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_3',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('max_pool2d_1', 'slice_9')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_4',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_5',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('max_pool2d_2', 'slice_5')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_6',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_7',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('max_pool2d_3', 'slice_1')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('conv2d_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_8',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_9',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv_transpose2d',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('cat',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_10',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_11',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - 
"per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv_transpose2d_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('cat_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_12',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_12',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_13',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_13',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv_transpose2d_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('cat_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_14',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('conv2d_14',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_15',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_15',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv_transpose2d_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_16',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('cat_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_16',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_17',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_17',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('conv2d_18',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - 
"per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d_18',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('output',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - } - }, - "unified_scale_groups": { - "0": [ - 4, - 5 - ], - "1": [ - 9, - 10 - ], - "2": [ - 14, - 15 - ], - "3": [ - 19, - 20 - ], - "4": [ - 25, - 26, - 27 - ], - "5": [ - 32, - 33, - 34 - ], - "6": [ - 39, - 40, - 41 - ], - "7": [ - 46, - 47, - 48 - ] - }, - "shared_input_operation_set_groups": {} -} \ No newline at end of file diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/vit_b_16.dot b/tests/torch2/data/fx/XNNPACKQuantizer/vit_b_16.dot deleted file mode 100644 index 9afd165b7e7..00000000000 --- a/tests/torch2/data/fx/XNNPACKQuantizer/vit_b_16.dot +++ /dev/null @@ -1,2121 +0,0 @@ -strict digraph { -"0 _frozen_param0" [id=0, type="get_attr"]; -"1 dequantize_per_tensor_0" [id=1, type="dequantize_per_tensor"]; -"2 conv_proj_bias" [id=2, type="get_attr"]; -"3 encoder_layers_encoder_layer_0_ln_1_weight" [id=3, type="get_attr"]; -"4 encoder_layers_encoder_layer_0_ln_1_bias" [id=4, type="get_attr"]; -"5 encoder_layers_encoder_layer_0_self_attention_in_proj_bias" [id=5, type="get_attr"]; -"6 encoder_layers_encoder_layer_0_self_attention_out_proj_bias" [id=6, type="get_attr"]; -"7 encoder_layers_encoder_layer_0_ln_2_weight" [id=7, type="get_attr"]; -"8 encoder_layers_encoder_layer_0_ln_2_bias" [id=8, type="get_attr"]; -"9 encoder_layers_encoder_layer_0_mlp_0_bias" [id=9, type="get_attr"]; -"10 encoder_layers_encoder_layer_0_mlp_3_bias" [id=10, type="get_attr"]; -"11 encoder_layers_encoder_layer_1_ln_1_weight" [id=11, type="get_attr"]; -"12 encoder_layers_encoder_layer_1_ln_1_bias" [id=12, 
type="get_attr"]; -"13 encoder_layers_encoder_layer_1_self_attention_in_proj_bias" [id=13, type="get_attr"]; -"14 encoder_layers_encoder_layer_1_self_attention_out_proj_bias" [id=14, type="get_attr"]; -"15 encoder_layers_encoder_layer_1_ln_2_weight" [id=15, type="get_attr"]; -"16 encoder_layers_encoder_layer_1_ln_2_bias" [id=16, type="get_attr"]; -"17 encoder_layers_encoder_layer_1_mlp_0_bias" [id=17, type="get_attr"]; -"18 encoder_layers_encoder_layer_1_mlp_3_bias" [id=18, type="get_attr"]; -"19 encoder_layers_encoder_layer_2_ln_1_weight" [id=19, type="get_attr"]; -"20 encoder_layers_encoder_layer_2_ln_1_bias" [id=20, type="get_attr"]; -"21 encoder_layers_encoder_layer_2_self_attention_in_proj_bias" [id=21, type="get_attr"]; -"22 encoder_layers_encoder_layer_2_self_attention_out_proj_bias" [id=22, type="get_attr"]; -"23 encoder_layers_encoder_layer_2_ln_2_weight" [id=23, type="get_attr"]; -"24 encoder_layers_encoder_layer_2_ln_2_bias" [id=24, type="get_attr"]; -"25 encoder_layers_encoder_layer_2_mlp_0_bias" [id=25, type="get_attr"]; -"26 encoder_layers_encoder_layer_2_mlp_3_bias" [id=26, type="get_attr"]; -"27 encoder_layers_encoder_layer_3_ln_1_weight" [id=27, type="get_attr"]; -"28 encoder_layers_encoder_layer_3_ln_1_bias" [id=28, type="get_attr"]; -"29 encoder_layers_encoder_layer_3_self_attention_in_proj_bias" [id=29, type="get_attr"]; -"30 encoder_layers_encoder_layer_3_self_attention_out_proj_bias" [id=30, type="get_attr"]; -"31 encoder_layers_encoder_layer_3_ln_2_weight" [id=31, type="get_attr"]; -"32 encoder_layers_encoder_layer_3_ln_2_bias" [id=32, type="get_attr"]; -"33 encoder_layers_encoder_layer_3_mlp_0_bias" [id=33, type="get_attr"]; -"34 encoder_layers_encoder_layer_3_mlp_3_bias" [id=34, type="get_attr"]; -"35 encoder_layers_encoder_layer_4_ln_1_weight" [id=35, type="get_attr"]; -"36 encoder_layers_encoder_layer_4_ln_1_bias" [id=36, type="get_attr"]; -"37 encoder_layers_encoder_layer_4_self_attention_in_proj_bias" [id=37, type="get_attr"]; -"38 
encoder_layers_encoder_layer_4_self_attention_out_proj_bias" [id=38, type="get_attr"]; -"39 encoder_layers_encoder_layer_4_ln_2_weight" [id=39, type="get_attr"]; -"40 encoder_layers_encoder_layer_4_ln_2_bias" [id=40, type="get_attr"]; -"41 encoder_layers_encoder_layer_4_mlp_0_bias" [id=41, type="get_attr"]; -"42 encoder_layers_encoder_layer_4_mlp_3_bias" [id=42, type="get_attr"]; -"43 encoder_layers_encoder_layer_5_ln_1_weight" [id=43, type="get_attr"]; -"44 encoder_layers_encoder_layer_5_ln_1_bias" [id=44, type="get_attr"]; -"45 encoder_layers_encoder_layer_5_self_attention_in_proj_bias" [id=45, type="get_attr"]; -"46 encoder_layers_encoder_layer_5_self_attention_out_proj_bias" [id=46, type="get_attr"]; -"47 encoder_layers_encoder_layer_5_ln_2_weight" [id=47, type="get_attr"]; -"48 encoder_layers_encoder_layer_5_ln_2_bias" [id=48, type="get_attr"]; -"49 encoder_layers_encoder_layer_5_mlp_0_bias" [id=49, type="get_attr"]; -"50 encoder_layers_encoder_layer_5_mlp_3_bias" [id=50, type="get_attr"]; -"51 encoder_layers_encoder_layer_6_ln_1_weight" [id=51, type="get_attr"]; -"52 encoder_layers_encoder_layer_6_ln_1_bias" [id=52, type="get_attr"]; -"53 encoder_layers_encoder_layer_6_self_attention_in_proj_bias" [id=53, type="get_attr"]; -"54 encoder_layers_encoder_layer_6_self_attention_out_proj_bias" [id=54, type="get_attr"]; -"55 encoder_layers_encoder_layer_6_ln_2_weight" [id=55, type="get_attr"]; -"56 encoder_layers_encoder_layer_6_ln_2_bias" [id=56, type="get_attr"]; -"57 encoder_layers_encoder_layer_6_mlp_0_bias" [id=57, type="get_attr"]; -"58 encoder_layers_encoder_layer_6_mlp_3_bias" [id=58, type="get_attr"]; -"59 encoder_layers_encoder_layer_7_ln_1_weight" [id=59, type="get_attr"]; -"60 encoder_layers_encoder_layer_7_ln_1_bias" [id=60, type="get_attr"]; -"61 encoder_layers_encoder_layer_7_self_attention_in_proj_bias" [id=61, type="get_attr"]; -"62 encoder_layers_encoder_layer_7_self_attention_out_proj_bias" [id=62, type="get_attr"]; -"63 
encoder_layers_encoder_layer_7_ln_2_weight" [id=63, type="get_attr"]; -"64 encoder_layers_encoder_layer_7_ln_2_bias" [id=64, type="get_attr"]; -"65 encoder_layers_encoder_layer_7_mlp_0_bias" [id=65, type="get_attr"]; -"66 encoder_layers_encoder_layer_7_mlp_3_bias" [id=66, type="get_attr"]; -"67 encoder_layers_encoder_layer_8_ln_1_weight" [id=67, type="get_attr"]; -"68 encoder_layers_encoder_layer_8_ln_1_bias" [id=68, type="get_attr"]; -"69 encoder_layers_encoder_layer_8_self_attention_in_proj_bias" [id=69, type="get_attr"]; -"70 encoder_layers_encoder_layer_8_self_attention_out_proj_bias" [id=70, type="get_attr"]; -"71 encoder_layers_encoder_layer_8_ln_2_weight" [id=71, type="get_attr"]; -"72 encoder_layers_encoder_layer_8_ln_2_bias" [id=72, type="get_attr"]; -"73 encoder_layers_encoder_layer_8_mlp_0_bias" [id=73, type="get_attr"]; -"74 encoder_layers_encoder_layer_8_mlp_3_bias" [id=74, type="get_attr"]; -"75 encoder_layers_encoder_layer_9_ln_1_weight" [id=75, type="get_attr"]; -"76 encoder_layers_encoder_layer_9_ln_1_bias" [id=76, type="get_attr"]; -"77 encoder_layers_encoder_layer_9_self_attention_in_proj_bias" [id=77, type="get_attr"]; -"78 encoder_layers_encoder_layer_9_self_attention_out_proj_bias" [id=78, type="get_attr"]; -"79 encoder_layers_encoder_layer_9_ln_2_weight" [id=79, type="get_attr"]; -"80 encoder_layers_encoder_layer_9_ln_2_bias" [id=80, type="get_attr"]; -"81 encoder_layers_encoder_layer_9_mlp_0_bias" [id=81, type="get_attr"]; -"82 encoder_layers_encoder_layer_9_mlp_3_bias" [id=82, type="get_attr"]; -"83 encoder_layers_encoder_layer_10_ln_1_weight" [id=83, type="get_attr"]; -"84 encoder_layers_encoder_layer_10_ln_1_bias" [id=84, type="get_attr"]; -"85 encoder_layers_encoder_layer_10_self_attention_in_proj_bias" [id=85, type="get_attr"]; -"86 encoder_layers_encoder_layer_10_self_attention_out_proj_bias" [id=86, type="get_attr"]; -"87 encoder_layers_encoder_layer_10_ln_2_weight" [id=87, type="get_attr"]; -"88 
encoder_layers_encoder_layer_10_ln_2_bias" [id=88, type="get_attr"]; -"89 encoder_layers_encoder_layer_10_mlp_0_bias" [id=89, type="get_attr"]; -"90 encoder_layers_encoder_layer_10_mlp_3_bias" [id=90, type="get_attr"]; -"91 encoder_layers_encoder_layer_11_ln_1_weight" [id=91, type="get_attr"]; -"92 encoder_layers_encoder_layer_11_ln_1_bias" [id=92, type="get_attr"]; -"93 encoder_layers_encoder_layer_11_self_attention_in_proj_bias" [id=93, type="get_attr"]; -"94 encoder_layers_encoder_layer_11_self_attention_out_proj_bias" [id=94, type="get_attr"]; -"95 encoder_layers_encoder_layer_11_ln_2_weight" [id=95, type="get_attr"]; -"96 encoder_layers_encoder_layer_11_ln_2_bias" [id=96, type="get_attr"]; -"97 encoder_layers_encoder_layer_11_mlp_0_bias" [id=97, type="get_attr"]; -"98 encoder_layers_encoder_layer_11_mlp_3_bias" [id=98, type="get_attr"]; -"99 encoder_ln_weight" [id=99, type="get_attr"]; -"100 encoder_ln_bias" [id=100, type="get_attr"]; -"101 heads_head_bias" [id=101, type="get_attr"]; -"102 x" [id=102, type=input]; -"103 quantize_per_tensor_1" [id=103, type="quantize_per_tensor"]; -"104 dequantize_per_tensor_2" [id=104, type="dequantize_per_tensor"]; -"105 _frozen_param1" [id=105, type="get_attr"]; -"106 dequantize_per_tensor_3" [id=106, type="dequantize_per_tensor"]; -"107 conv2d" [id=107, type=conv2d]; -"108 quantize_per_tensor_4" [id=108, type="quantize_per_tensor"]; -"109 dequantize_per_tensor_5" [id=109, type="dequantize_per_tensor"]; -"110 reshape" [id=110, type=reshape]; -"111 permute" [id=111, type=permute]; -"112 quantize_per_tensor_6" [id=112, type="quantize_per_tensor"]; -"113 dequantize_per_tensor_7" [id=113, type="dequantize_per_tensor"]; -"114 _frozen_param2" [id=114, type="get_attr"]; -"115 dequantize_per_tensor_8" [id=115, type="dequantize_per_tensor"]; -"116 cat" [id=116, type=cat]; -"117 quantize_per_tensor_9" [id=117, type="quantize_per_tensor"]; -"118 dequantize_per_tensor_10" [id=118, type="dequantize_per_tensor"]; -"119 add" [id=119, 
type=add]; -"120 quantize_per_tensor_11" [id=120, type="quantize_per_tensor"]; -"121 dequantize_per_tensor_12" [id=121, type="dequantize_per_tensor"]; -"122 dropout" [id=122, type=dropout]; -"123 layer_norm" [id=123, type="layer_norm"]; -"124 transpose" [id=124, type=transpose]; -"125 transpose_0_0_nncf_smooth_quant_0" [id=125, type="call_module"]; -"126 quantize_per_tensor_13" [id=126, type="quantize_per_tensor"]; -"127 dequantize_per_tensor_14" [id=127, type="dequantize_per_tensor"]; -"128 _frozen_param3" [id=128, type="get_attr"]; -"129 dequantize_per_tensor_15" [id=129, type="dequantize_per_tensor"]; -"130 linear" [id=130, type=linear]; -"131 quantize_per_tensor_16" [id=131, type="quantize_per_tensor"]; -"132 dequantize_per_tensor_17" [id=132, type="dequantize_per_tensor"]; -"133 unflatten" [id=133, type=unflatten]; -"134 unsqueeze" [id=134, type=unsqueeze]; -"135 transpose_1" [id=135, type=transpose]; -"136 squeeze" [id=136, type=squeeze]; -"137 contiguous" [id=137, type=contiguous]; -"138 select" [id=138, type=select]; -"139 select_1" [id=139, type=select]; -"140 select_2" [id=140, type=select]; -"141 view" [id=141, type=view]; -"142 transpose_2" [id=142, type=transpose]; -"143 view_1" [id=143, type=view]; -"144 transpose_3" [id=144, type=transpose]; -"145 view_2" [id=145, type=view]; -"146 transpose_4" [id=146, type=transpose]; -"147 view_3" [id=147, type=view]; -"148 view_4" [id=148, type=view]; -"149 view_5" [id=149, type=view]; -"150 scaled_dot_product_attention" [id=150, type="scaled_dot_product_attention"]; -"151 permute_1" [id=151, type=permute]; -"152 view_6" [id=152, type=view]; -"153 view_6_0_0_nncf_smooth_quant_0" [id=153, type="call_module"]; -"154 quantize_per_tensor_18" [id=154, type="quantize_per_tensor"]; -"155 dequantize_per_tensor_19" [id=155, type="dequantize_per_tensor"]; -"156 _frozen_param4" [id=156, type="get_attr"]; -"157 dequantize_per_tensor_20" [id=157, type="dequantize_per_tensor"]; -"158 linear_1" [id=158, type=linear]; -"159 
quantize_per_tensor_21" [id=159, type="quantize_per_tensor"]; -"160 dequantize_per_tensor_22" [id=160, type="dequantize_per_tensor"]; -"161 view_7" [id=161, type=view]; -"162 quantize_per_tensor_23" [id=162, type="quantize_per_tensor"]; -"163 dequantize_per_tensor_24" [id=163, type="dequantize_per_tensor"]; -"164 transpose_5" [id=164, type=transpose]; -"165 dropout_1" [id=165, type=dropout]; -"166 quantize_per_tensor_25" [id=166, type="quantize_per_tensor"]; -"167 dequantize_per_tensor_26" [id=167, type="dequantize_per_tensor"]; -"168 quantize_per_tensor_27" [id=168, type="quantize_per_tensor"]; -"169 dequantize_per_tensor_28" [id=169, type="dequantize_per_tensor"]; -"170 add_1" [id=170, type=add]; -"171 quantize_per_tensor_29" [id=171, type="quantize_per_tensor"]; -"172 dequantize_per_tensor_30" [id=172, type="dequantize_per_tensor"]; -"173 dequantize_per_tensor_31" [id=173, type="dequantize_per_tensor"]; -"174 layer_norm_1" [id=174, type="layer_norm"]; -"175 layer_norm_1_0_0_nncf_smooth_quant_0" [id=175, type="call_module"]; -"176 quantize_per_tensor_32" [id=176, type="quantize_per_tensor"]; -"177 dequantize_per_tensor_33" [id=177, type="dequantize_per_tensor"]; -"178 _frozen_param5" [id=178, type="get_attr"]; -"179 dequantize_per_tensor_34" [id=179, type="dequantize_per_tensor"]; -"180 linear_2" [id=180, type=linear]; -"181 quantize_per_tensor_35" [id=181, type="quantize_per_tensor"]; -"182 dequantize_per_tensor_36" [id=182, type="dequantize_per_tensor"]; -"183 gelu" [id=183, type=gelu]; -"184 dropout_2" [id=184, type=dropout]; -"185 dropout_2_0_0_nncf_smooth_quant_0" [id=185, type="call_module"]; -"186 quantize_per_tensor_37" [id=186, type="quantize_per_tensor"]; -"187 dequantize_per_tensor_38" [id=187, type="dequantize_per_tensor"]; -"188 _frozen_param6" [id=188, type="get_attr"]; -"189 dequantize_per_tensor_39" [id=189, type="dequantize_per_tensor"]; -"190 linear_3" [id=190, type=linear]; -"191 quantize_per_tensor_40" [id=191, type="quantize_per_tensor"]; 
-"192 dequantize_per_tensor_41" [id=192, type="dequantize_per_tensor"]; -"193 dropout_3" [id=193, type=dropout]; -"194 quantize_per_tensor_42" [id=194, type="quantize_per_tensor"]; -"195 dequantize_per_tensor_43" [id=195, type="dequantize_per_tensor"]; -"196 add_2" [id=196, type=add]; -"197 quantize_per_tensor_44" [id=197, type="quantize_per_tensor"]; -"198 dequantize_per_tensor_45" [id=198, type="dequantize_per_tensor"]; -"199 dequantize_per_tensor_46" [id=199, type="dequantize_per_tensor"]; -"200 layer_norm_2" [id=200, type="layer_norm"]; -"201 transpose_6" [id=201, type=transpose]; -"202 transpose_6_0_0_nncf_smooth_quant_0" [id=202, type="call_module"]; -"203 quantize_per_tensor_47" [id=203, type="quantize_per_tensor"]; -"204 dequantize_per_tensor_48" [id=204, type="dequantize_per_tensor"]; -"205 _frozen_param7" [id=205, type="get_attr"]; -"206 dequantize_per_tensor_49" [id=206, type="dequantize_per_tensor"]; -"207 linear_4" [id=207, type=linear]; -"208 quantize_per_tensor_50" [id=208, type="quantize_per_tensor"]; -"209 dequantize_per_tensor_51" [id=209, type="dequantize_per_tensor"]; -"210 unflatten_1" [id=210, type=unflatten]; -"211 unsqueeze_1" [id=211, type=unsqueeze]; -"212 transpose_7" [id=212, type=transpose]; -"213 squeeze_1" [id=213, type=squeeze]; -"214 contiguous_1" [id=214, type=contiguous]; -"215 select_3" [id=215, type=select]; -"216 select_4" [id=216, type=select]; -"217 select_5" [id=217, type=select]; -"218 view_8" [id=218, type=view]; -"219 transpose_8" [id=219, type=transpose]; -"220 view_9" [id=220, type=view]; -"221 transpose_9" [id=221, type=transpose]; -"222 view_10" [id=222, type=view]; -"223 transpose_10" [id=223, type=transpose]; -"224 view_11" [id=224, type=view]; -"225 view_12" [id=225, type=view]; -"226 view_13" [id=226, type=view]; -"227 scaled_dot_product_attention_1" [id=227, type="scaled_dot_product_attention"]; -"228 permute_2" [id=228, type=permute]; -"229 view_14" [id=229, type=view]; -"230 view_14_0_0_nncf_smooth_quant_0" 
[id=230, type="call_module"]; -"231 quantize_per_tensor_52" [id=231, type="quantize_per_tensor"]; -"232 dequantize_per_tensor_53" [id=232, type="dequantize_per_tensor"]; -"233 _frozen_param8" [id=233, type="get_attr"]; -"234 dequantize_per_tensor_54" [id=234, type="dequantize_per_tensor"]; -"235 linear_5" [id=235, type=linear]; -"236 quantize_per_tensor_55" [id=236, type="quantize_per_tensor"]; -"237 dequantize_per_tensor_56" [id=237, type="dequantize_per_tensor"]; -"238 view_15" [id=238, type=view]; -"239 quantize_per_tensor_57" [id=239, type="quantize_per_tensor"]; -"240 dequantize_per_tensor_58" [id=240, type="dequantize_per_tensor"]; -"241 transpose_11" [id=241, type=transpose]; -"242 dropout_4" [id=242, type=dropout]; -"243 quantize_per_tensor_59" [id=243, type="quantize_per_tensor"]; -"244 dequantize_per_tensor_60" [id=244, type="dequantize_per_tensor"]; -"245 add_3" [id=245, type=add]; -"246 quantize_per_tensor_61" [id=246, type="quantize_per_tensor"]; -"247 dequantize_per_tensor_62" [id=247, type="dequantize_per_tensor"]; -"248 dequantize_per_tensor_63" [id=248, type="dequantize_per_tensor"]; -"249 layer_norm_3" [id=249, type="layer_norm"]; -"250 layer_norm_3_0_0_nncf_smooth_quant_0" [id=250, type="call_module"]; -"251 quantize_per_tensor_64" [id=251, type="quantize_per_tensor"]; -"252 dequantize_per_tensor_65" [id=252, type="dequantize_per_tensor"]; -"253 _frozen_param9" [id=253, type="get_attr"]; -"254 dequantize_per_tensor_66" [id=254, type="dequantize_per_tensor"]; -"255 linear_6" [id=255, type=linear]; -"256 quantize_per_tensor_67" [id=256, type="quantize_per_tensor"]; -"257 dequantize_per_tensor_68" [id=257, type="dequantize_per_tensor"]; -"258 gelu_1" [id=258, type=gelu]; -"259 dropout_5" [id=259, type=dropout]; -"260 dropout_5_0_0_nncf_smooth_quant_0" [id=260, type="call_module"]; -"261 quantize_per_tensor_69" [id=261, type="quantize_per_tensor"]; -"262 dequantize_per_tensor_70" [id=262, type="dequantize_per_tensor"]; -"263 _frozen_param10" [id=263, 
type="get_attr"]; -"264 dequantize_per_tensor_71" [id=264, type="dequantize_per_tensor"]; -"265 linear_7" [id=265, type=linear]; -"266 quantize_per_tensor_72" [id=266, type="quantize_per_tensor"]; -"267 dequantize_per_tensor_73" [id=267, type="dequantize_per_tensor"]; -"268 dropout_6" [id=268, type=dropout]; -"269 quantize_per_tensor_74" [id=269, type="quantize_per_tensor"]; -"270 dequantize_per_tensor_75" [id=270, type="dequantize_per_tensor"]; -"271 add_4" [id=271, type=add]; -"272 quantize_per_tensor_76" [id=272, type="quantize_per_tensor"]; -"273 dequantize_per_tensor_77" [id=273, type="dequantize_per_tensor"]; -"274 dequantize_per_tensor_78" [id=274, type="dequantize_per_tensor"]; -"275 layer_norm_4" [id=275, type="layer_norm"]; -"276 transpose_12" [id=276, type=transpose]; -"277 transpose_12_0_0_nncf_smooth_quant_0" [id=277, type="call_module"]; -"278 quantize_per_tensor_79" [id=278, type="quantize_per_tensor"]; -"279 dequantize_per_tensor_80" [id=279, type="dequantize_per_tensor"]; -"280 _frozen_param11" [id=280, type="get_attr"]; -"281 dequantize_per_tensor_81" [id=281, type="dequantize_per_tensor"]; -"282 linear_8" [id=282, type=linear]; -"283 quantize_per_tensor_82" [id=283, type="quantize_per_tensor"]; -"284 dequantize_per_tensor_83" [id=284, type="dequantize_per_tensor"]; -"285 unflatten_2" [id=285, type=unflatten]; -"286 unsqueeze_2" [id=286, type=unsqueeze]; -"287 transpose_13" [id=287, type=transpose]; -"288 squeeze_2" [id=288, type=squeeze]; -"289 contiguous_2" [id=289, type=contiguous]; -"290 select_6" [id=290, type=select]; -"291 select_7" [id=291, type=select]; -"292 select_8" [id=292, type=select]; -"293 view_16" [id=293, type=view]; -"294 transpose_14" [id=294, type=transpose]; -"295 view_17" [id=295, type=view]; -"296 transpose_15" [id=296, type=transpose]; -"297 view_18" [id=297, type=view]; -"298 transpose_16" [id=298, type=transpose]; -"299 view_19" [id=299, type=view]; -"300 view_20" [id=300, type=view]; -"301 view_21" [id=301, type=view]; 
-"302 scaled_dot_product_attention_2" [id=302, type="scaled_dot_product_attention"]; -"303 permute_3" [id=303, type=permute]; -"304 view_22" [id=304, type=view]; -"305 view_22_0_0_nncf_smooth_quant_0" [id=305, type="call_module"]; -"306 quantize_per_tensor_84" [id=306, type="quantize_per_tensor"]; -"307 dequantize_per_tensor_85" [id=307, type="dequantize_per_tensor"]; -"308 _frozen_param12" [id=308, type="get_attr"]; -"309 dequantize_per_tensor_86" [id=309, type="dequantize_per_tensor"]; -"310 linear_9" [id=310, type=linear]; -"311 quantize_per_tensor_87" [id=311, type="quantize_per_tensor"]; -"312 dequantize_per_tensor_88" [id=312, type="dequantize_per_tensor"]; -"313 view_23" [id=313, type=view]; -"314 quantize_per_tensor_89" [id=314, type="quantize_per_tensor"]; -"315 dequantize_per_tensor_90" [id=315, type="dequantize_per_tensor"]; -"316 transpose_17" [id=316, type=transpose]; -"317 dropout_7" [id=317, type=dropout]; -"318 quantize_per_tensor_91" [id=318, type="quantize_per_tensor"]; -"319 dequantize_per_tensor_92" [id=319, type="dequantize_per_tensor"]; -"320 add_5" [id=320, type=add]; -"321 quantize_per_tensor_93" [id=321, type="quantize_per_tensor"]; -"322 dequantize_per_tensor_94" [id=322, type="dequantize_per_tensor"]; -"323 dequantize_per_tensor_95" [id=323, type="dequantize_per_tensor"]; -"324 layer_norm_5" [id=324, type="layer_norm"]; -"325 layer_norm_5_0_0_nncf_smooth_quant_0" [id=325, type="call_module"]; -"326 quantize_per_tensor_96" [id=326, type="quantize_per_tensor"]; -"327 dequantize_per_tensor_97" [id=327, type="dequantize_per_tensor"]; -"328 _frozen_param13" [id=328, type="get_attr"]; -"329 dequantize_per_tensor_98" [id=329, type="dequantize_per_tensor"]; -"330 linear_10" [id=330, type=linear]; -"331 quantize_per_tensor_99" [id=331, type="quantize_per_tensor"]; -"332 dequantize_per_tensor_100" [id=332, type="dequantize_per_tensor"]; -"333 gelu_2" [id=333, type=gelu]; -"334 dropout_8" [id=334, type=dropout]; -"335 
dropout_8_0_0_nncf_smooth_quant_0" [id=335, type="call_module"]; -"336 quantize_per_tensor_101" [id=336, type="quantize_per_tensor"]; -"337 dequantize_per_tensor_102" [id=337, type="dequantize_per_tensor"]; -"338 _frozen_param14" [id=338, type="get_attr"]; -"339 dequantize_per_tensor_103" [id=339, type="dequantize_per_tensor"]; -"340 linear_11" [id=340, type=linear]; -"341 quantize_per_tensor_104" [id=341, type="quantize_per_tensor"]; -"342 dequantize_per_tensor_105" [id=342, type="dequantize_per_tensor"]; -"343 dropout_9" [id=343, type=dropout]; -"344 quantize_per_tensor_106" [id=344, type="quantize_per_tensor"]; -"345 dequantize_per_tensor_107" [id=345, type="dequantize_per_tensor"]; -"346 add_6" [id=346, type=add]; -"347 quantize_per_tensor_108" [id=347, type="quantize_per_tensor"]; -"348 dequantize_per_tensor_109" [id=348, type="dequantize_per_tensor"]; -"349 dequantize_per_tensor_110" [id=349, type="dequantize_per_tensor"]; -"350 layer_norm_6" [id=350, type="layer_norm"]; -"351 transpose_18" [id=351, type=transpose]; -"352 transpose_18_0_0_nncf_smooth_quant_0" [id=352, type="call_module"]; -"353 quantize_per_tensor_111" [id=353, type="quantize_per_tensor"]; -"354 dequantize_per_tensor_112" [id=354, type="dequantize_per_tensor"]; -"355 _frozen_param15" [id=355, type="get_attr"]; -"356 dequantize_per_tensor_113" [id=356, type="dequantize_per_tensor"]; -"357 linear_12" [id=357, type=linear]; -"358 quantize_per_tensor_114" [id=358, type="quantize_per_tensor"]; -"359 dequantize_per_tensor_115" [id=359, type="dequantize_per_tensor"]; -"360 unflatten_3" [id=360, type=unflatten]; -"361 unsqueeze_3" [id=361, type=unsqueeze]; -"362 transpose_19" [id=362, type=transpose]; -"363 squeeze_3" [id=363, type=squeeze]; -"364 contiguous_3" [id=364, type=contiguous]; -"365 select_9" [id=365, type=select]; -"366 select_10" [id=366, type=select]; -"367 select_11" [id=367, type=select]; -"368 view_24" [id=368, type=view]; -"369 transpose_20" [id=369, type=transpose]; -"370 view_25" 
[id=370, type=view]; -"371 transpose_21" [id=371, type=transpose]; -"372 view_26" [id=372, type=view]; -"373 transpose_22" [id=373, type=transpose]; -"374 view_27" [id=374, type=view]; -"375 view_28" [id=375, type=view]; -"376 view_29" [id=376, type=view]; -"377 scaled_dot_product_attention_3" [id=377, type="scaled_dot_product_attention"]; -"378 permute_4" [id=378, type=permute]; -"379 view_30" [id=379, type=view]; -"380 view_30_0_0_nncf_smooth_quant_0" [id=380, type="call_module"]; -"381 quantize_per_tensor_116" [id=381, type="quantize_per_tensor"]; -"382 dequantize_per_tensor_117" [id=382, type="dequantize_per_tensor"]; -"383 _frozen_param16" [id=383, type="get_attr"]; -"384 dequantize_per_tensor_118" [id=384, type="dequantize_per_tensor"]; -"385 linear_13" [id=385, type=linear]; -"386 quantize_per_tensor_119" [id=386, type="quantize_per_tensor"]; -"387 dequantize_per_tensor_120" [id=387, type="dequantize_per_tensor"]; -"388 view_31" [id=388, type=view]; -"389 quantize_per_tensor_121" [id=389, type="quantize_per_tensor"]; -"390 dequantize_per_tensor_122" [id=390, type="dequantize_per_tensor"]; -"391 transpose_23" [id=391, type=transpose]; -"392 dropout_10" [id=392, type=dropout]; -"393 quantize_per_tensor_123" [id=393, type="quantize_per_tensor"]; -"394 dequantize_per_tensor_124" [id=394, type="dequantize_per_tensor"]; -"395 add_7" [id=395, type=add]; -"396 quantize_per_tensor_125" [id=396, type="quantize_per_tensor"]; -"397 dequantize_per_tensor_126" [id=397, type="dequantize_per_tensor"]; -"398 dequantize_per_tensor_127" [id=398, type="dequantize_per_tensor"]; -"399 layer_norm_7" [id=399, type="layer_norm"]; -"400 layer_norm_7_0_0_nncf_smooth_quant_0" [id=400, type="call_module"]; -"401 quantize_per_tensor_128" [id=401, type="quantize_per_tensor"]; -"402 dequantize_per_tensor_129" [id=402, type="dequantize_per_tensor"]; -"403 _frozen_param17" [id=403, type="get_attr"]; -"404 dequantize_per_tensor_130" [id=404, type="dequantize_per_tensor"]; -"405 linear_14" 
[id=405, type=linear]; -"406 quantize_per_tensor_131" [id=406, type="quantize_per_tensor"]; -"407 dequantize_per_tensor_132" [id=407, type="dequantize_per_tensor"]; -"408 gelu_3" [id=408, type=gelu]; -"409 dropout_11" [id=409, type=dropout]; -"410 dropout_11_0_0_nncf_smooth_quant_0" [id=410, type="call_module"]; -"411 quantize_per_tensor_133" [id=411, type="quantize_per_tensor"]; -"412 dequantize_per_tensor_134" [id=412, type="dequantize_per_tensor"]; -"413 _frozen_param18" [id=413, type="get_attr"]; -"414 dequantize_per_tensor_135" [id=414, type="dequantize_per_tensor"]; -"415 linear_15" [id=415, type=linear]; -"416 quantize_per_tensor_136" [id=416, type="quantize_per_tensor"]; -"417 dequantize_per_tensor_137" [id=417, type="dequantize_per_tensor"]; -"418 dropout_12" [id=418, type=dropout]; -"419 quantize_per_tensor_138" [id=419, type="quantize_per_tensor"]; -"420 dequantize_per_tensor_139" [id=420, type="dequantize_per_tensor"]; -"421 add_8" [id=421, type=add]; -"422 quantize_per_tensor_140" [id=422, type="quantize_per_tensor"]; -"423 dequantize_per_tensor_141" [id=423, type="dequantize_per_tensor"]; -"424 dequantize_per_tensor_142" [id=424, type="dequantize_per_tensor"]; -"425 layer_norm_8" [id=425, type="layer_norm"]; -"426 transpose_24" [id=426, type=transpose]; -"427 transpose_24_0_0_nncf_smooth_quant_0" [id=427, type="call_module"]; -"428 quantize_per_tensor_143" [id=428, type="quantize_per_tensor"]; -"429 dequantize_per_tensor_144" [id=429, type="dequantize_per_tensor"]; -"430 _frozen_param19" [id=430, type="get_attr"]; -"431 dequantize_per_tensor_145" [id=431, type="dequantize_per_tensor"]; -"432 linear_16" [id=432, type=linear]; -"433 quantize_per_tensor_146" [id=433, type="quantize_per_tensor"]; -"434 dequantize_per_tensor_147" [id=434, type="dequantize_per_tensor"]; -"435 unflatten_4" [id=435, type=unflatten]; -"436 unsqueeze_4" [id=436, type=unsqueeze]; -"437 transpose_25" [id=437, type=transpose]; -"438 squeeze_4" [id=438, type=squeeze]; -"439 
contiguous_4" [id=439, type=contiguous]; -"440 select_12" [id=440, type=select]; -"441 select_13" [id=441, type=select]; -"442 select_14" [id=442, type=select]; -"443 view_32" [id=443, type=view]; -"444 transpose_26" [id=444, type=transpose]; -"445 view_33" [id=445, type=view]; -"446 transpose_27" [id=446, type=transpose]; -"447 view_34" [id=447, type=view]; -"448 transpose_28" [id=448, type=transpose]; -"449 view_35" [id=449, type=view]; -"450 view_36" [id=450, type=view]; -"451 view_37" [id=451, type=view]; -"452 scaled_dot_product_attention_4" [id=452, type="scaled_dot_product_attention"]; -"453 permute_5" [id=453, type=permute]; -"454 view_38" [id=454, type=view]; -"455 view_38_0_0_nncf_smooth_quant_0" [id=455, type="call_module"]; -"456 quantize_per_tensor_148" [id=456, type="quantize_per_tensor"]; -"457 dequantize_per_tensor_149" [id=457, type="dequantize_per_tensor"]; -"458 _frozen_param20" [id=458, type="get_attr"]; -"459 dequantize_per_tensor_150" [id=459, type="dequantize_per_tensor"]; -"460 linear_17" [id=460, type=linear]; -"461 quantize_per_tensor_151" [id=461, type="quantize_per_tensor"]; -"462 dequantize_per_tensor_152" [id=462, type="dequantize_per_tensor"]; -"463 view_39" [id=463, type=view]; -"464 quantize_per_tensor_153" [id=464, type="quantize_per_tensor"]; -"465 dequantize_per_tensor_154" [id=465, type="dequantize_per_tensor"]; -"466 transpose_29" [id=466, type=transpose]; -"467 dropout_13" [id=467, type=dropout]; -"468 quantize_per_tensor_155" [id=468, type="quantize_per_tensor"]; -"469 dequantize_per_tensor_156" [id=469, type="dequantize_per_tensor"]; -"470 add_9" [id=470, type=add]; -"471 quantize_per_tensor_157" [id=471, type="quantize_per_tensor"]; -"472 dequantize_per_tensor_158" [id=472, type="dequantize_per_tensor"]; -"473 dequantize_per_tensor_159" [id=473, type="dequantize_per_tensor"]; -"474 layer_norm_9" [id=474, type="layer_norm"]; -"475 layer_norm_9_0_0_nncf_smooth_quant_0" [id=475, type="call_module"]; -"476 
quantize_per_tensor_160" [id=476, type="quantize_per_tensor"]; -"477 dequantize_per_tensor_161" [id=477, type="dequantize_per_tensor"]; -"478 _frozen_param21" [id=478, type="get_attr"]; -"479 dequantize_per_tensor_162" [id=479, type="dequantize_per_tensor"]; -"480 linear_18" [id=480, type=linear]; -"481 quantize_per_tensor_163" [id=481, type="quantize_per_tensor"]; -"482 dequantize_per_tensor_164" [id=482, type="dequantize_per_tensor"]; -"483 gelu_4" [id=483, type=gelu]; -"484 dropout_14" [id=484, type=dropout]; -"485 dropout_14_0_0_nncf_smooth_quant_0" [id=485, type="call_module"]; -"486 quantize_per_tensor_165" [id=486, type="quantize_per_tensor"]; -"487 dequantize_per_tensor_166" [id=487, type="dequantize_per_tensor"]; -"488 _frozen_param22" [id=488, type="get_attr"]; -"489 dequantize_per_tensor_167" [id=489, type="dequantize_per_tensor"]; -"490 linear_19" [id=490, type=linear]; -"491 quantize_per_tensor_168" [id=491, type="quantize_per_tensor"]; -"492 dequantize_per_tensor_169" [id=492, type="dequantize_per_tensor"]; -"493 dropout_15" [id=493, type=dropout]; -"494 quantize_per_tensor_170" [id=494, type="quantize_per_tensor"]; -"495 dequantize_per_tensor_171" [id=495, type="dequantize_per_tensor"]; -"496 add_10" [id=496, type=add]; -"497 quantize_per_tensor_172" [id=497, type="quantize_per_tensor"]; -"498 dequantize_per_tensor_173" [id=498, type="dequantize_per_tensor"]; -"499 dequantize_per_tensor_174" [id=499, type="dequantize_per_tensor"]; -"500 layer_norm_10" [id=500, type="layer_norm"]; -"501 transpose_30" [id=501, type=transpose]; -"502 transpose_30_0_0_nncf_smooth_quant_0" [id=502, type="call_module"]; -"503 quantize_per_tensor_175" [id=503, type="quantize_per_tensor"]; -"504 dequantize_per_tensor_176" [id=504, type="dequantize_per_tensor"]; -"505 _frozen_param23" [id=505, type="get_attr"]; -"506 dequantize_per_tensor_177" [id=506, type="dequantize_per_tensor"]; -"507 linear_20" [id=507, type=linear]; -"508 quantize_per_tensor_178" [id=508, 
type="quantize_per_tensor"]; -"509 dequantize_per_tensor_179" [id=509, type="dequantize_per_tensor"]; -"510 unflatten_5" [id=510, type=unflatten]; -"511 unsqueeze_5" [id=511, type=unsqueeze]; -"512 transpose_31" [id=512, type=transpose]; -"513 squeeze_5" [id=513, type=squeeze]; -"514 contiguous_5" [id=514, type=contiguous]; -"515 select_15" [id=515, type=select]; -"516 select_16" [id=516, type=select]; -"517 select_17" [id=517, type=select]; -"518 view_40" [id=518, type=view]; -"519 transpose_32" [id=519, type=transpose]; -"520 view_41" [id=520, type=view]; -"521 transpose_33" [id=521, type=transpose]; -"522 view_42" [id=522, type=view]; -"523 transpose_34" [id=523, type=transpose]; -"524 view_43" [id=524, type=view]; -"525 view_44" [id=525, type=view]; -"526 view_45" [id=526, type=view]; -"527 scaled_dot_product_attention_5" [id=527, type="scaled_dot_product_attention"]; -"528 permute_6" [id=528, type=permute]; -"529 view_46" [id=529, type=view]; -"530 view_46_0_0_nncf_smooth_quant_0" [id=530, type="call_module"]; -"531 quantize_per_tensor_180" [id=531, type="quantize_per_tensor"]; -"532 dequantize_per_tensor_181" [id=532, type="dequantize_per_tensor"]; -"533 _frozen_param24" [id=533, type="get_attr"]; -"534 dequantize_per_tensor_182" [id=534, type="dequantize_per_tensor"]; -"535 linear_21" [id=535, type=linear]; -"536 quantize_per_tensor_183" [id=536, type="quantize_per_tensor"]; -"537 dequantize_per_tensor_184" [id=537, type="dequantize_per_tensor"]; -"538 view_47" [id=538, type=view]; -"539 quantize_per_tensor_185" [id=539, type="quantize_per_tensor"]; -"540 dequantize_per_tensor_186" [id=540, type="dequantize_per_tensor"]; -"541 transpose_35" [id=541, type=transpose]; -"542 dropout_16" [id=542, type=dropout]; -"543 quantize_per_tensor_187" [id=543, type="quantize_per_tensor"]; -"544 dequantize_per_tensor_188" [id=544, type="dequantize_per_tensor"]; -"545 add_11" [id=545, type=add]; -"546 quantize_per_tensor_189" [id=546, type="quantize_per_tensor"]; -"547 
dequantize_per_tensor_190" [id=547, type="dequantize_per_tensor"]; -"548 dequantize_per_tensor_191" [id=548, type="dequantize_per_tensor"]; -"549 layer_norm_11" [id=549, type="layer_norm"]; -"550 layer_norm_11_0_0_nncf_smooth_quant_0" [id=550, type="call_module"]; -"551 quantize_per_tensor_192" [id=551, type="quantize_per_tensor"]; -"552 dequantize_per_tensor_193" [id=552, type="dequantize_per_tensor"]; -"553 _frozen_param25" [id=553, type="get_attr"]; -"554 dequantize_per_tensor_194" [id=554, type="dequantize_per_tensor"]; -"555 linear_22" [id=555, type=linear]; -"556 quantize_per_tensor_195" [id=556, type="quantize_per_tensor"]; -"557 dequantize_per_tensor_196" [id=557, type="dequantize_per_tensor"]; -"558 gelu_5" [id=558, type=gelu]; -"559 dropout_17" [id=559, type=dropout]; -"560 dropout_17_0_0_nncf_smooth_quant_0" [id=560, type="call_module"]; -"561 quantize_per_tensor_197" [id=561, type="quantize_per_tensor"]; -"562 dequantize_per_tensor_198" [id=562, type="dequantize_per_tensor"]; -"563 _frozen_param26" [id=563, type="get_attr"]; -"564 dequantize_per_tensor_199" [id=564, type="dequantize_per_tensor"]; -"565 linear_23" [id=565, type=linear]; -"566 quantize_per_tensor_200" [id=566, type="quantize_per_tensor"]; -"567 dequantize_per_tensor_201" [id=567, type="dequantize_per_tensor"]; -"568 dropout_18" [id=568, type=dropout]; -"569 quantize_per_tensor_202" [id=569, type="quantize_per_tensor"]; -"570 dequantize_per_tensor_203" [id=570, type="dequantize_per_tensor"]; -"571 add_12" [id=571, type=add]; -"572 quantize_per_tensor_204" [id=572, type="quantize_per_tensor"]; -"573 dequantize_per_tensor_205" [id=573, type="dequantize_per_tensor"]; -"574 dequantize_per_tensor_206" [id=574, type="dequantize_per_tensor"]; -"575 layer_norm_12" [id=575, type="layer_norm"]; -"576 transpose_36" [id=576, type=transpose]; -"577 transpose_36_0_0_nncf_smooth_quant_0" [id=577, type="call_module"]; -"578 quantize_per_tensor_207" [id=578, type="quantize_per_tensor"]; -"579 
dequantize_per_tensor_208" [id=579, type="dequantize_per_tensor"]; -"580 _frozen_param27" [id=580, type="get_attr"]; -"581 dequantize_per_tensor_209" [id=581, type="dequantize_per_tensor"]; -"582 linear_24" [id=582, type=linear]; -"583 quantize_per_tensor_210" [id=583, type="quantize_per_tensor"]; -"584 dequantize_per_tensor_211" [id=584, type="dequantize_per_tensor"]; -"585 unflatten_6" [id=585, type=unflatten]; -"586 unsqueeze_6" [id=586, type=unsqueeze]; -"587 transpose_37" [id=587, type=transpose]; -"588 squeeze_6" [id=588, type=squeeze]; -"589 contiguous_6" [id=589, type=contiguous]; -"590 select_18" [id=590, type=select]; -"591 select_19" [id=591, type=select]; -"592 select_20" [id=592, type=select]; -"593 view_48" [id=593, type=view]; -"594 transpose_38" [id=594, type=transpose]; -"595 view_49" [id=595, type=view]; -"596 transpose_39" [id=596, type=transpose]; -"597 view_50" [id=597, type=view]; -"598 transpose_40" [id=598, type=transpose]; -"599 view_51" [id=599, type=view]; -"600 view_52" [id=600, type=view]; -"601 view_53" [id=601, type=view]; -"602 scaled_dot_product_attention_6" [id=602, type="scaled_dot_product_attention"]; -"603 permute_7" [id=603, type=permute]; -"604 view_54" [id=604, type=view]; -"605 view_54_0_0_nncf_smooth_quant_0" [id=605, type="call_module"]; -"606 quantize_per_tensor_212" [id=606, type="quantize_per_tensor"]; -"607 dequantize_per_tensor_213" [id=607, type="dequantize_per_tensor"]; -"608 _frozen_param28" [id=608, type="get_attr"]; -"609 dequantize_per_tensor_214" [id=609, type="dequantize_per_tensor"]; -"610 linear_25" [id=610, type=linear]; -"611 quantize_per_tensor_215" [id=611, type="quantize_per_tensor"]; -"612 dequantize_per_tensor_216" [id=612, type="dequantize_per_tensor"]; -"613 view_55" [id=613, type=view]; -"614 quantize_per_tensor_217" [id=614, type="quantize_per_tensor"]; -"615 dequantize_per_tensor_218" [id=615, type="dequantize_per_tensor"]; -"616 transpose_41" [id=616, type=transpose]; -"617 dropout_19" [id=617, 
type=dropout]; -"618 quantize_per_tensor_219" [id=618, type="quantize_per_tensor"]; -"619 dequantize_per_tensor_220" [id=619, type="dequantize_per_tensor"]; -"620 add_13" [id=620, type=add]; -"621 quantize_per_tensor_221" [id=621, type="quantize_per_tensor"]; -"622 dequantize_per_tensor_222" [id=622, type="dequantize_per_tensor"]; -"623 dequantize_per_tensor_223" [id=623, type="dequantize_per_tensor"]; -"624 layer_norm_13" [id=624, type="layer_norm"]; -"625 layer_norm_13_0_0_nncf_smooth_quant_0" [id=625, type="call_module"]; -"626 quantize_per_tensor_224" [id=626, type="quantize_per_tensor"]; -"627 dequantize_per_tensor_225" [id=627, type="dequantize_per_tensor"]; -"628 _frozen_param29" [id=628, type="get_attr"]; -"629 dequantize_per_tensor_226" [id=629, type="dequantize_per_tensor"]; -"630 linear_26" [id=630, type=linear]; -"631 quantize_per_tensor_227" [id=631, type="quantize_per_tensor"]; -"632 dequantize_per_tensor_228" [id=632, type="dequantize_per_tensor"]; -"633 gelu_6" [id=633, type=gelu]; -"634 dropout_20" [id=634, type=dropout]; -"635 dropout_20_0_0_nncf_smooth_quant_0" [id=635, type="call_module"]; -"636 quantize_per_tensor_229" [id=636, type="quantize_per_tensor"]; -"637 dequantize_per_tensor_230" [id=637, type="dequantize_per_tensor"]; -"638 _frozen_param30" [id=638, type="get_attr"]; -"639 dequantize_per_tensor_231" [id=639, type="dequantize_per_tensor"]; -"640 linear_27" [id=640, type=linear]; -"641 quantize_per_tensor_232" [id=641, type="quantize_per_tensor"]; -"642 dequantize_per_tensor_233" [id=642, type="dequantize_per_tensor"]; -"643 dropout_21" [id=643, type=dropout]; -"644 quantize_per_tensor_234" [id=644, type="quantize_per_tensor"]; -"645 dequantize_per_tensor_235" [id=645, type="dequantize_per_tensor"]; -"646 add_14" [id=646, type=add]; -"647 quantize_per_tensor_236" [id=647, type="quantize_per_tensor"]; -"648 dequantize_per_tensor_237" [id=648, type="dequantize_per_tensor"]; -"649 dequantize_per_tensor_238" [id=649, 
type="dequantize_per_tensor"]; -"650 layer_norm_14" [id=650, type="layer_norm"]; -"651 transpose_42" [id=651, type=transpose]; -"652 transpose_42_0_0_nncf_smooth_quant_0" [id=652, type="call_module"]; -"653 quantize_per_tensor_239" [id=653, type="quantize_per_tensor"]; -"654 dequantize_per_tensor_240" [id=654, type="dequantize_per_tensor"]; -"655 _frozen_param31" [id=655, type="get_attr"]; -"656 dequantize_per_tensor_241" [id=656, type="dequantize_per_tensor"]; -"657 linear_28" [id=657, type=linear]; -"658 quantize_per_tensor_242" [id=658, type="quantize_per_tensor"]; -"659 dequantize_per_tensor_243" [id=659, type="dequantize_per_tensor"]; -"660 unflatten_7" [id=660, type=unflatten]; -"661 unsqueeze_7" [id=661, type=unsqueeze]; -"662 transpose_43" [id=662, type=transpose]; -"663 squeeze_7" [id=663, type=squeeze]; -"664 contiguous_7" [id=664, type=contiguous]; -"665 select_21" [id=665, type=select]; -"666 select_22" [id=666, type=select]; -"667 select_23" [id=667, type=select]; -"668 view_56" [id=668, type=view]; -"669 transpose_44" [id=669, type=transpose]; -"670 view_57" [id=670, type=view]; -"671 transpose_45" [id=671, type=transpose]; -"672 view_58" [id=672, type=view]; -"673 transpose_46" [id=673, type=transpose]; -"674 view_59" [id=674, type=view]; -"675 view_60" [id=675, type=view]; -"676 view_61" [id=676, type=view]; -"677 scaled_dot_product_attention_7" [id=677, type="scaled_dot_product_attention"]; -"678 permute_8" [id=678, type=permute]; -"679 view_62" [id=679, type=view]; -"680 view_62_0_0_nncf_smooth_quant_0" [id=680, type="call_module"]; -"681 quantize_per_tensor_244" [id=681, type="quantize_per_tensor"]; -"682 dequantize_per_tensor_245" [id=682, type="dequantize_per_tensor"]; -"683 _frozen_param32" [id=683, type="get_attr"]; -"684 dequantize_per_tensor_246" [id=684, type="dequantize_per_tensor"]; -"685 linear_29" [id=685, type=linear]; -"686 quantize_per_tensor_247" [id=686, type="quantize_per_tensor"]; -"687 dequantize_per_tensor_248" [id=687, 
type="dequantize_per_tensor"]; -"688 view_63" [id=688, type=view]; -"689 quantize_per_tensor_249" [id=689, type="quantize_per_tensor"]; -"690 dequantize_per_tensor_250" [id=690, type="dequantize_per_tensor"]; -"691 transpose_47" [id=691, type=transpose]; -"692 dropout_22" [id=692, type=dropout]; -"693 quantize_per_tensor_251" [id=693, type="quantize_per_tensor"]; -"694 dequantize_per_tensor_252" [id=694, type="dequantize_per_tensor"]; -"695 add_15" [id=695, type=add]; -"696 quantize_per_tensor_253" [id=696, type="quantize_per_tensor"]; -"697 dequantize_per_tensor_254" [id=697, type="dequantize_per_tensor"]; -"698 dequantize_per_tensor_255" [id=698, type="dequantize_per_tensor"]; -"699 layer_norm_15" [id=699, type="layer_norm"]; -"700 layer_norm_15_0_0_nncf_smooth_quant_0" [id=700, type="call_module"]; -"701 quantize_per_tensor_256" [id=701, type="quantize_per_tensor"]; -"702 dequantize_per_tensor_257" [id=702, type="dequantize_per_tensor"]; -"703 _frozen_param33" [id=703, type="get_attr"]; -"704 dequantize_per_tensor_258" [id=704, type="dequantize_per_tensor"]; -"705 linear_30" [id=705, type=linear]; -"706 quantize_per_tensor_259" [id=706, type="quantize_per_tensor"]; -"707 dequantize_per_tensor_260" [id=707, type="dequantize_per_tensor"]; -"708 gelu_7" [id=708, type=gelu]; -"709 dropout_23" [id=709, type=dropout]; -"710 dropout_23_0_0_nncf_smooth_quant_0" [id=710, type="call_module"]; -"711 quantize_per_tensor_261" [id=711, type="quantize_per_tensor"]; -"712 dequantize_per_tensor_262" [id=712, type="dequantize_per_tensor"]; -"713 _frozen_param34" [id=713, type="get_attr"]; -"714 dequantize_per_tensor_263" [id=714, type="dequantize_per_tensor"]; -"715 linear_31" [id=715, type=linear]; -"716 quantize_per_tensor_264" [id=716, type="quantize_per_tensor"]; -"717 dequantize_per_tensor_265" [id=717, type="dequantize_per_tensor"]; -"718 dropout_24" [id=718, type=dropout]; -"719 quantize_per_tensor_266" [id=719, type="quantize_per_tensor"]; -"720 dequantize_per_tensor_267" 
[id=720, type="dequantize_per_tensor"]; -"721 add_16" [id=721, type=add]; -"722 quantize_per_tensor_268" [id=722, type="quantize_per_tensor"]; -"723 dequantize_per_tensor_269" [id=723, type="dequantize_per_tensor"]; -"724 dequantize_per_tensor_270" [id=724, type="dequantize_per_tensor"]; -"725 layer_norm_16" [id=725, type="layer_norm"]; -"726 transpose_48" [id=726, type=transpose]; -"727 transpose_48_0_0_nncf_smooth_quant_0" [id=727, type="call_module"]; -"728 quantize_per_tensor_271" [id=728, type="quantize_per_tensor"]; -"729 dequantize_per_tensor_272" [id=729, type="dequantize_per_tensor"]; -"730 _frozen_param35" [id=730, type="get_attr"]; -"731 dequantize_per_tensor_273" [id=731, type="dequantize_per_tensor"]; -"732 linear_32" [id=732, type=linear]; -"733 quantize_per_tensor_274" [id=733, type="quantize_per_tensor"]; -"734 dequantize_per_tensor_275" [id=734, type="dequantize_per_tensor"]; -"735 unflatten_8" [id=735, type=unflatten]; -"736 unsqueeze_8" [id=736, type=unsqueeze]; -"737 transpose_49" [id=737, type=transpose]; -"738 squeeze_8" [id=738, type=squeeze]; -"739 contiguous_8" [id=739, type=contiguous]; -"740 select_24" [id=740, type=select]; -"741 select_25" [id=741, type=select]; -"742 select_26" [id=742, type=select]; -"743 view_64" [id=743, type=view]; -"744 transpose_50" [id=744, type=transpose]; -"745 view_65" [id=745, type=view]; -"746 transpose_51" [id=746, type=transpose]; -"747 view_66" [id=747, type=view]; -"748 transpose_52" [id=748, type=transpose]; -"749 view_67" [id=749, type=view]; -"750 view_68" [id=750, type=view]; -"751 view_69" [id=751, type=view]; -"752 scaled_dot_product_attention_8" [id=752, type="scaled_dot_product_attention"]; -"753 permute_9" [id=753, type=permute]; -"754 view_70" [id=754, type=view]; -"755 view_70_0_0_nncf_smooth_quant_0" [id=755, type="call_module"]; -"756 quantize_per_tensor_276" [id=756, type="quantize_per_tensor"]; -"757 dequantize_per_tensor_277" [id=757, type="dequantize_per_tensor"]; -"758 _frozen_param36" 
[id=758, type="get_attr"]; -"759 dequantize_per_tensor_278" [id=759, type="dequantize_per_tensor"]; -"760 linear_33" [id=760, type=linear]; -"761 quantize_per_tensor_279" [id=761, type="quantize_per_tensor"]; -"762 dequantize_per_tensor_280" [id=762, type="dequantize_per_tensor"]; -"763 view_71" [id=763, type=view]; -"764 quantize_per_tensor_281" [id=764, type="quantize_per_tensor"]; -"765 dequantize_per_tensor_282" [id=765, type="dequantize_per_tensor"]; -"766 transpose_53" [id=766, type=transpose]; -"767 dropout_25" [id=767, type=dropout]; -"768 quantize_per_tensor_283" [id=768, type="quantize_per_tensor"]; -"769 dequantize_per_tensor_284" [id=769, type="dequantize_per_tensor"]; -"770 add_17" [id=770, type=add]; -"771 quantize_per_tensor_285" [id=771, type="quantize_per_tensor"]; -"772 dequantize_per_tensor_286" [id=772, type="dequantize_per_tensor"]; -"773 dequantize_per_tensor_287" [id=773, type="dequantize_per_tensor"]; -"774 layer_norm_17" [id=774, type="layer_norm"]; -"775 layer_norm_17_0_0_nncf_smooth_quant_0" [id=775, type="call_module"]; -"776 quantize_per_tensor_288" [id=776, type="quantize_per_tensor"]; -"777 dequantize_per_tensor_289" [id=777, type="dequantize_per_tensor"]; -"778 _frozen_param37" [id=778, type="get_attr"]; -"779 dequantize_per_tensor_290" [id=779, type="dequantize_per_tensor"]; -"780 linear_34" [id=780, type=linear]; -"781 quantize_per_tensor_291" [id=781, type="quantize_per_tensor"]; -"782 dequantize_per_tensor_292" [id=782, type="dequantize_per_tensor"]; -"783 gelu_8" [id=783, type=gelu]; -"784 dropout_26" [id=784, type=dropout]; -"785 dropout_26_0_0_nncf_smooth_quant_0" [id=785, type="call_module"]; -"786 quantize_per_tensor_293" [id=786, type="quantize_per_tensor"]; -"787 dequantize_per_tensor_294" [id=787, type="dequantize_per_tensor"]; -"788 _frozen_param38" [id=788, type="get_attr"]; -"789 dequantize_per_tensor_295" [id=789, type="dequantize_per_tensor"]; -"790 linear_35" [id=790, type=linear]; -"791 quantize_per_tensor_296" 
[id=791, type="quantize_per_tensor"]; -"792 dequantize_per_tensor_297" [id=792, type="dequantize_per_tensor"]; -"793 dropout_27" [id=793, type=dropout]; -"794 quantize_per_tensor_298" [id=794, type="quantize_per_tensor"]; -"795 dequantize_per_tensor_299" [id=795, type="dequantize_per_tensor"]; -"796 add_18" [id=796, type=add]; -"797 quantize_per_tensor_300" [id=797, type="quantize_per_tensor"]; -"798 dequantize_per_tensor_301" [id=798, type="dequantize_per_tensor"]; -"799 dequantize_per_tensor_302" [id=799, type="dequantize_per_tensor"]; -"800 layer_norm_18" [id=800, type="layer_norm"]; -"801 transpose_54" [id=801, type=transpose]; -"802 transpose_54_0_0_nncf_smooth_quant_0" [id=802, type="call_module"]; -"803 quantize_per_tensor_303" [id=803, type="quantize_per_tensor"]; -"804 dequantize_per_tensor_304" [id=804, type="dequantize_per_tensor"]; -"805 _frozen_param39" [id=805, type="get_attr"]; -"806 dequantize_per_tensor_305" [id=806, type="dequantize_per_tensor"]; -"807 linear_36" [id=807, type=linear]; -"808 quantize_per_tensor_306" [id=808, type="quantize_per_tensor"]; -"809 dequantize_per_tensor_307" [id=809, type="dequantize_per_tensor"]; -"810 unflatten_9" [id=810, type=unflatten]; -"811 unsqueeze_9" [id=811, type=unsqueeze]; -"812 transpose_55" [id=812, type=transpose]; -"813 squeeze_9" [id=813, type=squeeze]; -"814 contiguous_9" [id=814, type=contiguous]; -"815 select_27" [id=815, type=select]; -"816 select_28" [id=816, type=select]; -"817 select_29" [id=817, type=select]; -"818 view_72" [id=818, type=view]; -"819 transpose_56" [id=819, type=transpose]; -"820 view_73" [id=820, type=view]; -"821 transpose_57" [id=821, type=transpose]; -"822 view_74" [id=822, type=view]; -"823 transpose_58" [id=823, type=transpose]; -"824 view_75" [id=824, type=view]; -"825 view_76" [id=825, type=view]; -"826 view_77" [id=826, type=view]; -"827 scaled_dot_product_attention_9" [id=827, type="scaled_dot_product_attention"]; -"828 permute_10" [id=828, type=permute]; -"829 
view_78" [id=829, type=view]; -"830 view_78_0_0_nncf_smooth_quant_0" [id=830, type="call_module"]; -"831 quantize_per_tensor_308" [id=831, type="quantize_per_tensor"]; -"832 dequantize_per_tensor_309" [id=832, type="dequantize_per_tensor"]; -"833 _frozen_param40" [id=833, type="get_attr"]; -"834 dequantize_per_tensor_310" [id=834, type="dequantize_per_tensor"]; -"835 linear_37" [id=835, type=linear]; -"836 quantize_per_tensor_311" [id=836, type="quantize_per_tensor"]; -"837 dequantize_per_tensor_312" [id=837, type="dequantize_per_tensor"]; -"838 view_79" [id=838, type=view]; -"839 quantize_per_tensor_313" [id=839, type="quantize_per_tensor"]; -"840 dequantize_per_tensor_314" [id=840, type="dequantize_per_tensor"]; -"841 transpose_59" [id=841, type=transpose]; -"842 dropout_28" [id=842, type=dropout]; -"843 quantize_per_tensor_315" [id=843, type="quantize_per_tensor"]; -"844 dequantize_per_tensor_316" [id=844, type="dequantize_per_tensor"]; -"845 add_19" [id=845, type=add]; -"846 quantize_per_tensor_317" [id=846, type="quantize_per_tensor"]; -"847 dequantize_per_tensor_318" [id=847, type="dequantize_per_tensor"]; -"848 dequantize_per_tensor_319" [id=848, type="dequantize_per_tensor"]; -"849 layer_norm_19" [id=849, type="layer_norm"]; -"850 layer_norm_19_0_0_nncf_smooth_quant_0" [id=850, type="call_module"]; -"851 quantize_per_tensor_320" [id=851, type="quantize_per_tensor"]; -"852 dequantize_per_tensor_321" [id=852, type="dequantize_per_tensor"]; -"853 _frozen_param41" [id=853, type="get_attr"]; -"854 dequantize_per_tensor_322" [id=854, type="dequantize_per_tensor"]; -"855 linear_38" [id=855, type=linear]; -"856 quantize_per_tensor_323" [id=856, type="quantize_per_tensor"]; -"857 dequantize_per_tensor_324" [id=857, type="dequantize_per_tensor"]; -"858 gelu_9" [id=858, type=gelu]; -"859 dropout_29" [id=859, type=dropout]; -"860 dropout_29_0_0_nncf_smooth_quant_0" [id=860, type="call_module"]; -"861 quantize_per_tensor_325" [id=861, type="quantize_per_tensor"]; -"862 
dequantize_per_tensor_326" [id=862, type="dequantize_per_tensor"]; -"863 _frozen_param42" [id=863, type="get_attr"]; -"864 dequantize_per_tensor_327" [id=864, type="dequantize_per_tensor"]; -"865 linear_39" [id=865, type=linear]; -"866 quantize_per_tensor_328" [id=866, type="quantize_per_tensor"]; -"867 dequantize_per_tensor_329" [id=867, type="dequantize_per_tensor"]; -"868 dropout_30" [id=868, type=dropout]; -"869 quantize_per_tensor_330" [id=869, type="quantize_per_tensor"]; -"870 dequantize_per_tensor_331" [id=870, type="dequantize_per_tensor"]; -"871 add_20" [id=871, type=add]; -"872 quantize_per_tensor_332" [id=872, type="quantize_per_tensor"]; -"873 dequantize_per_tensor_333" [id=873, type="dequantize_per_tensor"]; -"874 dequantize_per_tensor_334" [id=874, type="dequantize_per_tensor"]; -"875 layer_norm_20" [id=875, type="layer_norm"]; -"876 transpose_60" [id=876, type=transpose]; -"877 transpose_60_0_0_nncf_smooth_quant_0" [id=877, type="call_module"]; -"878 quantize_per_tensor_335" [id=878, type="quantize_per_tensor"]; -"879 dequantize_per_tensor_336" [id=879, type="dequantize_per_tensor"]; -"880 _frozen_param43" [id=880, type="get_attr"]; -"881 dequantize_per_tensor_337" [id=881, type="dequantize_per_tensor"]; -"882 linear_40" [id=882, type=linear]; -"883 quantize_per_tensor_338" [id=883, type="quantize_per_tensor"]; -"884 dequantize_per_tensor_339" [id=884, type="dequantize_per_tensor"]; -"885 unflatten_10" [id=885, type=unflatten]; -"886 unsqueeze_10" [id=886, type=unsqueeze]; -"887 transpose_61" [id=887, type=transpose]; -"888 squeeze_10" [id=888, type=squeeze]; -"889 contiguous_10" [id=889, type=contiguous]; -"890 select_30" [id=890, type=select]; -"891 select_31" [id=891, type=select]; -"892 select_32" [id=892, type=select]; -"893 view_80" [id=893, type=view]; -"894 transpose_62" [id=894, type=transpose]; -"895 view_81" [id=895, type=view]; -"896 transpose_63" [id=896, type=transpose]; -"897 view_82" [id=897, type=view]; -"898 transpose_64" [id=898, 
type=transpose]; -"899 view_83" [id=899, type=view]; -"900 view_84" [id=900, type=view]; -"901 view_85" [id=901, type=view]; -"902 scaled_dot_product_attention_10" [id=902, type="scaled_dot_product_attention"]; -"903 permute_11" [id=903, type=permute]; -"904 view_86" [id=904, type=view]; -"905 view_86_0_0_nncf_smooth_quant_0" [id=905, type="call_module"]; -"906 quantize_per_tensor_340" [id=906, type="quantize_per_tensor"]; -"907 dequantize_per_tensor_341" [id=907, type="dequantize_per_tensor"]; -"908 _frozen_param44" [id=908, type="get_attr"]; -"909 dequantize_per_tensor_342" [id=909, type="dequantize_per_tensor"]; -"910 linear_41" [id=910, type=linear]; -"911 quantize_per_tensor_343" [id=911, type="quantize_per_tensor"]; -"912 dequantize_per_tensor_344" [id=912, type="dequantize_per_tensor"]; -"913 view_87" [id=913, type=view]; -"914 quantize_per_tensor_345" [id=914, type="quantize_per_tensor"]; -"915 dequantize_per_tensor_346" [id=915, type="dequantize_per_tensor"]; -"916 transpose_65" [id=916, type=transpose]; -"917 dropout_31" [id=917, type=dropout]; -"918 quantize_per_tensor_347" [id=918, type="quantize_per_tensor"]; -"919 dequantize_per_tensor_348" [id=919, type="dequantize_per_tensor"]; -"920 add_21" [id=920, type=add]; -"921 quantize_per_tensor_349" [id=921, type="quantize_per_tensor"]; -"922 dequantize_per_tensor_350" [id=922, type="dequantize_per_tensor"]; -"923 dequantize_per_tensor_351" [id=923, type="dequantize_per_tensor"]; -"924 layer_norm_21" [id=924, type="layer_norm"]; -"925 layer_norm_21_0_0_nncf_smooth_quant_0" [id=925, type="call_module"]; -"926 quantize_per_tensor_352" [id=926, type="quantize_per_tensor"]; -"927 dequantize_per_tensor_353" [id=927, type="dequantize_per_tensor"]; -"928 _frozen_param45" [id=928, type="get_attr"]; -"929 dequantize_per_tensor_354" [id=929, type="dequantize_per_tensor"]; -"930 linear_42" [id=930, type=linear]; -"931 quantize_per_tensor_355" [id=931, type="quantize_per_tensor"]; -"932 dequantize_per_tensor_356" 
[id=932, type="dequantize_per_tensor"]; -"933 gelu_10" [id=933, type=gelu]; -"934 dropout_32" [id=934, type=dropout]; -"935 dropout_32_0_0_nncf_smooth_quant_0" [id=935, type="call_module"]; -"936 quantize_per_tensor_357" [id=936, type="quantize_per_tensor"]; -"937 dequantize_per_tensor_358" [id=937, type="dequantize_per_tensor"]; -"938 _frozen_param46" [id=938, type="get_attr"]; -"939 dequantize_per_tensor_359" [id=939, type="dequantize_per_tensor"]; -"940 linear_43" [id=940, type=linear]; -"941 quantize_per_tensor_360" [id=941, type="quantize_per_tensor"]; -"942 dequantize_per_tensor_361" [id=942, type="dequantize_per_tensor"]; -"943 dropout_33" [id=943, type=dropout]; -"944 quantize_per_tensor_362" [id=944, type="quantize_per_tensor"]; -"945 dequantize_per_tensor_363" [id=945, type="dequantize_per_tensor"]; -"946 add_22" [id=946, type=add]; -"947 quantize_per_tensor_364" [id=947, type="quantize_per_tensor"]; -"948 dequantize_per_tensor_365" [id=948, type="dequantize_per_tensor"]; -"949 dequantize_per_tensor_366" [id=949, type="dequantize_per_tensor"]; -"950 layer_norm_22" [id=950, type="layer_norm"]; -"951 transpose_66" [id=951, type=transpose]; -"952 transpose_66_0_0_nncf_smooth_quant_0" [id=952, type="call_module"]; -"953 quantize_per_tensor_367" [id=953, type="quantize_per_tensor"]; -"954 dequantize_per_tensor_368" [id=954, type="dequantize_per_tensor"]; -"955 _frozen_param47" [id=955, type="get_attr"]; -"956 dequantize_per_tensor_369" [id=956, type="dequantize_per_tensor"]; -"957 linear_44" [id=957, type=linear]; -"958 quantize_per_tensor_370" [id=958, type="quantize_per_tensor"]; -"959 dequantize_per_tensor_371" [id=959, type="dequantize_per_tensor"]; -"960 unflatten_11" [id=960, type=unflatten]; -"961 unsqueeze_11" [id=961, type=unsqueeze]; -"962 transpose_67" [id=962, type=transpose]; -"963 squeeze_11" [id=963, type=squeeze]; -"964 contiguous_11" [id=964, type=contiguous]; -"965 select_33" [id=965, type=select]; -"966 select_34" [id=966, type=select]; 
-"967 select_35" [id=967, type=select]; -"968 view_88" [id=968, type=view]; -"969 transpose_68" [id=969, type=transpose]; -"970 view_89" [id=970, type=view]; -"971 transpose_69" [id=971, type=transpose]; -"972 view_90" [id=972, type=view]; -"973 transpose_70" [id=973, type=transpose]; -"974 view_91" [id=974, type=view]; -"975 view_92" [id=975, type=view]; -"976 view_93" [id=976, type=view]; -"977 scaled_dot_product_attention_11" [id=977, type="scaled_dot_product_attention"]; -"978 permute_12" [id=978, type=permute]; -"979 view_94" [id=979, type=view]; -"980 view_94_0_0_nncf_smooth_quant_0" [id=980, type="call_module"]; -"981 quantize_per_tensor_372" [id=981, type="quantize_per_tensor"]; -"982 dequantize_per_tensor_373" [id=982, type="dequantize_per_tensor"]; -"983 _frozen_param48" [id=983, type="get_attr"]; -"984 dequantize_per_tensor_374" [id=984, type="dequantize_per_tensor"]; -"985 linear_45" [id=985, type=linear]; -"986 quantize_per_tensor_375" [id=986, type="quantize_per_tensor"]; -"987 dequantize_per_tensor_376" [id=987, type="dequantize_per_tensor"]; -"988 view_95" [id=988, type=view]; -"989 quantize_per_tensor_377" [id=989, type="quantize_per_tensor"]; -"990 dequantize_per_tensor_378" [id=990, type="dequantize_per_tensor"]; -"991 transpose_71" [id=991, type=transpose]; -"992 dropout_34" [id=992, type=dropout]; -"993 quantize_per_tensor_379" [id=993, type="quantize_per_tensor"]; -"994 dequantize_per_tensor_380" [id=994, type="dequantize_per_tensor"]; -"995 add_23" [id=995, type=add]; -"996 quantize_per_tensor_381" [id=996, type="quantize_per_tensor"]; -"997 dequantize_per_tensor_382" [id=997, type="dequantize_per_tensor"]; -"998 dequantize_per_tensor_383" [id=998, type="dequantize_per_tensor"]; -"999 layer_norm_23" [id=999, type="layer_norm"]; -"1000 layer_norm_23_0_0_nncf_smooth_quant_0" [id=1000, type="call_module"]; -"1001 quantize_per_tensor_384" [id=1001, type="quantize_per_tensor"]; -"1002 dequantize_per_tensor_385" [id=1002, 
type="dequantize_per_tensor"]; -"1003 _frozen_param49" [id=1003, type="get_attr"]; -"1004 dequantize_per_tensor_386" [id=1004, type="dequantize_per_tensor"]; -"1005 linear_46" [id=1005, type=linear]; -"1006 quantize_per_tensor_387" [id=1006, type="quantize_per_tensor"]; -"1007 dequantize_per_tensor_388" [id=1007, type="dequantize_per_tensor"]; -"1008 gelu_11" [id=1008, type=gelu]; -"1009 dropout_35" [id=1009, type=dropout]; -"1010 dropout_35_0_0_nncf_smooth_quant_0" [id=1010, type="call_module"]; -"1011 quantize_per_tensor_389" [id=1011, type="quantize_per_tensor"]; -"1012 dequantize_per_tensor_390" [id=1012, type="dequantize_per_tensor"]; -"1013 _frozen_param50" [id=1013, type="get_attr"]; -"1014 dequantize_per_tensor_391" [id=1014, type="dequantize_per_tensor"]; -"1015 linear_47" [id=1015, type=linear]; -"1016 quantize_per_tensor_392" [id=1016, type="quantize_per_tensor"]; -"1017 dequantize_per_tensor_393" [id=1017, type="dequantize_per_tensor"]; -"1018 dropout_36" [id=1018, type=dropout]; -"1019 quantize_per_tensor_394" [id=1019, type="quantize_per_tensor"]; -"1020 dequantize_per_tensor_395" [id=1020, type="dequantize_per_tensor"]; -"1021 add_24" [id=1021, type=add]; -"1022 quantize_per_tensor_396" [id=1022, type="quantize_per_tensor"]; -"1023 dequantize_per_tensor_397" [id=1023, type="dequantize_per_tensor"]; -"1024 layer_norm_24" [id=1024, type="layer_norm"]; -"1025 slice_1" [id=1025, type=slice]; -"1026 select_36" [id=1026, type=select]; -"1027 select_36_0_0_nncf_smooth_quant_0" [id=1027, type="call_module"]; -"1028 quantize_per_tensor_398" [id=1028, type="quantize_per_tensor"]; -"1029 dequantize_per_tensor_399" [id=1029, type="dequantize_per_tensor"]; -"1030 _frozen_param51" [id=1030, type="get_attr"]; -"1031 dequantize_per_tensor_400" [id=1031, type="dequantize_per_tensor"]; -"1032 linear_48" [id=1032, type=linear]; -"1033 quantize_per_tensor_401" [id=1033, type="quantize_per_tensor"]; -"1034 dequantize_per_tensor_402" [id=1034, 
type="dequantize_per_tensor"]; -"1035 output" [id=1035, type=output]; -"0 _frozen_param0" -> "1 dequantize_per_tensor_0" [style=solid, label="(1, 197, 768)"]; -"1 dequantize_per_tensor_0" -> "119 add" [style=solid, label="(1, 197, 768)"]; -"2 conv_proj_bias" -> "107 conv2d" [style=solid, label="(768,)"]; -"3 encoder_layers_encoder_layer_0_ln_1_weight" -> "123 layer_norm" [style=solid, label="(768,)"]; -"4 encoder_layers_encoder_layer_0_ln_1_bias" -> "123 layer_norm" [style=solid, label="(768,)"]; -"5 encoder_layers_encoder_layer_0_self_attention_in_proj_bias" -> "130 linear" [style=solid, label="(2304,)"]; -"6 encoder_layers_encoder_layer_0_self_attention_out_proj_bias" -> "158 linear_1" [style=solid, label="(768,)"]; -"7 encoder_layers_encoder_layer_0_ln_2_weight" -> "174 layer_norm_1" [style=solid, label="(768,)"]; -"8 encoder_layers_encoder_layer_0_ln_2_bias" -> "174 layer_norm_1" [style=solid, label="(768,)"]; -"9 encoder_layers_encoder_layer_0_mlp_0_bias" -> "180 linear_2" [style=solid, label="(3072,)"]; -"10 encoder_layers_encoder_layer_0_mlp_3_bias" -> "190 linear_3" [style=solid, label="(768,)"]; -"11 encoder_layers_encoder_layer_1_ln_1_weight" -> "200 layer_norm_2" [style=solid, label="(768,)"]; -"12 encoder_layers_encoder_layer_1_ln_1_bias" -> "200 layer_norm_2" [style=solid, label="(768,)"]; -"13 encoder_layers_encoder_layer_1_self_attention_in_proj_bias" -> "207 linear_4" [style=solid, label="(2304,)"]; -"14 encoder_layers_encoder_layer_1_self_attention_out_proj_bias" -> "235 linear_5" [style=solid, label="(768,)"]; -"15 encoder_layers_encoder_layer_1_ln_2_weight" -> "249 layer_norm_3" [style=solid, label="(768,)"]; -"16 encoder_layers_encoder_layer_1_ln_2_bias" -> "249 layer_norm_3" [style=solid, label="(768,)"]; -"17 encoder_layers_encoder_layer_1_mlp_0_bias" -> "255 linear_6" [style=solid, label="(3072,)"]; -"18 encoder_layers_encoder_layer_1_mlp_3_bias" -> "265 linear_7" [style=solid, label="(768,)"]; -"19 encoder_layers_encoder_layer_2_ln_1_weight" 
-> "275 layer_norm_4" [style=solid, label="(768,)"]; -"20 encoder_layers_encoder_layer_2_ln_1_bias" -> "275 layer_norm_4" [style=solid, label="(768,)"]; -"21 encoder_layers_encoder_layer_2_self_attention_in_proj_bias" -> "282 linear_8" [style=solid, label="(2304,)"]; -"22 encoder_layers_encoder_layer_2_self_attention_out_proj_bias" -> "310 linear_9" [style=solid, label="(768,)"]; -"23 encoder_layers_encoder_layer_2_ln_2_weight" -> "324 layer_norm_5" [style=solid, label="(768,)"]; -"24 encoder_layers_encoder_layer_2_ln_2_bias" -> "324 layer_norm_5" [style=solid, label="(768,)"]; -"25 encoder_layers_encoder_layer_2_mlp_0_bias" -> "330 linear_10" [style=solid, label="(3072,)"]; -"26 encoder_layers_encoder_layer_2_mlp_3_bias" -> "340 linear_11" [style=solid, label="(768,)"]; -"27 encoder_layers_encoder_layer_3_ln_1_weight" -> "350 layer_norm_6" [style=solid, label="(768,)"]; -"28 encoder_layers_encoder_layer_3_ln_1_bias" -> "350 layer_norm_6" [style=solid, label="(768,)"]; -"29 encoder_layers_encoder_layer_3_self_attention_in_proj_bias" -> "357 linear_12" [style=solid, label="(2304,)"]; -"30 encoder_layers_encoder_layer_3_self_attention_out_proj_bias" -> "385 linear_13" [style=solid, label="(768,)"]; -"31 encoder_layers_encoder_layer_3_ln_2_weight" -> "399 layer_norm_7" [style=solid, label="(768,)"]; -"32 encoder_layers_encoder_layer_3_ln_2_bias" -> "399 layer_norm_7" [style=solid, label="(768,)"]; -"33 encoder_layers_encoder_layer_3_mlp_0_bias" -> "405 linear_14" [style=solid, label="(3072,)"]; -"34 encoder_layers_encoder_layer_3_mlp_3_bias" -> "415 linear_15" [style=solid, label="(768,)"]; -"35 encoder_layers_encoder_layer_4_ln_1_weight" -> "425 layer_norm_8" [style=solid, label="(768,)"]; -"36 encoder_layers_encoder_layer_4_ln_1_bias" -> "425 layer_norm_8" [style=solid, label="(768,)"]; -"37 encoder_layers_encoder_layer_4_self_attention_in_proj_bias" -> "432 linear_16" [style=solid, label="(2304,)"]; -"38 encoder_layers_encoder_layer_4_self_attention_out_proj_bias" 
-> "460 linear_17" [style=solid, label="(768,)"]; -"39 encoder_layers_encoder_layer_4_ln_2_weight" -> "474 layer_norm_9" [style=solid, label="(768,)"]; -"40 encoder_layers_encoder_layer_4_ln_2_bias" -> "474 layer_norm_9" [style=solid, label="(768,)"]; -"41 encoder_layers_encoder_layer_4_mlp_0_bias" -> "480 linear_18" [style=solid, label="(3072,)"]; -"42 encoder_layers_encoder_layer_4_mlp_3_bias" -> "490 linear_19" [style=solid, label="(768,)"]; -"43 encoder_layers_encoder_layer_5_ln_1_weight" -> "500 layer_norm_10" [style=solid, label="(768,)"]; -"44 encoder_layers_encoder_layer_5_ln_1_bias" -> "500 layer_norm_10" [style=solid, label="(768,)"]; -"45 encoder_layers_encoder_layer_5_self_attention_in_proj_bias" -> "507 linear_20" [style=solid, label="(2304,)"]; -"46 encoder_layers_encoder_layer_5_self_attention_out_proj_bias" -> "535 linear_21" [style=solid, label="(768,)"]; -"47 encoder_layers_encoder_layer_5_ln_2_weight" -> "549 layer_norm_11" [style=solid, label="(768,)"]; -"48 encoder_layers_encoder_layer_5_ln_2_bias" -> "549 layer_norm_11" [style=solid, label="(768,)"]; -"49 encoder_layers_encoder_layer_5_mlp_0_bias" -> "555 linear_22" [style=solid, label="(3072,)"]; -"50 encoder_layers_encoder_layer_5_mlp_3_bias" -> "565 linear_23" [style=solid, label="(768,)"]; -"51 encoder_layers_encoder_layer_6_ln_1_weight" -> "575 layer_norm_12" [style=solid, label="(768,)"]; -"52 encoder_layers_encoder_layer_6_ln_1_bias" -> "575 layer_norm_12" [style=solid, label="(768,)"]; -"53 encoder_layers_encoder_layer_6_self_attention_in_proj_bias" -> "582 linear_24" [style=solid, label="(2304,)"]; -"54 encoder_layers_encoder_layer_6_self_attention_out_proj_bias" -> "610 linear_25" [style=solid, label="(768,)"]; -"55 encoder_layers_encoder_layer_6_ln_2_weight" -> "624 layer_norm_13" [style=solid, label="(768,)"]; -"56 encoder_layers_encoder_layer_6_ln_2_bias" -> "624 layer_norm_13" [style=solid, label="(768,)"]; -"57 encoder_layers_encoder_layer_6_mlp_0_bias" -> "630 linear_26" 
[style=solid, label="(3072,)"]; -"58 encoder_layers_encoder_layer_6_mlp_3_bias" -> "640 linear_27" [style=solid, label="(768,)"]; -"59 encoder_layers_encoder_layer_7_ln_1_weight" -> "650 layer_norm_14" [style=solid, label="(768,)"]; -"60 encoder_layers_encoder_layer_7_ln_1_bias" -> "650 layer_norm_14" [style=solid, label="(768,)"]; -"61 encoder_layers_encoder_layer_7_self_attention_in_proj_bias" -> "657 linear_28" [style=solid, label="(2304,)"]; -"62 encoder_layers_encoder_layer_7_self_attention_out_proj_bias" -> "685 linear_29" [style=solid, label="(768,)"]; -"63 encoder_layers_encoder_layer_7_ln_2_weight" -> "699 layer_norm_15" [style=solid, label="(768,)"]; -"64 encoder_layers_encoder_layer_7_ln_2_bias" -> "699 layer_norm_15" [style=solid, label="(768,)"]; -"65 encoder_layers_encoder_layer_7_mlp_0_bias" -> "705 linear_30" [style=solid, label="(3072,)"]; -"66 encoder_layers_encoder_layer_7_mlp_3_bias" -> "715 linear_31" [style=solid, label="(768,)"]; -"67 encoder_layers_encoder_layer_8_ln_1_weight" -> "725 layer_norm_16" [style=solid, label="(768,)"]; -"68 encoder_layers_encoder_layer_8_ln_1_bias" -> "725 layer_norm_16" [style=solid, label="(768,)"]; -"69 encoder_layers_encoder_layer_8_self_attention_in_proj_bias" -> "732 linear_32" [style=solid, label="(2304,)"]; -"70 encoder_layers_encoder_layer_8_self_attention_out_proj_bias" -> "760 linear_33" [style=solid, label="(768,)"]; -"71 encoder_layers_encoder_layer_8_ln_2_weight" -> "774 layer_norm_17" [style=solid, label="(768,)"]; -"72 encoder_layers_encoder_layer_8_ln_2_bias" -> "774 layer_norm_17" [style=solid, label="(768,)"]; -"73 encoder_layers_encoder_layer_8_mlp_0_bias" -> "780 linear_34" [style=solid, label="(3072,)"]; -"74 encoder_layers_encoder_layer_8_mlp_3_bias" -> "790 linear_35" [style=solid, label="(768,)"]; -"75 encoder_layers_encoder_layer_9_ln_1_weight" -> "800 layer_norm_18" [style=solid, label="(768,)"]; -"76 encoder_layers_encoder_layer_9_ln_1_bias" -> "800 layer_norm_18" [style=solid, 
label="(768,)"]; -"77 encoder_layers_encoder_layer_9_self_attention_in_proj_bias" -> "807 linear_36" [style=solid, label="(2304,)"]; -"78 encoder_layers_encoder_layer_9_self_attention_out_proj_bias" -> "835 linear_37" [style=solid, label="(768,)"]; -"79 encoder_layers_encoder_layer_9_ln_2_weight" -> "849 layer_norm_19" [style=solid, label="(768,)"]; -"80 encoder_layers_encoder_layer_9_ln_2_bias" -> "849 layer_norm_19" [style=solid, label="(768,)"]; -"81 encoder_layers_encoder_layer_9_mlp_0_bias" -> "855 linear_38" [style=solid, label="(3072,)"]; -"82 encoder_layers_encoder_layer_9_mlp_3_bias" -> "865 linear_39" [style=solid, label="(768,)"]; -"83 encoder_layers_encoder_layer_10_ln_1_weight" -> "875 layer_norm_20" [style=solid, label="(768,)"]; -"84 encoder_layers_encoder_layer_10_ln_1_bias" -> "875 layer_norm_20" [style=solid, label="(768,)"]; -"85 encoder_layers_encoder_layer_10_self_attention_in_proj_bias" -> "882 linear_40" [style=solid, label="(2304,)"]; -"86 encoder_layers_encoder_layer_10_self_attention_out_proj_bias" -> "910 linear_41" [style=solid, label="(768,)"]; -"87 encoder_layers_encoder_layer_10_ln_2_weight" -> "924 layer_norm_21" [style=solid, label="(768,)"]; -"88 encoder_layers_encoder_layer_10_ln_2_bias" -> "924 layer_norm_21" [style=solid, label="(768,)"]; -"89 encoder_layers_encoder_layer_10_mlp_0_bias" -> "930 linear_42" [style=solid, label="(3072,)"]; -"90 encoder_layers_encoder_layer_10_mlp_3_bias" -> "940 linear_43" [style=solid, label="(768,)"]; -"91 encoder_layers_encoder_layer_11_ln_1_weight" -> "950 layer_norm_22" [style=solid, label="(768,)"]; -"92 encoder_layers_encoder_layer_11_ln_1_bias" -> "950 layer_norm_22" [style=solid, label="(768,)"]; -"93 encoder_layers_encoder_layer_11_self_attention_in_proj_bias" -> "957 linear_44" [style=solid, label="(2304,)"]; -"94 encoder_layers_encoder_layer_11_self_attention_out_proj_bias" -> "985 linear_45" [style=solid, label="(768,)"]; -"95 encoder_layers_encoder_layer_11_ln_2_weight" -> "999 
layer_norm_23" [style=solid, label="(768,)"]; -"96 encoder_layers_encoder_layer_11_ln_2_bias" -> "999 layer_norm_23" [style=solid, label="(768,)"]; -"97 encoder_layers_encoder_layer_11_mlp_0_bias" -> "1005 linear_46" [style=solid, label="(3072,)"]; -"98 encoder_layers_encoder_layer_11_mlp_3_bias" -> "1015 linear_47" [style=solid, label="(768,)"]; -"99 encoder_ln_weight" -> "1024 layer_norm_24" [style=solid, label="(768,)"]; -"100 encoder_ln_bias" -> "1024 layer_norm_24" [style=solid, label="(768,)"]; -"101 heads_head_bias" -> "1032 linear_48" [style=solid, label="(1000,)"]; -"102 x" -> "103 quantize_per_tensor_1" [style=solid, label="(1, 3, 224, 224)"]; -"103 quantize_per_tensor_1" -> "104 dequantize_per_tensor_2" [style=solid, label="(1, 3, 224, 224)"]; -"104 dequantize_per_tensor_2" -> "107 conv2d" [style=solid, label="(1, 3, 224, 224)"]; -"105 _frozen_param1" -> "106 dequantize_per_tensor_3" [style=solid, label="(768, 3, 16, 16)"]; -"106 dequantize_per_tensor_3" -> "107 conv2d" [style=solid, label="(768, 3, 16, 16)"]; -"107 conv2d" -> "108 quantize_per_tensor_4" [style=solid, label="(1, 768, 14, 14)"]; -"108 quantize_per_tensor_4" -> "109 dequantize_per_tensor_5" [style=solid, label="(1, 768, 14, 14)"]; -"109 dequantize_per_tensor_5" -> "110 reshape" [style=solid, label="(1, 768, 14, 14)"]; -"110 reshape" -> "111 permute" [style=solid, label="(1, 768, 196)"]; -"111 permute" -> "112 quantize_per_tensor_6" [style=solid, label="(1, 196, 768)"]; -"112 quantize_per_tensor_6" -> "113 dequantize_per_tensor_7" [style=solid, label="(1, 196, 768)"]; -"113 dequantize_per_tensor_7" -> "116 cat" [style=solid, label="(1, 196, 768)"]; -"114 _frozen_param2" -> "115 dequantize_per_tensor_8" [style=solid, label="(1, 1, 768)"]; -"115 dequantize_per_tensor_8" -> "116 cat" [style=solid, label="(1, 1, 768)"]; -"116 cat" -> "117 quantize_per_tensor_9" [style=solid, label="(1, 197, 768)"]; -"117 quantize_per_tensor_9" -> "118 dequantize_per_tensor_10" [style=solid, label="(1, 197, 
768)"]; -"118 dequantize_per_tensor_10" -> "119 add" [style=solid, label="(1, 197, 768)"]; -"119 add" -> "120 quantize_per_tensor_11" [style=solid, label="(1, 197, 768)"]; -"120 quantize_per_tensor_11" -> "121 dequantize_per_tensor_12" [style=solid, label="(1, 197, 768)"]; -"121 dequantize_per_tensor_12" -> "122 dropout" [style=solid, label="(1, 197, 768)"]; -"122 dropout" -> "123 layer_norm" [style=solid, label="(1, 197, 768)"]; -"122 dropout" -> "168 quantize_per_tensor_27" [style=solid, label="(1, 197, 768)"]; -"123 layer_norm" -> "124 transpose" [style=solid, label="(1, 197, 768)"]; -"124 transpose" -> "125 transpose_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 1, 768)"]; -"125 transpose_0_0_nncf_smooth_quant_0" -> "126 quantize_per_tensor_13" [style=solid, label="(197, 1, 768)"]; -"126 quantize_per_tensor_13" -> "127 dequantize_per_tensor_14" [style=solid, label="(197, 1, 768)"]; -"127 dequantize_per_tensor_14" -> "130 linear" [style=solid, label="(197, 1, 768)"]; -"128 _frozen_param3" -> "129 dequantize_per_tensor_15" [style=solid, label="(2304, 768)"]; -"129 dequantize_per_tensor_15" -> "130 linear" [style=solid, label="(2304, 768)"]; -"130 linear" -> "131 quantize_per_tensor_16" [style=solid, label="(197, 1, 2304)"]; -"131 quantize_per_tensor_16" -> "132 dequantize_per_tensor_17" [style=solid, label="(197, 1, 2304)"]; -"132 dequantize_per_tensor_17" -> "133 unflatten" [style=solid, label="(197, 1, 2304)"]; -"133 unflatten" -> "134 unsqueeze" [style=solid, label="(197, 1, 3, 768)"]; -"134 unsqueeze" -> "135 transpose_1" [style=solid, label="(1, 197, 1, 3, 768)"]; -"135 transpose_1" -> "136 squeeze" [style=solid, label="(3, 197, 1, 1, 768)"]; -"136 squeeze" -> "137 contiguous" [style=solid, label="(3, 197, 1, 768)"]; -"137 contiguous" -> "138 select" [style=solid, label="(3, 197, 1, 768)"]; -"137 contiguous" -> "139 select_1" [style=solid, label="(3, 197, 1, 768)"]; -"137 contiguous" -> "140 select_2" [style=solid, label="(3, 197, 1, 768)"]; -"138 
select" -> "141 view" [style=solid, label="(197, 1, 768)"]; -"139 select_1" -> "143 view_1" [style=solid, label="(197, 1, 768)"]; -"140 select_2" -> "145 view_2" [style=solid, label="(197, 1, 768)"]; -"141 view" -> "142 transpose_2" [style=solid, label="(197, 12, 64)"]; -"142 transpose_2" -> "147 view_3" [style=solid, label="(12, 197, 64)"]; -"143 view_1" -> "144 transpose_3" [style=solid, label="(197, 12, 64)"]; -"144 transpose_3" -> "148 view_4" [style=solid, label="(12, 197, 64)"]; -"145 view_2" -> "146 transpose_4" [style=solid, label="(197, 12, 64)"]; -"146 transpose_4" -> "149 view_5" [style=solid, label="(12, 197, 64)"]; -"147 view_3" -> "150 scaled_dot_product_attention" [style=solid, label="(1, 12, 197, 64)"]; -"148 view_4" -> "150 scaled_dot_product_attention" [style=solid, label="(1, 12, 197, 64)"]; -"149 view_5" -> "150 scaled_dot_product_attention" [style=solid, label="(1, 12, 197, 64)"]; -"150 scaled_dot_product_attention" -> "151 permute_1" [style=solid, label="(1, 12, 197, 64)"]; -"151 permute_1" -> "152 view_6" [style=solid, label="(197, 1, 12, 64)"]; -"152 view_6" -> "153 view_6_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 768)"]; -"153 view_6_0_0_nncf_smooth_quant_0" -> "154 quantize_per_tensor_18" [style=solid, label="(197, 768)"]; -"154 quantize_per_tensor_18" -> "155 dequantize_per_tensor_19" [style=solid, label="(197, 768)"]; -"155 dequantize_per_tensor_19" -> "158 linear_1" [style=solid, label="(197, 768)"]; -"156 _frozen_param4" -> "157 dequantize_per_tensor_20" [style=solid, label="(768, 768)"]; -"157 dequantize_per_tensor_20" -> "158 linear_1" [style=solid, label="(768, 768)"]; -"158 linear_1" -> "159 quantize_per_tensor_21" [style=solid, label="(197, 768)"]; -"159 quantize_per_tensor_21" -> "160 dequantize_per_tensor_22" [style=solid, label="(197, 768)"]; -"160 dequantize_per_tensor_22" -> "161 view_7" [style=solid, label="(197, 768)"]; -"161 view_7" -> "162 quantize_per_tensor_23" [style=solid, label="(197, 1, 768)"]; -"162 
quantize_per_tensor_23" -> "163 dequantize_per_tensor_24" [style=solid, label="(197, 1, 768)"]; -"163 dequantize_per_tensor_24" -> "164 transpose_5" [style=solid, label="(197, 1, 768)"]; -"164 transpose_5" -> "165 dropout_1" [style=solid, label="(1, 197, 768)"]; -"165 dropout_1" -> "166 quantize_per_tensor_25" [style=solid, label="(1, 197, 768)"]; -"166 quantize_per_tensor_25" -> "167 dequantize_per_tensor_26" [style=solid, label="(1, 197, 768)"]; -"167 dequantize_per_tensor_26" -> "170 add_1" [style=solid, label="(1, 197, 768)"]; -"168 quantize_per_tensor_27" -> "169 dequantize_per_tensor_28" [style=solid, label="(1, 197, 768)"]; -"169 dequantize_per_tensor_28" -> "170 add_1" [style=solid, label="(1, 197, 768)"]; -"170 add_1" -> "171 quantize_per_tensor_29" [style=solid, label="(1, 197, 768)"]; -"171 quantize_per_tensor_29" -> "172 dequantize_per_tensor_30" [style=solid, label="(1, 197, 768)"]; -"171 quantize_per_tensor_29" -> "173 dequantize_per_tensor_31" [style=solid, label="(1, 197, 768)"]; -"172 dequantize_per_tensor_30" -> "196 add_2" [style=solid, label="(1, 197, 768)"]; -"173 dequantize_per_tensor_31" -> "174 layer_norm_1" [style=solid, label="(1, 197, 768)"]; -"174 layer_norm_1" -> "175 layer_norm_1_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 768)"]; -"175 layer_norm_1_0_0_nncf_smooth_quant_0" -> "176 quantize_per_tensor_32" [style=solid, label="(1, 197, 768)"]; -"176 quantize_per_tensor_32" -> "177 dequantize_per_tensor_33" [style=solid, label="(1, 197, 768)"]; -"177 dequantize_per_tensor_33" -> "180 linear_2" [style=solid, label="(1, 197, 768)"]; -"178 _frozen_param5" -> "179 dequantize_per_tensor_34" [style=solid, label="(3072, 768)"]; -"179 dequantize_per_tensor_34" -> "180 linear_2" [style=solid, label="(3072, 768)"]; -"180 linear_2" -> "181 quantize_per_tensor_35" [style=solid, label="(1, 197, 3072)"]; -"181 quantize_per_tensor_35" -> "182 dequantize_per_tensor_36" [style=solid, label="(1, 197, 3072)"]; -"182 dequantize_per_tensor_36" -> 
"183 gelu" [style=solid, label="(1, 197, 3072)"]; -"183 gelu" -> "184 dropout_2" [style=solid, label="(1, 197, 3072)"]; -"184 dropout_2" -> "185 dropout_2_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 3072)"]; -"185 dropout_2_0_0_nncf_smooth_quant_0" -> "186 quantize_per_tensor_37" [style=solid, label="(1, 197, 3072)"]; -"186 quantize_per_tensor_37" -> "187 dequantize_per_tensor_38" [style=solid, label="(1, 197, 3072)"]; -"187 dequantize_per_tensor_38" -> "190 linear_3" [style=solid, label="(1, 197, 3072)"]; -"188 _frozen_param6" -> "189 dequantize_per_tensor_39" [style=solid, label="(768, 3072)"]; -"189 dequantize_per_tensor_39" -> "190 linear_3" [style=solid, label="(768, 3072)"]; -"190 linear_3" -> "191 quantize_per_tensor_40" [style=solid, label="(1, 197, 768)"]; -"191 quantize_per_tensor_40" -> "192 dequantize_per_tensor_41" [style=solid, label="(1, 197, 768)"]; -"192 dequantize_per_tensor_41" -> "193 dropout_3" [style=solid, label="(1, 197, 768)"]; -"193 dropout_3" -> "194 quantize_per_tensor_42" [style=solid, label="(1, 197, 768)"]; -"194 quantize_per_tensor_42" -> "195 dequantize_per_tensor_43" [style=solid, label="(1, 197, 768)"]; -"195 dequantize_per_tensor_43" -> "196 add_2" [style=solid, label="(1, 197, 768)"]; -"196 add_2" -> "197 quantize_per_tensor_44" [style=solid, label="(1, 197, 768)"]; -"197 quantize_per_tensor_44" -> "198 dequantize_per_tensor_45" [style=solid, label="(1, 197, 768)"]; -"197 quantize_per_tensor_44" -> "199 dequantize_per_tensor_46" [style=solid, label="(1, 197, 768)"]; -"198 dequantize_per_tensor_45" -> "245 add_3" [style=solid, label="(1, 197, 768)"]; -"199 dequantize_per_tensor_46" -> "200 layer_norm_2" [style=solid, label="(1, 197, 768)"]; -"200 layer_norm_2" -> "201 transpose_6" [style=solid, label="(1, 197, 768)"]; -"201 transpose_6" -> "202 transpose_6_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 1, 768)"]; -"202 transpose_6_0_0_nncf_smooth_quant_0" -> "203 quantize_per_tensor_47" [style=solid, label="(197, 
1, 768)"]; -"203 quantize_per_tensor_47" -> "204 dequantize_per_tensor_48" [style=solid, label="(197, 1, 768)"]; -"204 dequantize_per_tensor_48" -> "207 linear_4" [style=solid, label="(197, 1, 768)"]; -"205 _frozen_param7" -> "206 dequantize_per_tensor_49" [style=solid, label="(2304, 768)"]; -"206 dequantize_per_tensor_49" -> "207 linear_4" [style=solid, label="(2304, 768)"]; -"207 linear_4" -> "208 quantize_per_tensor_50" [style=solid, label="(197, 1, 2304)"]; -"208 quantize_per_tensor_50" -> "209 dequantize_per_tensor_51" [style=solid, label="(197, 1, 2304)"]; -"209 dequantize_per_tensor_51" -> "210 unflatten_1" [style=solid, label="(197, 1, 2304)"]; -"210 unflatten_1" -> "211 unsqueeze_1" [style=solid, label="(197, 1, 3, 768)"]; -"211 unsqueeze_1" -> "212 transpose_7" [style=solid, label="(1, 197, 1, 3, 768)"]; -"212 transpose_7" -> "213 squeeze_1" [style=solid, label="(3, 197, 1, 1, 768)"]; -"213 squeeze_1" -> "214 contiguous_1" [style=solid, label="(3, 197, 1, 768)"]; -"214 contiguous_1" -> "215 select_3" [style=solid, label="(3, 197, 1, 768)"]; -"214 contiguous_1" -> "216 select_4" [style=solid, label="(3, 197, 1, 768)"]; -"214 contiguous_1" -> "217 select_5" [style=solid, label="(3, 197, 1, 768)"]; -"215 select_3" -> "218 view_8" [style=solid, label="(197, 1, 768)"]; -"216 select_4" -> "220 view_9" [style=solid, label="(197, 1, 768)"]; -"217 select_5" -> "222 view_10" [style=solid, label="(197, 1, 768)"]; -"218 view_8" -> "219 transpose_8" [style=solid, label="(197, 12, 64)"]; -"219 transpose_8" -> "224 view_11" [style=solid, label="(12, 197, 64)"]; -"220 view_9" -> "221 transpose_9" [style=solid, label="(197, 12, 64)"]; -"221 transpose_9" -> "225 view_12" [style=solid, label="(12, 197, 64)"]; -"222 view_10" -> "223 transpose_10" [style=solid, label="(197, 12, 64)"]; -"223 transpose_10" -> "226 view_13" [style=solid, label="(12, 197, 64)"]; -"224 view_11" -> "227 scaled_dot_product_attention_1" [style=solid, label="(1, 12, 197, 64)"]; -"225 view_12" -> "227 
scaled_dot_product_attention_1" [style=solid, label="(1, 12, 197, 64)"]; -"226 view_13" -> "227 scaled_dot_product_attention_1" [style=solid, label="(1, 12, 197, 64)"]; -"227 scaled_dot_product_attention_1" -> "228 permute_2" [style=solid, label="(1, 12, 197, 64)"]; -"228 permute_2" -> "229 view_14" [style=solid, label="(197, 1, 12, 64)"]; -"229 view_14" -> "230 view_14_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 768)"]; -"230 view_14_0_0_nncf_smooth_quant_0" -> "231 quantize_per_tensor_52" [style=solid, label="(197, 768)"]; -"231 quantize_per_tensor_52" -> "232 dequantize_per_tensor_53" [style=solid, label="(197, 768)"]; -"232 dequantize_per_tensor_53" -> "235 linear_5" [style=solid, label="(197, 768)"]; -"233 _frozen_param8" -> "234 dequantize_per_tensor_54" [style=solid, label="(768, 768)"]; -"234 dequantize_per_tensor_54" -> "235 linear_5" [style=solid, label="(768, 768)"]; -"235 linear_5" -> "236 quantize_per_tensor_55" [style=solid, label="(197, 768)"]; -"236 quantize_per_tensor_55" -> "237 dequantize_per_tensor_56" [style=solid, label="(197, 768)"]; -"237 dequantize_per_tensor_56" -> "238 view_15" [style=solid, label="(197, 768)"]; -"238 view_15" -> "239 quantize_per_tensor_57" [style=solid, label="(197, 1, 768)"]; -"239 quantize_per_tensor_57" -> "240 dequantize_per_tensor_58" [style=solid, label="(197, 1, 768)"]; -"240 dequantize_per_tensor_58" -> "241 transpose_11" [style=solid, label="(197, 1, 768)"]; -"241 transpose_11" -> "242 dropout_4" [style=solid, label="(1, 197, 768)"]; -"242 dropout_4" -> "243 quantize_per_tensor_59" [style=solid, label="(1, 197, 768)"]; -"243 quantize_per_tensor_59" -> "244 dequantize_per_tensor_60" [style=solid, label="(1, 197, 768)"]; -"244 dequantize_per_tensor_60" -> "245 add_3" [style=solid, label="(1, 197, 768)"]; -"245 add_3" -> "246 quantize_per_tensor_61" [style=solid, label="(1, 197, 768)"]; -"246 quantize_per_tensor_61" -> "247 dequantize_per_tensor_62" [style=solid, label="(1, 197, 768)"]; -"246 
quantize_per_tensor_61" -> "248 dequantize_per_tensor_63" [style=solid, label="(1, 197, 768)"]; -"247 dequantize_per_tensor_62" -> "271 add_4" [style=solid, label="(1, 197, 768)"]; -"248 dequantize_per_tensor_63" -> "249 layer_norm_3" [style=solid, label="(1, 197, 768)"]; -"249 layer_norm_3" -> "250 layer_norm_3_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 768)"]; -"250 layer_norm_3_0_0_nncf_smooth_quant_0" -> "251 quantize_per_tensor_64" [style=solid, label="(1, 197, 768)"]; -"251 quantize_per_tensor_64" -> "252 dequantize_per_tensor_65" [style=solid, label="(1, 197, 768)"]; -"252 dequantize_per_tensor_65" -> "255 linear_6" [style=solid, label="(1, 197, 768)"]; -"253 _frozen_param9" -> "254 dequantize_per_tensor_66" [style=solid, label="(3072, 768)"]; -"254 dequantize_per_tensor_66" -> "255 linear_6" [style=solid, label="(3072, 768)"]; -"255 linear_6" -> "256 quantize_per_tensor_67" [style=solid, label="(1, 197, 3072)"]; -"256 quantize_per_tensor_67" -> "257 dequantize_per_tensor_68" [style=solid, label="(1, 197, 3072)"]; -"257 dequantize_per_tensor_68" -> "258 gelu_1" [style=solid, label="(1, 197, 3072)"]; -"258 gelu_1" -> "259 dropout_5" [style=solid, label="(1, 197, 3072)"]; -"259 dropout_5" -> "260 dropout_5_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 3072)"]; -"260 dropout_5_0_0_nncf_smooth_quant_0" -> "261 quantize_per_tensor_69" [style=solid, label="(1, 197, 3072)"]; -"261 quantize_per_tensor_69" -> "262 dequantize_per_tensor_70" [style=solid, label="(1, 197, 3072)"]; -"262 dequantize_per_tensor_70" -> "265 linear_7" [style=solid, label="(1, 197, 3072)"]; -"263 _frozen_param10" -> "264 dequantize_per_tensor_71" [style=solid, label="(768, 3072)"]; -"264 dequantize_per_tensor_71" -> "265 linear_7" [style=solid, label="(768, 3072)"]; -"265 linear_7" -> "266 quantize_per_tensor_72" [style=solid, label="(1, 197, 768)"]; -"266 quantize_per_tensor_72" -> "267 dequantize_per_tensor_73" [style=solid, label="(1, 197, 768)"]; -"267 
dequantize_per_tensor_73" -> "268 dropout_6" [style=solid, label="(1, 197, 768)"]; -"268 dropout_6" -> "269 quantize_per_tensor_74" [style=solid, label="(1, 197, 768)"]; -"269 quantize_per_tensor_74" -> "270 dequantize_per_tensor_75" [style=solid, label="(1, 197, 768)"]; -"270 dequantize_per_tensor_75" -> "271 add_4" [style=solid, label="(1, 197, 768)"]; -"271 add_4" -> "272 quantize_per_tensor_76" [style=solid, label="(1, 197, 768)"]; -"272 quantize_per_tensor_76" -> "273 dequantize_per_tensor_77" [style=solid, label="(1, 197, 768)"]; -"272 quantize_per_tensor_76" -> "274 dequantize_per_tensor_78" [style=solid, label="(1, 197, 768)"]; -"273 dequantize_per_tensor_77" -> "320 add_5" [style=solid, label="(1, 197, 768)"]; -"274 dequantize_per_tensor_78" -> "275 layer_norm_4" [style=solid, label="(1, 197, 768)"]; -"275 layer_norm_4" -> "276 transpose_12" [style=solid, label="(1, 197, 768)"]; -"276 transpose_12" -> "277 transpose_12_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 1, 768)"]; -"277 transpose_12_0_0_nncf_smooth_quant_0" -> "278 quantize_per_tensor_79" [style=solid, label="(197, 1, 768)"]; -"278 quantize_per_tensor_79" -> "279 dequantize_per_tensor_80" [style=solid, label="(197, 1, 768)"]; -"279 dequantize_per_tensor_80" -> "282 linear_8" [style=solid, label="(197, 1, 768)"]; -"280 _frozen_param11" -> "281 dequantize_per_tensor_81" [style=solid, label="(2304, 768)"]; -"281 dequantize_per_tensor_81" -> "282 linear_8" [style=solid, label="(2304, 768)"]; -"282 linear_8" -> "283 quantize_per_tensor_82" [style=solid, label="(197, 1, 2304)"]; -"283 quantize_per_tensor_82" -> "284 dequantize_per_tensor_83" [style=solid, label="(197, 1, 2304)"]; -"284 dequantize_per_tensor_83" -> "285 unflatten_2" [style=solid, label="(197, 1, 2304)"]; -"285 unflatten_2" -> "286 unsqueeze_2" [style=solid, label="(197, 1, 3, 768)"]; -"286 unsqueeze_2" -> "287 transpose_13" [style=solid, label="(1, 197, 1, 3, 768)"]; -"287 transpose_13" -> "288 squeeze_2" [style=solid, label="(3, 
197, 1, 1, 768)"]; -"288 squeeze_2" -> "289 contiguous_2" [style=solid, label="(3, 197, 1, 768)"]; -"289 contiguous_2" -> "290 select_6" [style=solid, label="(3, 197, 1, 768)"]; -"289 contiguous_2" -> "291 select_7" [style=solid, label="(3, 197, 1, 768)"]; -"289 contiguous_2" -> "292 select_8" [style=solid, label="(3, 197, 1, 768)"]; -"290 select_6" -> "293 view_16" [style=solid, label="(197, 1, 768)"]; -"291 select_7" -> "295 view_17" [style=solid, label="(197, 1, 768)"]; -"292 select_8" -> "297 view_18" [style=solid, label="(197, 1, 768)"]; -"293 view_16" -> "294 transpose_14" [style=solid, label="(197, 12, 64)"]; -"294 transpose_14" -> "299 view_19" [style=solid, label="(12, 197, 64)"]; -"295 view_17" -> "296 transpose_15" [style=solid, label="(197, 12, 64)"]; -"296 transpose_15" -> "300 view_20" [style=solid, label="(12, 197, 64)"]; -"297 view_18" -> "298 transpose_16" [style=solid, label="(197, 12, 64)"]; -"298 transpose_16" -> "301 view_21" [style=solid, label="(12, 197, 64)"]; -"299 view_19" -> "302 scaled_dot_product_attention_2" [style=solid, label="(1, 12, 197, 64)"]; -"300 view_20" -> "302 scaled_dot_product_attention_2" [style=solid, label="(1, 12, 197, 64)"]; -"301 view_21" -> "302 scaled_dot_product_attention_2" [style=solid, label="(1, 12, 197, 64)"]; -"302 scaled_dot_product_attention_2" -> "303 permute_3" [style=solid, label="(1, 12, 197, 64)"]; -"303 permute_3" -> "304 view_22" [style=solid, label="(197, 1, 12, 64)"]; -"304 view_22" -> "305 view_22_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 768)"]; -"305 view_22_0_0_nncf_smooth_quant_0" -> "306 quantize_per_tensor_84" [style=solid, label="(197, 768)"]; -"306 quantize_per_tensor_84" -> "307 dequantize_per_tensor_85" [style=solid, label="(197, 768)"]; -"307 dequantize_per_tensor_85" -> "310 linear_9" [style=solid, label="(197, 768)"]; -"308 _frozen_param12" -> "309 dequantize_per_tensor_86" [style=solid, label="(768, 768)"]; -"309 dequantize_per_tensor_86" -> "310 linear_9" [style=solid, 
label="(768, 768)"]; -"310 linear_9" -> "311 quantize_per_tensor_87" [style=solid, label="(197, 768)"]; -"311 quantize_per_tensor_87" -> "312 dequantize_per_tensor_88" [style=solid, label="(197, 768)"]; -"312 dequantize_per_tensor_88" -> "313 view_23" [style=solid, label="(197, 768)"]; -"313 view_23" -> "314 quantize_per_tensor_89" [style=solid, label="(197, 1, 768)"]; -"314 quantize_per_tensor_89" -> "315 dequantize_per_tensor_90" [style=solid, label="(197, 1, 768)"]; -"315 dequantize_per_tensor_90" -> "316 transpose_17" [style=solid, label="(197, 1, 768)"]; -"316 transpose_17" -> "317 dropout_7" [style=solid, label="(1, 197, 768)"]; -"317 dropout_7" -> "318 quantize_per_tensor_91" [style=solid, label="(1, 197, 768)"]; -"318 quantize_per_tensor_91" -> "319 dequantize_per_tensor_92" [style=solid, label="(1, 197, 768)"]; -"319 dequantize_per_tensor_92" -> "320 add_5" [style=solid, label="(1, 197, 768)"]; -"320 add_5" -> "321 quantize_per_tensor_93" [style=solid, label="(1, 197, 768)"]; -"321 quantize_per_tensor_93" -> "322 dequantize_per_tensor_94" [style=solid, label="(1, 197, 768)"]; -"321 quantize_per_tensor_93" -> "323 dequantize_per_tensor_95" [style=solid, label="(1, 197, 768)"]; -"322 dequantize_per_tensor_94" -> "346 add_6" [style=solid, label="(1, 197, 768)"]; -"323 dequantize_per_tensor_95" -> "324 layer_norm_5" [style=solid, label="(1, 197, 768)"]; -"324 layer_norm_5" -> "325 layer_norm_5_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 768)"]; -"325 layer_norm_5_0_0_nncf_smooth_quant_0" -> "326 quantize_per_tensor_96" [style=solid, label="(1, 197, 768)"]; -"326 quantize_per_tensor_96" -> "327 dequantize_per_tensor_97" [style=solid, label="(1, 197, 768)"]; -"327 dequantize_per_tensor_97" -> "330 linear_10" [style=solid, label="(1, 197, 768)"]; -"328 _frozen_param13" -> "329 dequantize_per_tensor_98" [style=solid, label="(3072, 768)"]; -"329 dequantize_per_tensor_98" -> "330 linear_10" [style=solid, label="(3072, 768)"]; -"330 linear_10" -> "331 
quantize_per_tensor_99" [style=solid, label="(1, 197, 3072)"]; -"331 quantize_per_tensor_99" -> "332 dequantize_per_tensor_100" [style=solid, label="(1, 197, 3072)"]; -"332 dequantize_per_tensor_100" -> "333 gelu_2" [style=solid, label="(1, 197, 3072)"]; -"333 gelu_2" -> "334 dropout_8" [style=solid, label="(1, 197, 3072)"]; -"334 dropout_8" -> "335 dropout_8_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 3072)"]; -"335 dropout_8_0_0_nncf_smooth_quant_0" -> "336 quantize_per_tensor_101" [style=solid, label="(1, 197, 3072)"]; -"336 quantize_per_tensor_101" -> "337 dequantize_per_tensor_102" [style=solid, label="(1, 197, 3072)"]; -"337 dequantize_per_tensor_102" -> "340 linear_11" [style=solid, label="(1, 197, 3072)"]; -"338 _frozen_param14" -> "339 dequantize_per_tensor_103" [style=solid, label="(768, 3072)"]; -"339 dequantize_per_tensor_103" -> "340 linear_11" [style=solid, label="(768, 3072)"]; -"340 linear_11" -> "341 quantize_per_tensor_104" [style=solid, label="(1, 197, 768)"]; -"341 quantize_per_tensor_104" -> "342 dequantize_per_tensor_105" [style=solid, label="(1, 197, 768)"]; -"342 dequantize_per_tensor_105" -> "343 dropout_9" [style=solid, label="(1, 197, 768)"]; -"343 dropout_9" -> "344 quantize_per_tensor_106" [style=solid, label="(1, 197, 768)"]; -"344 quantize_per_tensor_106" -> "345 dequantize_per_tensor_107" [style=solid, label="(1, 197, 768)"]; -"345 dequantize_per_tensor_107" -> "346 add_6" [style=solid, label="(1, 197, 768)"]; -"346 add_6" -> "347 quantize_per_tensor_108" [style=solid, label="(1, 197, 768)"]; -"347 quantize_per_tensor_108" -> "348 dequantize_per_tensor_109" [style=solid, label="(1, 197, 768)"]; -"347 quantize_per_tensor_108" -> "349 dequantize_per_tensor_110" [style=solid, label="(1, 197, 768)"]; -"348 dequantize_per_tensor_109" -> "395 add_7" [style=solid, label="(1, 197, 768)"]; -"349 dequantize_per_tensor_110" -> "350 layer_norm_6" [style=solid, label="(1, 197, 768)"]; -"350 layer_norm_6" -> "351 transpose_18" 
[style=solid, label="(1, 197, 768)"]; -"351 transpose_18" -> "352 transpose_18_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 1, 768)"]; -"352 transpose_18_0_0_nncf_smooth_quant_0" -> "353 quantize_per_tensor_111" [style=solid, label="(197, 1, 768)"]; -"353 quantize_per_tensor_111" -> "354 dequantize_per_tensor_112" [style=solid, label="(197, 1, 768)"]; -"354 dequantize_per_tensor_112" -> "357 linear_12" [style=solid, label="(197, 1, 768)"]; -"355 _frozen_param15" -> "356 dequantize_per_tensor_113" [style=solid, label="(2304, 768)"]; -"356 dequantize_per_tensor_113" -> "357 linear_12" [style=solid, label="(2304, 768)"]; -"357 linear_12" -> "358 quantize_per_tensor_114" [style=solid, label="(197, 1, 2304)"]; -"358 quantize_per_tensor_114" -> "359 dequantize_per_tensor_115" [style=solid, label="(197, 1, 2304)"]; -"359 dequantize_per_tensor_115" -> "360 unflatten_3" [style=solid, label="(197, 1, 2304)"]; -"360 unflatten_3" -> "361 unsqueeze_3" [style=solid, label="(197, 1, 3, 768)"]; -"361 unsqueeze_3" -> "362 transpose_19" [style=solid, label="(1, 197, 1, 3, 768)"]; -"362 transpose_19" -> "363 squeeze_3" [style=solid, label="(3, 197, 1, 1, 768)"]; -"363 squeeze_3" -> "364 contiguous_3" [style=solid, label="(3, 197, 1, 768)"]; -"364 contiguous_3" -> "365 select_9" [style=solid, label="(3, 197, 1, 768)"]; -"364 contiguous_3" -> "366 select_10" [style=solid, label="(3, 197, 1, 768)"]; -"364 contiguous_3" -> "367 select_11" [style=solid, label="(3, 197, 1, 768)"]; -"365 select_9" -> "368 view_24" [style=solid, label="(197, 1, 768)"]; -"366 select_10" -> "370 view_25" [style=solid, label="(197, 1, 768)"]; -"367 select_11" -> "372 view_26" [style=solid, label="(197, 1, 768)"]; -"368 view_24" -> "369 transpose_20" [style=solid, label="(197, 12, 64)"]; -"369 transpose_20" -> "374 view_27" [style=solid, label="(12, 197, 64)"]; -"370 view_25" -> "371 transpose_21" [style=solid, label="(197, 12, 64)"]; -"371 transpose_21" -> "375 view_28" [style=solid, label="(12, 197, 
64)"]; -"372 view_26" -> "373 transpose_22" [style=solid, label="(197, 12, 64)"]; -"373 transpose_22" -> "376 view_29" [style=solid, label="(12, 197, 64)"]; -"374 view_27" -> "377 scaled_dot_product_attention_3" [style=solid, label="(1, 12, 197, 64)"]; -"375 view_28" -> "377 scaled_dot_product_attention_3" [style=solid, label="(1, 12, 197, 64)"]; -"376 view_29" -> "377 scaled_dot_product_attention_3" [style=solid, label="(1, 12, 197, 64)"]; -"377 scaled_dot_product_attention_3" -> "378 permute_4" [style=solid, label="(1, 12, 197, 64)"]; -"378 permute_4" -> "379 view_30" [style=solid, label="(197, 1, 12, 64)"]; -"379 view_30" -> "380 view_30_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 768)"]; -"380 view_30_0_0_nncf_smooth_quant_0" -> "381 quantize_per_tensor_116" [style=solid, label="(197, 768)"]; -"381 quantize_per_tensor_116" -> "382 dequantize_per_tensor_117" [style=solid, label="(197, 768)"]; -"382 dequantize_per_tensor_117" -> "385 linear_13" [style=solid, label="(197, 768)"]; -"383 _frozen_param16" -> "384 dequantize_per_tensor_118" [style=solid, label="(768, 768)"]; -"384 dequantize_per_tensor_118" -> "385 linear_13" [style=solid, label="(768, 768)"]; -"385 linear_13" -> "386 quantize_per_tensor_119" [style=solid, label="(197, 768)"]; -"386 quantize_per_tensor_119" -> "387 dequantize_per_tensor_120" [style=solid, label="(197, 768)"]; -"387 dequantize_per_tensor_120" -> "388 view_31" [style=solid, label="(197, 768)"]; -"388 view_31" -> "389 quantize_per_tensor_121" [style=solid, label="(197, 1, 768)"]; -"389 quantize_per_tensor_121" -> "390 dequantize_per_tensor_122" [style=solid, label="(197, 1, 768)"]; -"390 dequantize_per_tensor_122" -> "391 transpose_23" [style=solid, label="(197, 1, 768)"]; -"391 transpose_23" -> "392 dropout_10" [style=solid, label="(1, 197, 768)"]; -"392 dropout_10" -> "393 quantize_per_tensor_123" [style=solid, label="(1, 197, 768)"]; -"393 quantize_per_tensor_123" -> "394 dequantize_per_tensor_124" [style=solid, label="(1, 
197, 768)"]; -"394 dequantize_per_tensor_124" -> "395 add_7" [style=solid, label="(1, 197, 768)"]; -"395 add_7" -> "396 quantize_per_tensor_125" [style=solid, label="(1, 197, 768)"]; -"396 quantize_per_tensor_125" -> "397 dequantize_per_tensor_126" [style=solid, label="(1, 197, 768)"]; -"396 quantize_per_tensor_125" -> "398 dequantize_per_tensor_127" [style=solid, label="(1, 197, 768)"]; -"397 dequantize_per_tensor_126" -> "421 add_8" [style=solid, label="(1, 197, 768)"]; -"398 dequantize_per_tensor_127" -> "399 layer_norm_7" [style=solid, label="(1, 197, 768)"]; -"399 layer_norm_7" -> "400 layer_norm_7_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 768)"]; -"400 layer_norm_7_0_0_nncf_smooth_quant_0" -> "401 quantize_per_tensor_128" [style=solid, label="(1, 197, 768)"]; -"401 quantize_per_tensor_128" -> "402 dequantize_per_tensor_129" [style=solid, label="(1, 197, 768)"]; -"402 dequantize_per_tensor_129" -> "405 linear_14" [style=solid, label="(1, 197, 768)"]; -"403 _frozen_param17" -> "404 dequantize_per_tensor_130" [style=solid, label="(3072, 768)"]; -"404 dequantize_per_tensor_130" -> "405 linear_14" [style=solid, label="(3072, 768)"]; -"405 linear_14" -> "406 quantize_per_tensor_131" [style=solid, label="(1, 197, 3072)"]; -"406 quantize_per_tensor_131" -> "407 dequantize_per_tensor_132" [style=solid, label="(1, 197, 3072)"]; -"407 dequantize_per_tensor_132" -> "408 gelu_3" [style=solid, label="(1, 197, 3072)"]; -"408 gelu_3" -> "409 dropout_11" [style=solid, label="(1, 197, 3072)"]; -"409 dropout_11" -> "410 dropout_11_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 3072)"]; -"410 dropout_11_0_0_nncf_smooth_quant_0" -> "411 quantize_per_tensor_133" [style=solid, label="(1, 197, 3072)"]; -"411 quantize_per_tensor_133" -> "412 dequantize_per_tensor_134" [style=solid, label="(1, 197, 3072)"]; -"412 dequantize_per_tensor_134" -> "415 linear_15" [style=solid, label="(1, 197, 3072)"]; -"413 _frozen_param18" -> "414 dequantize_per_tensor_135" 
[style=solid, label="(768, 3072)"]; -"414 dequantize_per_tensor_135" -> "415 linear_15" [style=solid, label="(768, 3072)"]; -"415 linear_15" -> "416 quantize_per_tensor_136" [style=solid, label="(1, 197, 768)"]; -"416 quantize_per_tensor_136" -> "417 dequantize_per_tensor_137" [style=solid, label="(1, 197, 768)"]; -"417 dequantize_per_tensor_137" -> "418 dropout_12" [style=solid, label="(1, 197, 768)"]; -"418 dropout_12" -> "419 quantize_per_tensor_138" [style=solid, label="(1, 197, 768)"]; -"419 quantize_per_tensor_138" -> "420 dequantize_per_tensor_139" [style=solid, label="(1, 197, 768)"]; -"420 dequantize_per_tensor_139" -> "421 add_8" [style=solid, label="(1, 197, 768)"]; -"421 add_8" -> "422 quantize_per_tensor_140" [style=solid, label="(1, 197, 768)"]; -"422 quantize_per_tensor_140" -> "423 dequantize_per_tensor_141" [style=solid, label="(1, 197, 768)"]; -"422 quantize_per_tensor_140" -> "424 dequantize_per_tensor_142" [style=solid, label="(1, 197, 768)"]; -"423 dequantize_per_tensor_141" -> "470 add_9" [style=solid, label="(1, 197, 768)"]; -"424 dequantize_per_tensor_142" -> "425 layer_norm_8" [style=solid, label="(1, 197, 768)"]; -"425 layer_norm_8" -> "426 transpose_24" [style=solid, label="(1, 197, 768)"]; -"426 transpose_24" -> "427 transpose_24_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 1, 768)"]; -"427 transpose_24_0_0_nncf_smooth_quant_0" -> "428 quantize_per_tensor_143" [style=solid, label="(197, 1, 768)"]; -"428 quantize_per_tensor_143" -> "429 dequantize_per_tensor_144" [style=solid, label="(197, 1, 768)"]; -"429 dequantize_per_tensor_144" -> "432 linear_16" [style=solid, label="(197, 1, 768)"]; -"430 _frozen_param19" -> "431 dequantize_per_tensor_145" [style=solid, label="(2304, 768)"]; -"431 dequantize_per_tensor_145" -> "432 linear_16" [style=solid, label="(2304, 768)"]; -"432 linear_16" -> "433 quantize_per_tensor_146" [style=solid, label="(197, 1, 2304)"]; -"433 quantize_per_tensor_146" -> "434 dequantize_per_tensor_147" 
[style=solid, label="(197, 1, 2304)"]; -"434 dequantize_per_tensor_147" -> "435 unflatten_4" [style=solid, label="(197, 1, 2304)"]; -"435 unflatten_4" -> "436 unsqueeze_4" [style=solid, label="(197, 1, 3, 768)"]; -"436 unsqueeze_4" -> "437 transpose_25" [style=solid, label="(1, 197, 1, 3, 768)"]; -"437 transpose_25" -> "438 squeeze_4" [style=solid, label="(3, 197, 1, 1, 768)"]; -"438 squeeze_4" -> "439 contiguous_4" [style=solid, label="(3, 197, 1, 768)"]; -"439 contiguous_4" -> "440 select_12" [style=solid, label="(3, 197, 1, 768)"]; -"439 contiguous_4" -> "441 select_13" [style=solid, label="(3, 197, 1, 768)"]; -"439 contiguous_4" -> "442 select_14" [style=solid, label="(3, 197, 1, 768)"]; -"440 select_12" -> "443 view_32" [style=solid, label="(197, 1, 768)"]; -"441 select_13" -> "445 view_33" [style=solid, label="(197, 1, 768)"]; -"442 select_14" -> "447 view_34" [style=solid, label="(197, 1, 768)"]; -"443 view_32" -> "444 transpose_26" [style=solid, label="(197, 12, 64)"]; -"444 transpose_26" -> "449 view_35" [style=solid, label="(12, 197, 64)"]; -"445 view_33" -> "446 transpose_27" [style=solid, label="(197, 12, 64)"]; -"446 transpose_27" -> "450 view_36" [style=solid, label="(12, 197, 64)"]; -"447 view_34" -> "448 transpose_28" [style=solid, label="(197, 12, 64)"]; -"448 transpose_28" -> "451 view_37" [style=solid, label="(12, 197, 64)"]; -"449 view_35" -> "452 scaled_dot_product_attention_4" [style=solid, label="(1, 12, 197, 64)"]; -"450 view_36" -> "452 scaled_dot_product_attention_4" [style=solid, label="(1, 12, 197, 64)"]; -"451 view_37" -> "452 scaled_dot_product_attention_4" [style=solid, label="(1, 12, 197, 64)"]; -"452 scaled_dot_product_attention_4" -> "453 permute_5" [style=solid, label="(1, 12, 197, 64)"]; -"453 permute_5" -> "454 view_38" [style=solid, label="(197, 1, 12, 64)"]; -"454 view_38" -> "455 view_38_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 768)"]; -"455 view_38_0_0_nncf_smooth_quant_0" -> "456 quantize_per_tensor_148" 
[style=solid, label="(197, 768)"]; -"456 quantize_per_tensor_148" -> "457 dequantize_per_tensor_149" [style=solid, label="(197, 768)"]; -"457 dequantize_per_tensor_149" -> "460 linear_17" [style=solid, label="(197, 768)"]; -"458 _frozen_param20" -> "459 dequantize_per_tensor_150" [style=solid, label="(768, 768)"]; -"459 dequantize_per_tensor_150" -> "460 linear_17" [style=solid, label="(768, 768)"]; -"460 linear_17" -> "461 quantize_per_tensor_151" [style=solid, label="(197, 768)"]; -"461 quantize_per_tensor_151" -> "462 dequantize_per_tensor_152" [style=solid, label="(197, 768)"]; -"462 dequantize_per_tensor_152" -> "463 view_39" [style=solid, label="(197, 768)"]; -"463 view_39" -> "464 quantize_per_tensor_153" [style=solid, label="(197, 1, 768)"]; -"464 quantize_per_tensor_153" -> "465 dequantize_per_tensor_154" [style=solid, label="(197, 1, 768)"]; -"465 dequantize_per_tensor_154" -> "466 transpose_29" [style=solid, label="(197, 1, 768)"]; -"466 transpose_29" -> "467 dropout_13" [style=solid, label="(1, 197, 768)"]; -"467 dropout_13" -> "468 quantize_per_tensor_155" [style=solid, label="(1, 197, 768)"]; -"468 quantize_per_tensor_155" -> "469 dequantize_per_tensor_156" [style=solid, label="(1, 197, 768)"]; -"469 dequantize_per_tensor_156" -> "470 add_9" [style=solid, label="(1, 197, 768)"]; -"470 add_9" -> "471 quantize_per_tensor_157" [style=solid, label="(1, 197, 768)"]; -"471 quantize_per_tensor_157" -> "472 dequantize_per_tensor_158" [style=solid, label="(1, 197, 768)"]; -"471 quantize_per_tensor_157" -> "473 dequantize_per_tensor_159" [style=solid, label="(1, 197, 768)"]; -"472 dequantize_per_tensor_158" -> "496 add_10" [style=solid, label="(1, 197, 768)"]; -"473 dequantize_per_tensor_159" -> "474 layer_norm_9" [style=solid, label="(1, 197, 768)"]; -"474 layer_norm_9" -> "475 layer_norm_9_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 768)"]; -"475 layer_norm_9_0_0_nncf_smooth_quant_0" -> "476 quantize_per_tensor_160" [style=solid, label="(1, 197, 
768)"]; -"476 quantize_per_tensor_160" -> "477 dequantize_per_tensor_161" [style=solid, label="(1, 197, 768)"]; -"477 dequantize_per_tensor_161" -> "480 linear_18" [style=solid, label="(1, 197, 768)"]; -"478 _frozen_param21" -> "479 dequantize_per_tensor_162" [style=solid, label="(3072, 768)"]; -"479 dequantize_per_tensor_162" -> "480 linear_18" [style=solid, label="(3072, 768)"]; -"480 linear_18" -> "481 quantize_per_tensor_163" [style=solid, label="(1, 197, 3072)"]; -"481 quantize_per_tensor_163" -> "482 dequantize_per_tensor_164" [style=solid, label="(1, 197, 3072)"]; -"482 dequantize_per_tensor_164" -> "483 gelu_4" [style=solid, label="(1, 197, 3072)"]; -"483 gelu_4" -> "484 dropout_14" [style=solid, label="(1, 197, 3072)"]; -"484 dropout_14" -> "485 dropout_14_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 3072)"]; -"485 dropout_14_0_0_nncf_smooth_quant_0" -> "486 quantize_per_tensor_165" [style=solid, label="(1, 197, 3072)"]; -"486 quantize_per_tensor_165" -> "487 dequantize_per_tensor_166" [style=solid, label="(1, 197, 3072)"]; -"487 dequantize_per_tensor_166" -> "490 linear_19" [style=solid, label="(1, 197, 3072)"]; -"488 _frozen_param22" -> "489 dequantize_per_tensor_167" [style=solid, label="(768, 3072)"]; -"489 dequantize_per_tensor_167" -> "490 linear_19" [style=solid, label="(768, 3072)"]; -"490 linear_19" -> "491 quantize_per_tensor_168" [style=solid, label="(1, 197, 768)"]; -"491 quantize_per_tensor_168" -> "492 dequantize_per_tensor_169" [style=solid, label="(1, 197, 768)"]; -"492 dequantize_per_tensor_169" -> "493 dropout_15" [style=solid, label="(1, 197, 768)"]; -"493 dropout_15" -> "494 quantize_per_tensor_170" [style=solid, label="(1, 197, 768)"]; -"494 quantize_per_tensor_170" -> "495 dequantize_per_tensor_171" [style=solid, label="(1, 197, 768)"]; -"495 dequantize_per_tensor_171" -> "496 add_10" [style=solid, label="(1, 197, 768)"]; -"496 add_10" -> "497 quantize_per_tensor_172" [style=solid, label="(1, 197, 768)"]; -"497 
quantize_per_tensor_172" -> "498 dequantize_per_tensor_173" [style=solid, label="(1, 197, 768)"]; -"497 quantize_per_tensor_172" -> "499 dequantize_per_tensor_174" [style=solid, label="(1, 197, 768)"]; -"498 dequantize_per_tensor_173" -> "545 add_11" [style=solid, label="(1, 197, 768)"]; -"499 dequantize_per_tensor_174" -> "500 layer_norm_10" [style=solid, label="(1, 197, 768)"]; -"500 layer_norm_10" -> "501 transpose_30" [style=solid, label="(1, 197, 768)"]; -"501 transpose_30" -> "502 transpose_30_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 1, 768)"]; -"502 transpose_30_0_0_nncf_smooth_quant_0" -> "503 quantize_per_tensor_175" [style=solid, label="(197, 1, 768)"]; -"503 quantize_per_tensor_175" -> "504 dequantize_per_tensor_176" [style=solid, label="(197, 1, 768)"]; -"504 dequantize_per_tensor_176" -> "507 linear_20" [style=solid, label="(197, 1, 768)"]; -"505 _frozen_param23" -> "506 dequantize_per_tensor_177" [style=solid, label="(2304, 768)"]; -"506 dequantize_per_tensor_177" -> "507 linear_20" [style=solid, label="(2304, 768)"]; -"507 linear_20" -> "508 quantize_per_tensor_178" [style=solid, label="(197, 1, 2304)"]; -"508 quantize_per_tensor_178" -> "509 dequantize_per_tensor_179" [style=solid, label="(197, 1, 2304)"]; -"509 dequantize_per_tensor_179" -> "510 unflatten_5" [style=solid, label="(197, 1, 2304)"]; -"510 unflatten_5" -> "511 unsqueeze_5" [style=solid, label="(197, 1, 3, 768)"]; -"511 unsqueeze_5" -> "512 transpose_31" [style=solid, label="(1, 197, 1, 3, 768)"]; -"512 transpose_31" -> "513 squeeze_5" [style=solid, label="(3, 197, 1, 1, 768)"]; -"513 squeeze_5" -> "514 contiguous_5" [style=solid, label="(3, 197, 1, 768)"]; -"514 contiguous_5" -> "515 select_15" [style=solid, label="(3, 197, 1, 768)"]; -"514 contiguous_5" -> "516 select_16" [style=solid, label="(3, 197, 1, 768)"]; -"514 contiguous_5" -> "517 select_17" [style=solid, label="(3, 197, 1, 768)"]; -"515 select_15" -> "518 view_40" [style=solid, label="(197, 1, 768)"]; -"516 
select_16" -> "520 view_41" [style=solid, label="(197, 1, 768)"]; -"517 select_17" -> "522 view_42" [style=solid, label="(197, 1, 768)"]; -"518 view_40" -> "519 transpose_32" [style=solid, label="(197, 12, 64)"]; -"519 transpose_32" -> "524 view_43" [style=solid, label="(12, 197, 64)"]; -"520 view_41" -> "521 transpose_33" [style=solid, label="(197, 12, 64)"]; -"521 transpose_33" -> "525 view_44" [style=solid, label="(12, 197, 64)"]; -"522 view_42" -> "523 transpose_34" [style=solid, label="(197, 12, 64)"]; -"523 transpose_34" -> "526 view_45" [style=solid, label="(12, 197, 64)"]; -"524 view_43" -> "527 scaled_dot_product_attention_5" [style=solid, label="(1, 12, 197, 64)"]; -"525 view_44" -> "527 scaled_dot_product_attention_5" [style=solid, label="(1, 12, 197, 64)"]; -"526 view_45" -> "527 scaled_dot_product_attention_5" [style=solid, label="(1, 12, 197, 64)"]; -"527 scaled_dot_product_attention_5" -> "528 permute_6" [style=solid, label="(1, 12, 197, 64)"]; -"528 permute_6" -> "529 view_46" [style=solid, label="(197, 1, 12, 64)"]; -"529 view_46" -> "530 view_46_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 768)"]; -"530 view_46_0_0_nncf_smooth_quant_0" -> "531 quantize_per_tensor_180" [style=solid, label="(197, 768)"]; -"531 quantize_per_tensor_180" -> "532 dequantize_per_tensor_181" [style=solid, label="(197, 768)"]; -"532 dequantize_per_tensor_181" -> "535 linear_21" [style=solid, label="(197, 768)"]; -"533 _frozen_param24" -> "534 dequantize_per_tensor_182" [style=solid, label="(768, 768)"]; -"534 dequantize_per_tensor_182" -> "535 linear_21" [style=solid, label="(768, 768)"]; -"535 linear_21" -> "536 quantize_per_tensor_183" [style=solid, label="(197, 768)"]; -"536 quantize_per_tensor_183" -> "537 dequantize_per_tensor_184" [style=solid, label="(197, 768)"]; -"537 dequantize_per_tensor_184" -> "538 view_47" [style=solid, label="(197, 768)"]; -"538 view_47" -> "539 quantize_per_tensor_185" [style=solid, label="(197, 1, 768)"]; -"539 
quantize_per_tensor_185" -> "540 dequantize_per_tensor_186" [style=solid, label="(197, 1, 768)"]; -"540 dequantize_per_tensor_186" -> "541 transpose_35" [style=solid, label="(197, 1, 768)"]; -"541 transpose_35" -> "542 dropout_16" [style=solid, label="(1, 197, 768)"]; -"542 dropout_16" -> "543 quantize_per_tensor_187" [style=solid, label="(1, 197, 768)"]; -"543 quantize_per_tensor_187" -> "544 dequantize_per_tensor_188" [style=solid, label="(1, 197, 768)"]; -"544 dequantize_per_tensor_188" -> "545 add_11" [style=solid, label="(1, 197, 768)"]; -"545 add_11" -> "546 quantize_per_tensor_189" [style=solid, label="(1, 197, 768)"]; -"546 quantize_per_tensor_189" -> "547 dequantize_per_tensor_190" [style=solid, label="(1, 197, 768)"]; -"546 quantize_per_tensor_189" -> "548 dequantize_per_tensor_191" [style=solid, label="(1, 197, 768)"]; -"547 dequantize_per_tensor_190" -> "571 add_12" [style=solid, label="(1, 197, 768)"]; -"548 dequantize_per_tensor_191" -> "549 layer_norm_11" [style=solid, label="(1, 197, 768)"]; -"549 layer_norm_11" -> "550 layer_norm_11_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 768)"]; -"550 layer_norm_11_0_0_nncf_smooth_quant_0" -> "551 quantize_per_tensor_192" [style=solid, label="(1, 197, 768)"]; -"551 quantize_per_tensor_192" -> "552 dequantize_per_tensor_193" [style=solid, label="(1, 197, 768)"]; -"552 dequantize_per_tensor_193" -> "555 linear_22" [style=solid, label="(1, 197, 768)"]; -"553 _frozen_param25" -> "554 dequantize_per_tensor_194" [style=solid, label="(3072, 768)"]; -"554 dequantize_per_tensor_194" -> "555 linear_22" [style=solid, label="(3072, 768)"]; -"555 linear_22" -> "556 quantize_per_tensor_195" [style=solid, label="(1, 197, 3072)"]; -"556 quantize_per_tensor_195" -> "557 dequantize_per_tensor_196" [style=solid, label="(1, 197, 3072)"]; -"557 dequantize_per_tensor_196" -> "558 gelu_5" [style=solid, label="(1, 197, 3072)"]; -"558 gelu_5" -> "559 dropout_17" [style=solid, label="(1, 197, 3072)"]; -"559 dropout_17" -> 
"560 dropout_17_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 3072)"]; -"560 dropout_17_0_0_nncf_smooth_quant_0" -> "561 quantize_per_tensor_197" [style=solid, label="(1, 197, 3072)"]; -"561 quantize_per_tensor_197" -> "562 dequantize_per_tensor_198" [style=solid, label="(1, 197, 3072)"]; -"562 dequantize_per_tensor_198" -> "565 linear_23" [style=solid, label="(1, 197, 3072)"]; -"563 _frozen_param26" -> "564 dequantize_per_tensor_199" [style=solid, label="(768, 3072)"]; -"564 dequantize_per_tensor_199" -> "565 linear_23" [style=solid, label="(768, 3072)"]; -"565 linear_23" -> "566 quantize_per_tensor_200" [style=solid, label="(1, 197, 768)"]; -"566 quantize_per_tensor_200" -> "567 dequantize_per_tensor_201" [style=solid, label="(1, 197, 768)"]; -"567 dequantize_per_tensor_201" -> "568 dropout_18" [style=solid, label="(1, 197, 768)"]; -"568 dropout_18" -> "569 quantize_per_tensor_202" [style=solid, label="(1, 197, 768)"]; -"569 quantize_per_tensor_202" -> "570 dequantize_per_tensor_203" [style=solid, label="(1, 197, 768)"]; -"570 dequantize_per_tensor_203" -> "571 add_12" [style=solid, label="(1, 197, 768)"]; -"571 add_12" -> "572 quantize_per_tensor_204" [style=solid, label="(1, 197, 768)"]; -"572 quantize_per_tensor_204" -> "573 dequantize_per_tensor_205" [style=solid, label="(1, 197, 768)"]; -"572 quantize_per_tensor_204" -> "574 dequantize_per_tensor_206" [style=solid, label="(1, 197, 768)"]; -"573 dequantize_per_tensor_205" -> "620 add_13" [style=solid, label="(1, 197, 768)"]; -"574 dequantize_per_tensor_206" -> "575 layer_norm_12" [style=solid, label="(1, 197, 768)"]; -"575 layer_norm_12" -> "576 transpose_36" [style=solid, label="(1, 197, 768)"]; -"576 transpose_36" -> "577 transpose_36_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 1, 768)"]; -"577 transpose_36_0_0_nncf_smooth_quant_0" -> "578 quantize_per_tensor_207" [style=solid, label="(197, 1, 768)"]; -"578 quantize_per_tensor_207" -> "579 dequantize_per_tensor_208" [style=solid, 
label="(197, 1, 768)"]; -"579 dequantize_per_tensor_208" -> "582 linear_24" [style=solid, label="(197, 1, 768)"]; -"580 _frozen_param27" -> "581 dequantize_per_tensor_209" [style=solid, label="(2304, 768)"]; -"581 dequantize_per_tensor_209" -> "582 linear_24" [style=solid, label="(2304, 768)"]; -"582 linear_24" -> "583 quantize_per_tensor_210" [style=solid, label="(197, 1, 2304)"]; -"583 quantize_per_tensor_210" -> "584 dequantize_per_tensor_211" [style=solid, label="(197, 1, 2304)"]; -"584 dequantize_per_tensor_211" -> "585 unflatten_6" [style=solid, label="(197, 1, 2304)"]; -"585 unflatten_6" -> "586 unsqueeze_6" [style=solid, label="(197, 1, 3, 768)"]; -"586 unsqueeze_6" -> "587 transpose_37" [style=solid, label="(1, 197, 1, 3, 768)"]; -"587 transpose_37" -> "588 squeeze_6" [style=solid, label="(3, 197, 1, 1, 768)"]; -"588 squeeze_6" -> "589 contiguous_6" [style=solid, label="(3, 197, 1, 768)"]; -"589 contiguous_6" -> "590 select_18" [style=solid, label="(3, 197, 1, 768)"]; -"589 contiguous_6" -> "591 select_19" [style=solid, label="(3, 197, 1, 768)"]; -"589 contiguous_6" -> "592 select_20" [style=solid, label="(3, 197, 1, 768)"]; -"590 select_18" -> "593 view_48" [style=solid, label="(197, 1, 768)"]; -"591 select_19" -> "595 view_49" [style=solid, label="(197, 1, 768)"]; -"592 select_20" -> "597 view_50" [style=solid, label="(197, 1, 768)"]; -"593 view_48" -> "594 transpose_38" [style=solid, label="(197, 12, 64)"]; -"594 transpose_38" -> "599 view_51" [style=solid, label="(12, 197, 64)"]; -"595 view_49" -> "596 transpose_39" [style=solid, label="(197, 12, 64)"]; -"596 transpose_39" -> "600 view_52" [style=solid, label="(12, 197, 64)"]; -"597 view_50" -> "598 transpose_40" [style=solid, label="(197, 12, 64)"]; -"598 transpose_40" -> "601 view_53" [style=solid, label="(12, 197, 64)"]; -"599 view_51" -> "602 scaled_dot_product_attention_6" [style=solid, label="(1, 12, 197, 64)"]; -"600 view_52" -> "602 scaled_dot_product_attention_6" [style=solid, label="(1, 12, 
197, 64)"]; -"601 view_53" -> "602 scaled_dot_product_attention_6" [style=solid, label="(1, 12, 197, 64)"]; -"602 scaled_dot_product_attention_6" -> "603 permute_7" [style=solid, label="(1, 12, 197, 64)"]; -"603 permute_7" -> "604 view_54" [style=solid, label="(197, 1, 12, 64)"]; -"604 view_54" -> "605 view_54_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 768)"]; -"605 view_54_0_0_nncf_smooth_quant_0" -> "606 quantize_per_tensor_212" [style=solid, label="(197, 768)"]; -"606 quantize_per_tensor_212" -> "607 dequantize_per_tensor_213" [style=solid, label="(197, 768)"]; -"607 dequantize_per_tensor_213" -> "610 linear_25" [style=solid, label="(197, 768)"]; -"608 _frozen_param28" -> "609 dequantize_per_tensor_214" [style=solid, label="(768, 768)"]; -"609 dequantize_per_tensor_214" -> "610 linear_25" [style=solid, label="(768, 768)"]; -"610 linear_25" -> "611 quantize_per_tensor_215" [style=solid, label="(197, 768)"]; -"611 quantize_per_tensor_215" -> "612 dequantize_per_tensor_216" [style=solid, label="(197, 768)"]; -"612 dequantize_per_tensor_216" -> "613 view_55" [style=solid, label="(197, 768)"]; -"613 view_55" -> "614 quantize_per_tensor_217" [style=solid, label="(197, 1, 768)"]; -"614 quantize_per_tensor_217" -> "615 dequantize_per_tensor_218" [style=solid, label="(197, 1, 768)"]; -"615 dequantize_per_tensor_218" -> "616 transpose_41" [style=solid, label="(197, 1, 768)"]; -"616 transpose_41" -> "617 dropout_19" [style=solid, label="(1, 197, 768)"]; -"617 dropout_19" -> "618 quantize_per_tensor_219" [style=solid, label="(1, 197, 768)"]; -"618 quantize_per_tensor_219" -> "619 dequantize_per_tensor_220" [style=solid, label="(1, 197, 768)"]; -"619 dequantize_per_tensor_220" -> "620 add_13" [style=solid, label="(1, 197, 768)"]; -"620 add_13" -> "621 quantize_per_tensor_221" [style=solid, label="(1, 197, 768)"]; -"621 quantize_per_tensor_221" -> "622 dequantize_per_tensor_222" [style=solid, label="(1, 197, 768)"]; -"621 quantize_per_tensor_221" -> "623 
dequantize_per_tensor_223" [style=solid, label="(1, 197, 768)"]; -"622 dequantize_per_tensor_222" -> "646 add_14" [style=solid, label="(1, 197, 768)"]; -"623 dequantize_per_tensor_223" -> "624 layer_norm_13" [style=solid, label="(1, 197, 768)"]; -"624 layer_norm_13" -> "625 layer_norm_13_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 768)"]; -"625 layer_norm_13_0_0_nncf_smooth_quant_0" -> "626 quantize_per_tensor_224" [style=solid, label="(1, 197, 768)"]; -"626 quantize_per_tensor_224" -> "627 dequantize_per_tensor_225" [style=solid, label="(1, 197, 768)"]; -"627 dequantize_per_tensor_225" -> "630 linear_26" [style=solid, label="(1, 197, 768)"]; -"628 _frozen_param29" -> "629 dequantize_per_tensor_226" [style=solid, label="(3072, 768)"]; -"629 dequantize_per_tensor_226" -> "630 linear_26" [style=solid, label="(3072, 768)"]; -"630 linear_26" -> "631 quantize_per_tensor_227" [style=solid, label="(1, 197, 3072)"]; -"631 quantize_per_tensor_227" -> "632 dequantize_per_tensor_228" [style=solid, label="(1, 197, 3072)"]; -"632 dequantize_per_tensor_228" -> "633 gelu_6" [style=solid, label="(1, 197, 3072)"]; -"633 gelu_6" -> "634 dropout_20" [style=solid, label="(1, 197, 3072)"]; -"634 dropout_20" -> "635 dropout_20_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 3072)"]; -"635 dropout_20_0_0_nncf_smooth_quant_0" -> "636 quantize_per_tensor_229" [style=solid, label="(1, 197, 3072)"]; -"636 quantize_per_tensor_229" -> "637 dequantize_per_tensor_230" [style=solid, label="(1, 197, 3072)"]; -"637 dequantize_per_tensor_230" -> "640 linear_27" [style=solid, label="(1, 197, 3072)"]; -"638 _frozen_param30" -> "639 dequantize_per_tensor_231" [style=solid, label="(768, 3072)"]; -"639 dequantize_per_tensor_231" -> "640 linear_27" [style=solid, label="(768, 3072)"]; -"640 linear_27" -> "641 quantize_per_tensor_232" [style=solid, label="(1, 197, 768)"]; -"641 quantize_per_tensor_232" -> "642 dequantize_per_tensor_233" [style=solid, label="(1, 197, 768)"]; -"642 
dequantize_per_tensor_233" -> "643 dropout_21" [style=solid, label="(1, 197, 768)"]; -"643 dropout_21" -> "644 quantize_per_tensor_234" [style=solid, label="(1, 197, 768)"]; -"644 quantize_per_tensor_234" -> "645 dequantize_per_tensor_235" [style=solid, label="(1, 197, 768)"]; -"645 dequantize_per_tensor_235" -> "646 add_14" [style=solid, label="(1, 197, 768)"]; -"646 add_14" -> "647 quantize_per_tensor_236" [style=solid, label="(1, 197, 768)"]; -"647 quantize_per_tensor_236" -> "648 dequantize_per_tensor_237" [style=solid, label="(1, 197, 768)"]; -"647 quantize_per_tensor_236" -> "649 dequantize_per_tensor_238" [style=solid, label="(1, 197, 768)"]; -"648 dequantize_per_tensor_237" -> "695 add_15" [style=solid, label="(1, 197, 768)"]; -"649 dequantize_per_tensor_238" -> "650 layer_norm_14" [style=solid, label="(1, 197, 768)"]; -"650 layer_norm_14" -> "651 transpose_42" [style=solid, label="(1, 197, 768)"]; -"651 transpose_42" -> "652 transpose_42_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 1, 768)"]; -"652 transpose_42_0_0_nncf_smooth_quant_0" -> "653 quantize_per_tensor_239" [style=solid, label="(197, 1, 768)"]; -"653 quantize_per_tensor_239" -> "654 dequantize_per_tensor_240" [style=solid, label="(197, 1, 768)"]; -"654 dequantize_per_tensor_240" -> "657 linear_28" [style=solid, label="(197, 1, 768)"]; -"655 _frozen_param31" -> "656 dequantize_per_tensor_241" [style=solid, label="(2304, 768)"]; -"656 dequantize_per_tensor_241" -> "657 linear_28" [style=solid, label="(2304, 768)"]; -"657 linear_28" -> "658 quantize_per_tensor_242" [style=solid, label="(197, 1, 2304)"]; -"658 quantize_per_tensor_242" -> "659 dequantize_per_tensor_243" [style=solid, label="(197, 1, 2304)"]; -"659 dequantize_per_tensor_243" -> "660 unflatten_7" [style=solid, label="(197, 1, 2304)"]; -"660 unflatten_7" -> "661 unsqueeze_7" [style=solid, label="(197, 1, 3, 768)"]; -"661 unsqueeze_7" -> "662 transpose_43" [style=solid, label="(1, 197, 1, 3, 768)"]; -"662 transpose_43" -> "663 
squeeze_7" [style=solid, label="(3, 197, 1, 1, 768)"]; -"663 squeeze_7" -> "664 contiguous_7" [style=solid, label="(3, 197, 1, 768)"]; -"664 contiguous_7" -> "665 select_21" [style=solid, label="(3, 197, 1, 768)"]; -"664 contiguous_7" -> "666 select_22" [style=solid, label="(3, 197, 1, 768)"]; -"664 contiguous_7" -> "667 select_23" [style=solid, label="(3, 197, 1, 768)"]; -"665 select_21" -> "668 view_56" [style=solid, label="(197, 1, 768)"]; -"666 select_22" -> "670 view_57" [style=solid, label="(197, 1, 768)"]; -"667 select_23" -> "672 view_58" [style=solid, label="(197, 1, 768)"]; -"668 view_56" -> "669 transpose_44" [style=solid, label="(197, 12, 64)"]; -"669 transpose_44" -> "674 view_59" [style=solid, label="(12, 197, 64)"]; -"670 view_57" -> "671 transpose_45" [style=solid, label="(197, 12, 64)"]; -"671 transpose_45" -> "675 view_60" [style=solid, label="(12, 197, 64)"]; -"672 view_58" -> "673 transpose_46" [style=solid, label="(197, 12, 64)"]; -"673 transpose_46" -> "676 view_61" [style=solid, label="(12, 197, 64)"]; -"674 view_59" -> "677 scaled_dot_product_attention_7" [style=solid, label="(1, 12, 197, 64)"]; -"675 view_60" -> "677 scaled_dot_product_attention_7" [style=solid, label="(1, 12, 197, 64)"]; -"676 view_61" -> "677 scaled_dot_product_attention_7" [style=solid, label="(1, 12, 197, 64)"]; -"677 scaled_dot_product_attention_7" -> "678 permute_8" [style=solid, label="(1, 12, 197, 64)"]; -"678 permute_8" -> "679 view_62" [style=solid, label="(197, 1, 12, 64)"]; -"679 view_62" -> "680 view_62_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 768)"]; -"680 view_62_0_0_nncf_smooth_quant_0" -> "681 quantize_per_tensor_244" [style=solid, label="(197, 768)"]; -"681 quantize_per_tensor_244" -> "682 dequantize_per_tensor_245" [style=solid, label="(197, 768)"]; -"682 dequantize_per_tensor_245" -> "685 linear_29" [style=solid, label="(197, 768)"]; -"683 _frozen_param32" -> "684 dequantize_per_tensor_246" [style=solid, label="(768, 768)"]; -"684 
dequantize_per_tensor_246" -> "685 linear_29" [style=solid, label="(768, 768)"]; -"685 linear_29" -> "686 quantize_per_tensor_247" [style=solid, label="(197, 768)"]; -"686 quantize_per_tensor_247" -> "687 dequantize_per_tensor_248" [style=solid, label="(197, 768)"]; -"687 dequantize_per_tensor_248" -> "688 view_63" [style=solid, label="(197, 768)"]; -"688 view_63" -> "689 quantize_per_tensor_249" [style=solid, label="(197, 1, 768)"]; -"689 quantize_per_tensor_249" -> "690 dequantize_per_tensor_250" [style=solid, label="(197, 1, 768)"]; -"690 dequantize_per_tensor_250" -> "691 transpose_47" [style=solid, label="(197, 1, 768)"]; -"691 transpose_47" -> "692 dropout_22" [style=solid, label="(1, 197, 768)"]; -"692 dropout_22" -> "693 quantize_per_tensor_251" [style=solid, label="(1, 197, 768)"]; -"693 quantize_per_tensor_251" -> "694 dequantize_per_tensor_252" [style=solid, label="(1, 197, 768)"]; -"694 dequantize_per_tensor_252" -> "695 add_15" [style=solid, label="(1, 197, 768)"]; -"695 add_15" -> "696 quantize_per_tensor_253" [style=solid, label="(1, 197, 768)"]; -"696 quantize_per_tensor_253" -> "697 dequantize_per_tensor_254" [style=solid, label="(1, 197, 768)"]; -"696 quantize_per_tensor_253" -> "698 dequantize_per_tensor_255" [style=solid, label="(1, 197, 768)"]; -"697 dequantize_per_tensor_254" -> "721 add_16" [style=solid, label="(1, 197, 768)"]; -"698 dequantize_per_tensor_255" -> "699 layer_norm_15" [style=solid, label="(1, 197, 768)"]; -"699 layer_norm_15" -> "700 layer_norm_15_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 768)"]; -"700 layer_norm_15_0_0_nncf_smooth_quant_0" -> "701 quantize_per_tensor_256" [style=solid, label="(1, 197, 768)"]; -"701 quantize_per_tensor_256" -> "702 dequantize_per_tensor_257" [style=solid, label="(1, 197, 768)"]; -"702 dequantize_per_tensor_257" -> "705 linear_30" [style=solid, label="(1, 197, 768)"]; -"703 _frozen_param33" -> "704 dequantize_per_tensor_258" [style=solid, label="(3072, 768)"]; -"704 
dequantize_per_tensor_258" -> "705 linear_30" [style=solid, label="(3072, 768)"]; -"705 linear_30" -> "706 quantize_per_tensor_259" [style=solid, label="(1, 197, 3072)"]; -"706 quantize_per_tensor_259" -> "707 dequantize_per_tensor_260" [style=solid, label="(1, 197, 3072)"]; -"707 dequantize_per_tensor_260" -> "708 gelu_7" [style=solid, label="(1, 197, 3072)"]; -"708 gelu_7" -> "709 dropout_23" [style=solid, label="(1, 197, 3072)"]; -"709 dropout_23" -> "710 dropout_23_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 3072)"]; -"710 dropout_23_0_0_nncf_smooth_quant_0" -> "711 quantize_per_tensor_261" [style=solid, label="(1, 197, 3072)"]; -"711 quantize_per_tensor_261" -> "712 dequantize_per_tensor_262" [style=solid, label="(1, 197, 3072)"]; -"712 dequantize_per_tensor_262" -> "715 linear_31" [style=solid, label="(1, 197, 3072)"]; -"713 _frozen_param34" -> "714 dequantize_per_tensor_263" [style=solid, label="(768, 3072)"]; -"714 dequantize_per_tensor_263" -> "715 linear_31" [style=solid, label="(768, 3072)"]; -"715 linear_31" -> "716 quantize_per_tensor_264" [style=solid, label="(1, 197, 768)"]; -"716 quantize_per_tensor_264" -> "717 dequantize_per_tensor_265" [style=solid, label="(1, 197, 768)"]; -"717 dequantize_per_tensor_265" -> "718 dropout_24" [style=solid, label="(1, 197, 768)"]; -"718 dropout_24" -> "719 quantize_per_tensor_266" [style=solid, label="(1, 197, 768)"]; -"719 quantize_per_tensor_266" -> "720 dequantize_per_tensor_267" [style=solid, label="(1, 197, 768)"]; -"720 dequantize_per_tensor_267" -> "721 add_16" [style=solid, label="(1, 197, 768)"]; -"721 add_16" -> "722 quantize_per_tensor_268" [style=solid, label="(1, 197, 768)"]; -"722 quantize_per_tensor_268" -> "723 dequantize_per_tensor_269" [style=solid, label="(1, 197, 768)"]; -"722 quantize_per_tensor_268" -> "724 dequantize_per_tensor_270" [style=solid, label="(1, 197, 768)"]; -"723 dequantize_per_tensor_269" -> "770 add_17" [style=solid, label="(1, 197, 768)"]; -"724 
dequantize_per_tensor_270" -> "725 layer_norm_16" [style=solid, label="(1, 197, 768)"]; -"725 layer_norm_16" -> "726 transpose_48" [style=solid, label="(1, 197, 768)"]; -"726 transpose_48" -> "727 transpose_48_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 1, 768)"]; -"727 transpose_48_0_0_nncf_smooth_quant_0" -> "728 quantize_per_tensor_271" [style=solid, label="(197, 1, 768)"]; -"728 quantize_per_tensor_271" -> "729 dequantize_per_tensor_272" [style=solid, label="(197, 1, 768)"]; -"729 dequantize_per_tensor_272" -> "732 linear_32" [style=solid, label="(197, 1, 768)"]; -"730 _frozen_param35" -> "731 dequantize_per_tensor_273" [style=solid, label="(2304, 768)"]; -"731 dequantize_per_tensor_273" -> "732 linear_32" [style=solid, label="(2304, 768)"]; -"732 linear_32" -> "733 quantize_per_tensor_274" [style=solid, label="(197, 1, 2304)"]; -"733 quantize_per_tensor_274" -> "734 dequantize_per_tensor_275" [style=solid, label="(197, 1, 2304)"]; -"734 dequantize_per_tensor_275" -> "735 unflatten_8" [style=solid, label="(197, 1, 2304)"]; -"735 unflatten_8" -> "736 unsqueeze_8" [style=solid, label="(197, 1, 3, 768)"]; -"736 unsqueeze_8" -> "737 transpose_49" [style=solid, label="(1, 197, 1, 3, 768)"]; -"737 transpose_49" -> "738 squeeze_8" [style=solid, label="(3, 197, 1, 1, 768)"]; -"738 squeeze_8" -> "739 contiguous_8" [style=solid, label="(3, 197, 1, 768)"]; -"739 contiguous_8" -> "740 select_24" [style=solid, label="(3, 197, 1, 768)"]; -"739 contiguous_8" -> "741 select_25" [style=solid, label="(3, 197, 1, 768)"]; -"739 contiguous_8" -> "742 select_26" [style=solid, label="(3, 197, 1, 768)"]; -"740 select_24" -> "743 view_64" [style=solid, label="(197, 1, 768)"]; -"741 select_25" -> "745 view_65" [style=solid, label="(197, 1, 768)"]; -"742 select_26" -> "747 view_66" [style=solid, label="(197, 1, 768)"]; -"743 view_64" -> "744 transpose_50" [style=solid, label="(197, 12, 64)"]; -"744 transpose_50" -> "749 view_67" [style=solid, label="(12, 197, 64)"]; -"745 
view_65" -> "746 transpose_51" [style=solid, label="(197, 12, 64)"]; -"746 transpose_51" -> "750 view_68" [style=solid, label="(12, 197, 64)"]; -"747 view_66" -> "748 transpose_52" [style=solid, label="(197, 12, 64)"]; -"748 transpose_52" -> "751 view_69" [style=solid, label="(12, 197, 64)"]; -"749 view_67" -> "752 scaled_dot_product_attention_8" [style=solid, label="(1, 12, 197, 64)"]; -"750 view_68" -> "752 scaled_dot_product_attention_8" [style=solid, label="(1, 12, 197, 64)"]; -"751 view_69" -> "752 scaled_dot_product_attention_8" [style=solid, label="(1, 12, 197, 64)"]; -"752 scaled_dot_product_attention_8" -> "753 permute_9" [style=solid, label="(1, 12, 197, 64)"]; -"753 permute_9" -> "754 view_70" [style=solid, label="(197, 1, 12, 64)"]; -"754 view_70" -> "755 view_70_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 768)"]; -"755 view_70_0_0_nncf_smooth_quant_0" -> "756 quantize_per_tensor_276" [style=solid, label="(197, 768)"]; -"756 quantize_per_tensor_276" -> "757 dequantize_per_tensor_277" [style=solid, label="(197, 768)"]; -"757 dequantize_per_tensor_277" -> "760 linear_33" [style=solid, label="(197, 768)"]; -"758 _frozen_param36" -> "759 dequantize_per_tensor_278" [style=solid, label="(768, 768)"]; -"759 dequantize_per_tensor_278" -> "760 linear_33" [style=solid, label="(768, 768)"]; -"760 linear_33" -> "761 quantize_per_tensor_279" [style=solid, label="(197, 768)"]; -"761 quantize_per_tensor_279" -> "762 dequantize_per_tensor_280" [style=solid, label="(197, 768)"]; -"762 dequantize_per_tensor_280" -> "763 view_71" [style=solid, label="(197, 768)"]; -"763 view_71" -> "764 quantize_per_tensor_281" [style=solid, label="(197, 1, 768)"]; -"764 quantize_per_tensor_281" -> "765 dequantize_per_tensor_282" [style=solid, label="(197, 1, 768)"]; -"765 dequantize_per_tensor_282" -> "766 transpose_53" [style=solid, label="(197, 1, 768)"]; -"766 transpose_53" -> "767 dropout_25" [style=solid, label="(1, 197, 768)"]; -"767 dropout_25" -> "768 
quantize_per_tensor_283" [style=solid, label="(1, 197, 768)"]; -"768 quantize_per_tensor_283" -> "769 dequantize_per_tensor_284" [style=solid, label="(1, 197, 768)"]; -"769 dequantize_per_tensor_284" -> "770 add_17" [style=solid, label="(1, 197, 768)"]; -"770 add_17" -> "771 quantize_per_tensor_285" [style=solid, label="(1, 197, 768)"]; -"771 quantize_per_tensor_285" -> "772 dequantize_per_tensor_286" [style=solid, label="(1, 197, 768)"]; -"771 quantize_per_tensor_285" -> "773 dequantize_per_tensor_287" [style=solid, label="(1, 197, 768)"]; -"772 dequantize_per_tensor_286" -> "796 add_18" [style=solid, label="(1, 197, 768)"]; -"773 dequantize_per_tensor_287" -> "774 layer_norm_17" [style=solid, label="(1, 197, 768)"]; -"774 layer_norm_17" -> "775 layer_norm_17_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 768)"]; -"775 layer_norm_17_0_0_nncf_smooth_quant_0" -> "776 quantize_per_tensor_288" [style=solid, label="(1, 197, 768)"]; -"776 quantize_per_tensor_288" -> "777 dequantize_per_tensor_289" [style=solid, label="(1, 197, 768)"]; -"777 dequantize_per_tensor_289" -> "780 linear_34" [style=solid, label="(1, 197, 768)"]; -"778 _frozen_param37" -> "779 dequantize_per_tensor_290" [style=solid, label="(3072, 768)"]; -"779 dequantize_per_tensor_290" -> "780 linear_34" [style=solid, label="(3072, 768)"]; -"780 linear_34" -> "781 quantize_per_tensor_291" [style=solid, label="(1, 197, 3072)"]; -"781 quantize_per_tensor_291" -> "782 dequantize_per_tensor_292" [style=solid, label="(1, 197, 3072)"]; -"782 dequantize_per_tensor_292" -> "783 gelu_8" [style=solid, label="(1, 197, 3072)"]; -"783 gelu_8" -> "784 dropout_26" [style=solid, label="(1, 197, 3072)"]; -"784 dropout_26" -> "785 dropout_26_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 3072)"]; -"785 dropout_26_0_0_nncf_smooth_quant_0" -> "786 quantize_per_tensor_293" [style=solid, label="(1, 197, 3072)"]; -"786 quantize_per_tensor_293" -> "787 dequantize_per_tensor_294" [style=solid, label="(1, 197, 
3072)"]; -"787 dequantize_per_tensor_294" -> "790 linear_35" [style=solid, label="(1, 197, 3072)"]; -"788 _frozen_param38" -> "789 dequantize_per_tensor_295" [style=solid, label="(768, 3072)"]; -"789 dequantize_per_tensor_295" -> "790 linear_35" [style=solid, label="(768, 3072)"]; -"790 linear_35" -> "791 quantize_per_tensor_296" [style=solid, label="(1, 197, 768)"]; -"791 quantize_per_tensor_296" -> "792 dequantize_per_tensor_297" [style=solid, label="(1, 197, 768)"]; -"792 dequantize_per_tensor_297" -> "793 dropout_27" [style=solid, label="(1, 197, 768)"]; -"793 dropout_27" -> "794 quantize_per_tensor_298" [style=solid, label="(1, 197, 768)"]; -"794 quantize_per_tensor_298" -> "795 dequantize_per_tensor_299" [style=solid, label="(1, 197, 768)"]; -"795 dequantize_per_tensor_299" -> "796 add_18" [style=solid, label="(1, 197, 768)"]; -"796 add_18" -> "797 quantize_per_tensor_300" [style=solid, label="(1, 197, 768)"]; -"797 quantize_per_tensor_300" -> "798 dequantize_per_tensor_301" [style=solid, label="(1, 197, 768)"]; -"797 quantize_per_tensor_300" -> "799 dequantize_per_tensor_302" [style=solid, label="(1, 197, 768)"]; -"798 dequantize_per_tensor_301" -> "845 add_19" [style=solid, label="(1, 197, 768)"]; -"799 dequantize_per_tensor_302" -> "800 layer_norm_18" [style=solid, label="(1, 197, 768)"]; -"800 layer_norm_18" -> "801 transpose_54" [style=solid, label="(1, 197, 768)"]; -"801 transpose_54" -> "802 transpose_54_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 1, 768)"]; -"802 transpose_54_0_0_nncf_smooth_quant_0" -> "803 quantize_per_tensor_303" [style=solid, label="(197, 1, 768)"]; -"803 quantize_per_tensor_303" -> "804 dequantize_per_tensor_304" [style=solid, label="(197, 1, 768)"]; -"804 dequantize_per_tensor_304" -> "807 linear_36" [style=solid, label="(197, 1, 768)"]; -"805 _frozen_param39" -> "806 dequantize_per_tensor_305" [style=solid, label="(2304, 768)"]; -"806 dequantize_per_tensor_305" -> "807 linear_36" [style=solid, label="(2304, 768)"]; 
-"807 linear_36" -> "808 quantize_per_tensor_306" [style=solid, label="(197, 1, 2304)"]; -"808 quantize_per_tensor_306" -> "809 dequantize_per_tensor_307" [style=solid, label="(197, 1, 2304)"]; -"809 dequantize_per_tensor_307" -> "810 unflatten_9" [style=solid, label="(197, 1, 2304)"]; -"810 unflatten_9" -> "811 unsqueeze_9" [style=solid, label="(197, 1, 3, 768)"]; -"811 unsqueeze_9" -> "812 transpose_55" [style=solid, label="(1, 197, 1, 3, 768)"]; -"812 transpose_55" -> "813 squeeze_9" [style=solid, label="(3, 197, 1, 1, 768)"]; -"813 squeeze_9" -> "814 contiguous_9" [style=solid, label="(3, 197, 1, 768)"]; -"814 contiguous_9" -> "815 select_27" [style=solid, label="(3, 197, 1, 768)"]; -"814 contiguous_9" -> "816 select_28" [style=solid, label="(3, 197, 1, 768)"]; -"814 contiguous_9" -> "817 select_29" [style=solid, label="(3, 197, 1, 768)"]; -"815 select_27" -> "818 view_72" [style=solid, label="(197, 1, 768)"]; -"816 select_28" -> "820 view_73" [style=solid, label="(197, 1, 768)"]; -"817 select_29" -> "822 view_74" [style=solid, label="(197, 1, 768)"]; -"818 view_72" -> "819 transpose_56" [style=solid, label="(197, 12, 64)"]; -"819 transpose_56" -> "824 view_75" [style=solid, label="(12, 197, 64)"]; -"820 view_73" -> "821 transpose_57" [style=solid, label="(197, 12, 64)"]; -"821 transpose_57" -> "825 view_76" [style=solid, label="(12, 197, 64)"]; -"822 view_74" -> "823 transpose_58" [style=solid, label="(197, 12, 64)"]; -"823 transpose_58" -> "826 view_77" [style=solid, label="(12, 197, 64)"]; -"824 view_75" -> "827 scaled_dot_product_attention_9" [style=solid, label="(1, 12, 197, 64)"]; -"825 view_76" -> "827 scaled_dot_product_attention_9" [style=solid, label="(1, 12, 197, 64)"]; -"826 view_77" -> "827 scaled_dot_product_attention_9" [style=solid, label="(1, 12, 197, 64)"]; -"827 scaled_dot_product_attention_9" -> "828 permute_10" [style=solid, label="(1, 12, 197, 64)"]; -"828 permute_10" -> "829 view_78" [style=solid, label="(197, 1, 12, 64)"]; -"829 view_78" 
-> "830 view_78_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 768)"]; -"830 view_78_0_0_nncf_smooth_quant_0" -> "831 quantize_per_tensor_308" [style=solid, label="(197, 768)"]; -"831 quantize_per_tensor_308" -> "832 dequantize_per_tensor_309" [style=solid, label="(197, 768)"]; -"832 dequantize_per_tensor_309" -> "835 linear_37" [style=solid, label="(197, 768)"]; -"833 _frozen_param40" -> "834 dequantize_per_tensor_310" [style=solid, label="(768, 768)"]; -"834 dequantize_per_tensor_310" -> "835 linear_37" [style=solid, label="(768, 768)"]; -"835 linear_37" -> "836 quantize_per_tensor_311" [style=solid, label="(197, 768)"]; -"836 quantize_per_tensor_311" -> "837 dequantize_per_tensor_312" [style=solid, label="(197, 768)"]; -"837 dequantize_per_tensor_312" -> "838 view_79" [style=solid, label="(197, 768)"]; -"838 view_79" -> "839 quantize_per_tensor_313" [style=solid, label="(197, 1, 768)"]; -"839 quantize_per_tensor_313" -> "840 dequantize_per_tensor_314" [style=solid, label="(197, 1, 768)"]; -"840 dequantize_per_tensor_314" -> "841 transpose_59" [style=solid, label="(197, 1, 768)"]; -"841 transpose_59" -> "842 dropout_28" [style=solid, label="(1, 197, 768)"]; -"842 dropout_28" -> "843 quantize_per_tensor_315" [style=solid, label="(1, 197, 768)"]; -"843 quantize_per_tensor_315" -> "844 dequantize_per_tensor_316" [style=solid, label="(1, 197, 768)"]; -"844 dequantize_per_tensor_316" -> "845 add_19" [style=solid, label="(1, 197, 768)"]; -"845 add_19" -> "846 quantize_per_tensor_317" [style=solid, label="(1, 197, 768)"]; -"846 quantize_per_tensor_317" -> "847 dequantize_per_tensor_318" [style=solid, label="(1, 197, 768)"]; -"846 quantize_per_tensor_317" -> "848 dequantize_per_tensor_319" [style=solid, label="(1, 197, 768)"]; -"847 dequantize_per_tensor_318" -> "871 add_20" [style=solid, label="(1, 197, 768)"]; -"848 dequantize_per_tensor_319" -> "849 layer_norm_19" [style=solid, label="(1, 197, 768)"]; -"849 layer_norm_19" -> "850 
layer_norm_19_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 768)"]; -"850 layer_norm_19_0_0_nncf_smooth_quant_0" -> "851 quantize_per_tensor_320" [style=solid, label="(1, 197, 768)"]; -"851 quantize_per_tensor_320" -> "852 dequantize_per_tensor_321" [style=solid, label="(1, 197, 768)"]; -"852 dequantize_per_tensor_321" -> "855 linear_38" [style=solid, label="(1, 197, 768)"]; -"853 _frozen_param41" -> "854 dequantize_per_tensor_322" [style=solid, label="(3072, 768)"]; -"854 dequantize_per_tensor_322" -> "855 linear_38" [style=solid, label="(3072, 768)"]; -"855 linear_38" -> "856 quantize_per_tensor_323" [style=solid, label="(1, 197, 3072)"]; -"856 quantize_per_tensor_323" -> "857 dequantize_per_tensor_324" [style=solid, label="(1, 197, 3072)"]; -"857 dequantize_per_tensor_324" -> "858 gelu_9" [style=solid, label="(1, 197, 3072)"]; -"858 gelu_9" -> "859 dropout_29" [style=solid, label="(1, 197, 3072)"]; -"859 dropout_29" -> "860 dropout_29_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 3072)"]; -"860 dropout_29_0_0_nncf_smooth_quant_0" -> "861 quantize_per_tensor_325" [style=solid, label="(1, 197, 3072)"]; -"861 quantize_per_tensor_325" -> "862 dequantize_per_tensor_326" [style=solid, label="(1, 197, 3072)"]; -"862 dequantize_per_tensor_326" -> "865 linear_39" [style=solid, label="(1, 197, 3072)"]; -"863 _frozen_param42" -> "864 dequantize_per_tensor_327" [style=solid, label="(768, 3072)"]; -"864 dequantize_per_tensor_327" -> "865 linear_39" [style=solid, label="(768, 3072)"]; -"865 linear_39" -> "866 quantize_per_tensor_328" [style=solid, label="(1, 197, 768)"]; -"866 quantize_per_tensor_328" -> "867 dequantize_per_tensor_329" [style=solid, label="(1, 197, 768)"]; -"867 dequantize_per_tensor_329" -> "868 dropout_30" [style=solid, label="(1, 197, 768)"]; -"868 dropout_30" -> "869 quantize_per_tensor_330" [style=solid, label="(1, 197, 768)"]; -"869 quantize_per_tensor_330" -> "870 dequantize_per_tensor_331" [style=solid, label="(1, 197, 768)"]; -"870 
dequantize_per_tensor_331" -> "871 add_20" [style=solid, label="(1, 197, 768)"]; -"871 add_20" -> "872 quantize_per_tensor_332" [style=solid, label="(1, 197, 768)"]; -"872 quantize_per_tensor_332" -> "873 dequantize_per_tensor_333" [style=solid, label="(1, 197, 768)"]; -"872 quantize_per_tensor_332" -> "874 dequantize_per_tensor_334" [style=solid, label="(1, 197, 768)"]; -"873 dequantize_per_tensor_333" -> "920 add_21" [style=solid, label="(1, 197, 768)"]; -"874 dequantize_per_tensor_334" -> "875 layer_norm_20" [style=solid, label="(1, 197, 768)"]; -"875 layer_norm_20" -> "876 transpose_60" [style=solid, label="(1, 197, 768)"]; -"876 transpose_60" -> "877 transpose_60_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 1, 768)"]; -"877 transpose_60_0_0_nncf_smooth_quant_0" -> "878 quantize_per_tensor_335" [style=solid, label="(197, 1, 768)"]; -"878 quantize_per_tensor_335" -> "879 dequantize_per_tensor_336" [style=solid, label="(197, 1, 768)"]; -"879 dequantize_per_tensor_336" -> "882 linear_40" [style=solid, label="(197, 1, 768)"]; -"880 _frozen_param43" -> "881 dequantize_per_tensor_337" [style=solid, label="(2304, 768)"]; -"881 dequantize_per_tensor_337" -> "882 linear_40" [style=solid, label="(2304, 768)"]; -"882 linear_40" -> "883 quantize_per_tensor_338" [style=solid, label="(197, 1, 2304)"]; -"883 quantize_per_tensor_338" -> "884 dequantize_per_tensor_339" [style=solid, label="(197, 1, 2304)"]; -"884 dequantize_per_tensor_339" -> "885 unflatten_10" [style=solid, label="(197, 1, 2304)"]; -"885 unflatten_10" -> "886 unsqueeze_10" [style=solid, label="(197, 1, 3, 768)"]; -"886 unsqueeze_10" -> "887 transpose_61" [style=solid, label="(1, 197, 1, 3, 768)"]; -"887 transpose_61" -> "888 squeeze_10" [style=solid, label="(3, 197, 1, 1, 768)"]; -"888 squeeze_10" -> "889 contiguous_10" [style=solid, label="(3, 197, 1, 768)"]; -"889 contiguous_10" -> "890 select_30" [style=solid, label="(3, 197, 1, 768)"]; -"889 contiguous_10" -> "891 select_31" [style=solid, label="(3, 
197, 1, 768)"]; -"889 contiguous_10" -> "892 select_32" [style=solid, label="(3, 197, 1, 768)"]; -"890 select_30" -> "893 view_80" [style=solid, label="(197, 1, 768)"]; -"891 select_31" -> "895 view_81" [style=solid, label="(197, 1, 768)"]; -"892 select_32" -> "897 view_82" [style=solid, label="(197, 1, 768)"]; -"893 view_80" -> "894 transpose_62" [style=solid, label="(197, 12, 64)"]; -"894 transpose_62" -> "899 view_83" [style=solid, label="(12, 197, 64)"]; -"895 view_81" -> "896 transpose_63" [style=solid, label="(197, 12, 64)"]; -"896 transpose_63" -> "900 view_84" [style=solid, label="(12, 197, 64)"]; -"897 view_82" -> "898 transpose_64" [style=solid, label="(197, 12, 64)"]; -"898 transpose_64" -> "901 view_85" [style=solid, label="(12, 197, 64)"]; -"899 view_83" -> "902 scaled_dot_product_attention_10" [style=solid, label="(1, 12, 197, 64)"]; -"900 view_84" -> "902 scaled_dot_product_attention_10" [style=solid, label="(1, 12, 197, 64)"]; -"901 view_85" -> "902 scaled_dot_product_attention_10" [style=solid, label="(1, 12, 197, 64)"]; -"902 scaled_dot_product_attention_10" -> "903 permute_11" [style=solid, label="(1, 12, 197, 64)"]; -"903 permute_11" -> "904 view_86" [style=solid, label="(197, 1, 12, 64)"]; -"904 view_86" -> "905 view_86_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 768)"]; -"905 view_86_0_0_nncf_smooth_quant_0" -> "906 quantize_per_tensor_340" [style=solid, label="(197, 768)"]; -"906 quantize_per_tensor_340" -> "907 dequantize_per_tensor_341" [style=solid, label="(197, 768)"]; -"907 dequantize_per_tensor_341" -> "910 linear_41" [style=solid, label="(197, 768)"]; -"908 _frozen_param44" -> "909 dequantize_per_tensor_342" [style=solid, label="(768, 768)"]; -"909 dequantize_per_tensor_342" -> "910 linear_41" [style=solid, label="(768, 768)"]; -"910 linear_41" -> "911 quantize_per_tensor_343" [style=solid, label="(197, 768)"]; -"911 quantize_per_tensor_343" -> "912 dequantize_per_tensor_344" [style=solid, label="(197, 768)"]; -"912 
dequantize_per_tensor_344" -> "913 view_87" [style=solid, label="(197, 768)"]; -"913 view_87" -> "914 quantize_per_tensor_345" [style=solid, label="(197, 1, 768)"]; -"914 quantize_per_tensor_345" -> "915 dequantize_per_tensor_346" [style=solid, label="(197, 1, 768)"]; -"915 dequantize_per_tensor_346" -> "916 transpose_65" [style=solid, label="(197, 1, 768)"]; -"916 transpose_65" -> "917 dropout_31" [style=solid, label="(1, 197, 768)"]; -"917 dropout_31" -> "918 quantize_per_tensor_347" [style=solid, label="(1, 197, 768)"]; -"918 quantize_per_tensor_347" -> "919 dequantize_per_tensor_348" [style=solid, label="(1, 197, 768)"]; -"919 dequantize_per_tensor_348" -> "920 add_21" [style=solid, label="(1, 197, 768)"]; -"920 add_21" -> "921 quantize_per_tensor_349" [style=solid, label="(1, 197, 768)"]; -"921 quantize_per_tensor_349" -> "922 dequantize_per_tensor_350" [style=solid, label="(1, 197, 768)"]; -"921 quantize_per_tensor_349" -> "923 dequantize_per_tensor_351" [style=solid, label="(1, 197, 768)"]; -"922 dequantize_per_tensor_350" -> "946 add_22" [style=solid, label="(1, 197, 768)"]; -"923 dequantize_per_tensor_351" -> "924 layer_norm_21" [style=solid, label="(1, 197, 768)"]; -"924 layer_norm_21" -> "925 layer_norm_21_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 768)"]; -"925 layer_norm_21_0_0_nncf_smooth_quant_0" -> "926 quantize_per_tensor_352" [style=solid, label="(1, 197, 768)"]; -"926 quantize_per_tensor_352" -> "927 dequantize_per_tensor_353" [style=solid, label="(1, 197, 768)"]; -"927 dequantize_per_tensor_353" -> "930 linear_42" [style=solid, label="(1, 197, 768)"]; -"928 _frozen_param45" -> "929 dequantize_per_tensor_354" [style=solid, label="(3072, 768)"]; -"929 dequantize_per_tensor_354" -> "930 linear_42" [style=solid, label="(3072, 768)"]; -"930 linear_42" -> "931 quantize_per_tensor_355" [style=solid, label="(1, 197, 3072)"]; -"931 quantize_per_tensor_355" -> "932 dequantize_per_tensor_356" [style=solid, label="(1, 197, 3072)"]; -"932 
dequantize_per_tensor_356" -> "933 gelu_10" [style=solid, label="(1, 197, 3072)"]; -"933 gelu_10" -> "934 dropout_32" [style=solid, label="(1, 197, 3072)"]; -"934 dropout_32" -> "935 dropout_32_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 3072)"]; -"935 dropout_32_0_0_nncf_smooth_quant_0" -> "936 quantize_per_tensor_357" [style=solid, label="(1, 197, 3072)"]; -"936 quantize_per_tensor_357" -> "937 dequantize_per_tensor_358" [style=solid, label="(1, 197, 3072)"]; -"937 dequantize_per_tensor_358" -> "940 linear_43" [style=solid, label="(1, 197, 3072)"]; -"938 _frozen_param46" -> "939 dequantize_per_tensor_359" [style=solid, label="(768, 3072)"]; -"939 dequantize_per_tensor_359" -> "940 linear_43" [style=solid, label="(768, 3072)"]; -"940 linear_43" -> "941 quantize_per_tensor_360" [style=solid, label="(1, 197, 768)"]; -"941 quantize_per_tensor_360" -> "942 dequantize_per_tensor_361" [style=solid, label="(1, 197, 768)"]; -"942 dequantize_per_tensor_361" -> "943 dropout_33" [style=solid, label="(1, 197, 768)"]; -"943 dropout_33" -> "944 quantize_per_tensor_362" [style=solid, label="(1, 197, 768)"]; -"944 quantize_per_tensor_362" -> "945 dequantize_per_tensor_363" [style=solid, label="(1, 197, 768)"]; -"945 dequantize_per_tensor_363" -> "946 add_22" [style=solid, label="(1, 197, 768)"]; -"946 add_22" -> "947 quantize_per_tensor_364" [style=solid, label="(1, 197, 768)"]; -"947 quantize_per_tensor_364" -> "948 dequantize_per_tensor_365" [style=solid, label="(1, 197, 768)"]; -"947 quantize_per_tensor_364" -> "949 dequantize_per_tensor_366" [style=solid, label="(1, 197, 768)"]; -"948 dequantize_per_tensor_365" -> "995 add_23" [style=solid, label="(1, 197, 768)"]; -"949 dequantize_per_tensor_366" -> "950 layer_norm_22" [style=solid, label="(1, 197, 768)"]; -"950 layer_norm_22" -> "951 transpose_66" [style=solid, label="(1, 197, 768)"]; -"951 transpose_66" -> "952 transpose_66_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 1, 768)"]; -"952 
transpose_66_0_0_nncf_smooth_quant_0" -> "953 quantize_per_tensor_367" [style=solid, label="(197, 1, 768)"]; -"953 quantize_per_tensor_367" -> "954 dequantize_per_tensor_368" [style=solid, label="(197, 1, 768)"]; -"954 dequantize_per_tensor_368" -> "957 linear_44" [style=solid, label="(197, 1, 768)"]; -"955 _frozen_param47" -> "956 dequantize_per_tensor_369" [style=solid, label="(2304, 768)"]; -"956 dequantize_per_tensor_369" -> "957 linear_44" [style=solid, label="(2304, 768)"]; -"957 linear_44" -> "958 quantize_per_tensor_370" [style=solid, label="(197, 1, 2304)"]; -"958 quantize_per_tensor_370" -> "959 dequantize_per_tensor_371" [style=solid, label="(197, 1, 2304)"]; -"959 dequantize_per_tensor_371" -> "960 unflatten_11" [style=solid, label="(197, 1, 2304)"]; -"960 unflatten_11" -> "961 unsqueeze_11" [style=solid, label="(197, 1, 3, 768)"]; -"961 unsqueeze_11" -> "962 transpose_67" [style=solid, label="(1, 197, 1, 3, 768)"]; -"962 transpose_67" -> "963 squeeze_11" [style=solid, label="(3, 197, 1, 1, 768)"]; -"963 squeeze_11" -> "964 contiguous_11" [style=solid, label="(3, 197, 1, 768)"]; -"964 contiguous_11" -> "965 select_33" [style=solid, label="(3, 197, 1, 768)"]; -"964 contiguous_11" -> "966 select_34" [style=solid, label="(3, 197, 1, 768)"]; -"964 contiguous_11" -> "967 select_35" [style=solid, label="(3, 197, 1, 768)"]; -"965 select_33" -> "968 view_88" [style=solid, label="(197, 1, 768)"]; -"966 select_34" -> "970 view_89" [style=solid, label="(197, 1, 768)"]; -"967 select_35" -> "972 view_90" [style=solid, label="(197, 1, 768)"]; -"968 view_88" -> "969 transpose_68" [style=solid, label="(197, 12, 64)"]; -"969 transpose_68" -> "974 view_91" [style=solid, label="(12, 197, 64)"]; -"970 view_89" -> "971 transpose_69" [style=solid, label="(197, 12, 64)"]; -"971 transpose_69" -> "975 view_92" [style=solid, label="(12, 197, 64)"]; -"972 view_90" -> "973 transpose_70" [style=solid, label="(197, 12, 64)"]; -"973 transpose_70" -> "976 view_93" [style=solid, 
label="(12, 197, 64)"]; -"974 view_91" -> "977 scaled_dot_product_attention_11" [style=solid, label="(1, 12, 197, 64)"]; -"975 view_92" -> "977 scaled_dot_product_attention_11" [style=solid, label="(1, 12, 197, 64)"]; -"976 view_93" -> "977 scaled_dot_product_attention_11" [style=solid, label="(1, 12, 197, 64)"]; -"977 scaled_dot_product_attention_11" -> "978 permute_12" [style=solid, label="(1, 12, 197, 64)"]; -"978 permute_12" -> "979 view_94" [style=solid, label="(197, 1, 12, 64)"]; -"979 view_94" -> "980 view_94_0_0_nncf_smooth_quant_0" [style=solid, label="(197, 768)"]; -"980 view_94_0_0_nncf_smooth_quant_0" -> "981 quantize_per_tensor_372" [style=solid, label="(197, 768)"]; -"981 quantize_per_tensor_372" -> "982 dequantize_per_tensor_373" [style=solid, label="(197, 768)"]; -"982 dequantize_per_tensor_373" -> "985 linear_45" [style=solid, label="(197, 768)"]; -"983 _frozen_param48" -> "984 dequantize_per_tensor_374" [style=solid, label="(768, 768)"]; -"984 dequantize_per_tensor_374" -> "985 linear_45" [style=solid, label="(768, 768)"]; -"985 linear_45" -> "986 quantize_per_tensor_375" [style=solid, label="(197, 768)"]; -"986 quantize_per_tensor_375" -> "987 dequantize_per_tensor_376" [style=solid, label="(197, 768)"]; -"987 dequantize_per_tensor_376" -> "988 view_95" [style=solid, label="(197, 768)"]; -"988 view_95" -> "989 quantize_per_tensor_377" [style=solid, label="(197, 1, 768)"]; -"989 quantize_per_tensor_377" -> "990 dequantize_per_tensor_378" [style=solid, label="(197, 1, 768)"]; -"990 dequantize_per_tensor_378" -> "991 transpose_71" [style=solid, label="(197, 1, 768)"]; -"991 transpose_71" -> "992 dropout_34" [style=solid, label="(1, 197, 768)"]; -"992 dropout_34" -> "993 quantize_per_tensor_379" [style=solid, label="(1, 197, 768)"]; -"993 quantize_per_tensor_379" -> "994 dequantize_per_tensor_380" [style=solid, label="(1, 197, 768)"]; -"994 dequantize_per_tensor_380" -> "995 add_23" [style=solid, label="(1, 197, 768)"]; -"995 add_23" -> "996 
quantize_per_tensor_381" [style=solid, label="(1, 197, 768)"]; -"996 quantize_per_tensor_381" -> "997 dequantize_per_tensor_382" [style=solid, label="(1, 197, 768)"]; -"996 quantize_per_tensor_381" -> "998 dequantize_per_tensor_383" [style=solid, label="(1, 197, 768)"]; -"997 dequantize_per_tensor_382" -> "1021 add_24" [style=solid, label="(1, 197, 768)"]; -"998 dequantize_per_tensor_383" -> "999 layer_norm_23" [style=solid, label="(1, 197, 768)"]; -"999 layer_norm_23" -> "1000 layer_norm_23_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 768)"]; -"1000 layer_norm_23_0_0_nncf_smooth_quant_0" -> "1001 quantize_per_tensor_384" [style=solid, label="(1, 197, 768)"]; -"1001 quantize_per_tensor_384" -> "1002 dequantize_per_tensor_385" [style=solid, label="(1, 197, 768)"]; -"1002 dequantize_per_tensor_385" -> "1005 linear_46" [style=solid, label="(1, 197, 768)"]; -"1003 _frozen_param49" -> "1004 dequantize_per_tensor_386" [style=solid, label="(3072, 768)"]; -"1004 dequantize_per_tensor_386" -> "1005 linear_46" [style=solid, label="(3072, 768)"]; -"1005 linear_46" -> "1006 quantize_per_tensor_387" [style=solid, label="(1, 197, 3072)"]; -"1006 quantize_per_tensor_387" -> "1007 dequantize_per_tensor_388" [style=solid, label="(1, 197, 3072)"]; -"1007 dequantize_per_tensor_388" -> "1008 gelu_11" [style=solid, label="(1, 197, 3072)"]; -"1008 gelu_11" -> "1009 dropout_35" [style=solid, label="(1, 197, 3072)"]; -"1009 dropout_35" -> "1010 dropout_35_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 197, 3072)"]; -"1010 dropout_35_0_0_nncf_smooth_quant_0" -> "1011 quantize_per_tensor_389" [style=solid, label="(1, 197, 3072)"]; -"1011 quantize_per_tensor_389" -> "1012 dequantize_per_tensor_390" [style=solid, label="(1, 197, 3072)"]; -"1012 dequantize_per_tensor_390" -> "1015 linear_47" [style=solid, label="(1, 197, 3072)"]; -"1013 _frozen_param50" -> "1014 dequantize_per_tensor_391" [style=solid, label="(768, 3072)"]; -"1014 dequantize_per_tensor_391" -> "1015 linear_47" 
[style=solid, label="(768, 3072)"]; -"1015 linear_47" -> "1016 quantize_per_tensor_392" [style=solid, label="(1, 197, 768)"]; -"1016 quantize_per_tensor_392" -> "1017 dequantize_per_tensor_393" [style=solid, label="(1, 197, 768)"]; -"1017 dequantize_per_tensor_393" -> "1018 dropout_36" [style=solid, label="(1, 197, 768)"]; -"1018 dropout_36" -> "1019 quantize_per_tensor_394" [style=solid, label="(1, 197, 768)"]; -"1019 quantize_per_tensor_394" -> "1020 dequantize_per_tensor_395" [style=solid, label="(1, 197, 768)"]; -"1020 dequantize_per_tensor_395" -> "1021 add_24" [style=solid, label="(1, 197, 768)"]; -"1021 add_24" -> "1022 quantize_per_tensor_396" [style=solid, label="(1, 197, 768)"]; -"1022 quantize_per_tensor_396" -> "1023 dequantize_per_tensor_397" [style=solid, label="(1, 197, 768)"]; -"1023 dequantize_per_tensor_397" -> "1024 layer_norm_24" [style=solid, label="(1, 197, 768)"]; -"1024 layer_norm_24" -> "1025 slice_1" [style=solid, label="(1, 197, 768)"]; -"1025 slice_1" -> "1026 select_36" [style=solid, label="(1, 197, 768)"]; -"1026 select_36" -> "1027 select_36_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 768)"]; -"1027 select_36_0_0_nncf_smooth_quant_0" -> "1028 quantize_per_tensor_398" [style=solid, label="(1, 768)"]; -"1028 quantize_per_tensor_398" -> "1029 dequantize_per_tensor_399" [style=solid, label="(1, 768)"]; -"1029 dequantize_per_tensor_399" -> "1032 linear_48" [style=solid, label="(1, 768)"]; -"1030 _frozen_param51" -> "1031 dequantize_per_tensor_400" [style=solid, label="(1000, 768)"]; -"1031 dequantize_per_tensor_400" -> "1032 linear_48" [style=solid, label="(1000, 768)"]; -"1032 linear_48" -> "1033 quantize_per_tensor_401" [style=solid, label="(1, 1000)"]; -"1033 quantize_per_tensor_401" -> "1034 dequantize_per_tensor_402" [style=solid, label="(1, 1000)"]; -"1034 dequantize_per_tensor_402" -> "1035 output" [style=solid, label="(1, 1000)"]; -} diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/vit_b_16_ref_qconfig.json 
b/tests/torch2/data/fx/XNNPACKQuantizer/vit_b_16_ref_qconfig.json deleted file mode 100644 index 59589a44871..00000000000 --- a/tests/torch2/data/fx/XNNPACKQuantizer/vit_b_16_ref_qconfig.json +++ /dev/null @@ -1,1764 +0,0 @@ -{ - "quantization_points": { - "('conv2d',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('conv2d',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('reshape',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('cat',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('dropout',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('unflatten',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_1',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('transpose_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_2', 'layer_norm_1')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_2',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('linear_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_3',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_3', 'layer_norm_2')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_4',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('unflatten_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_5',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - 
"per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_15',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('transpose_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_4', 'layer_norm_3')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_6',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_1',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_7',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - 
"('dropout_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_5', 'layer_norm_4')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_8',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('unflatten_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_9',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_23',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('transpose_17',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": 
false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_6', 'layer_norm_5')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_10',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_2',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_11',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_7', 
'layer_norm_6')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_12',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_12',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('unflatten_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_13',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_13',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_31',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('transpose_23',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_8', 'layer_norm_7')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_14',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_14',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_3',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_15',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_15',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_12',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_9', 'layer_norm_8')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_16',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('linear_16',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('unflatten_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_17',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_17',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_39',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('transpose_29',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_10', 'layer_norm_9')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_18',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_18',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": 
false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_4',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_19',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_19',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_15',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_11', 'layer_norm_10')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_20',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_20',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('unflatten_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('linear_21',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_21',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_47',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('transpose_35',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_12', 'layer_norm_11')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_22',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_22',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_5',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_23',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": 
false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_23',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_18',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_12',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_13', 'layer_norm_12')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_24',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_24',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('unflatten_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_25',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_25',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - 
"('view_55',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('transpose_41',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_13',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_14', 'layer_norm_13')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_26',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_26',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_6',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_27',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_27',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_21',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_14',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_15', 'layer_norm_14')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_28',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_28',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('unflatten_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_29',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_29',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_63',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('transpose_47',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('add_15',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_16', 'layer_norm_15')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_30',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_30',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_7',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_31',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_31',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_24',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_16',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_17', 'layer_norm_16')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_32',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_32',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('unflatten_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_33',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_33',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('transpose_53',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('view_71',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_17',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_18', 'layer_norm_17')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('linear_34',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_34',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_8',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_35',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_35',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_27',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_18',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_19', 'layer_norm_18')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_36',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_36',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": 
false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('unflatten_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_37',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_37',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_79',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('transpose_59',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_19',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_20', 'layer_norm_19')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_38',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_38',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - 
"('gelu_9',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_39',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_39',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_30',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_20',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_21', 'layer_norm_20')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_40',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_40',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('unflatten_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_41',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - 
"signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_41',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_87',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('transpose_65',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_21',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_22', 'layer_norm_21')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_42',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_42',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_10',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_43',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('linear_43',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_33',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_22',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_23', 'layer_norm_22')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_44',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_44',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('unflatten_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_45',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_45',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('view_95',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": 
false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('transpose_71',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_23',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('add_24', 'layer_norm_23')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_46',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_46',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('gelu_11',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_47',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_47',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('dropout_36',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - 
"('add_24',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('layer_norm_24',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_48',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear_48',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('output',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - } - }, - "unified_scale_groups": { - "0": [ - 3, - 4, - 5 - ], - "1": [ - 13, - 14 - ], - "2": [ - 31, - 32 - ], - "3": [ - 48, - 49 - ], - "4": [ - 65, - 66 - ], - "5": [ - 82, - 83 - ], - "6": [ - 99, - 100 - ], - "7": [ - 116, - 117 - ], - "8": [ - 133, - 134 - ], - "9": [ - 150, - 151 - ], - "10": [ - 167, - 168 - ], - "11": [ - 184, - 185 - ], - "12": [ - 201, - 202 - ] - }, - "shared_input_operation_set_groups": {} -} \ No newline at end of file diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/yolo11n_sdpa_block.dot b/tests/torch2/data/fx/XNNPACKQuantizer/yolo11n_sdpa_block.dot deleted file mode 100644 index 508b4ddc255..00000000000 --- a/tests/torch2/data/fx/XNNPACKQuantizer/yolo11n_sdpa_block.dot +++ /dev/null @@ -1,57 +0,0 @@ -strict digraph { -"0 x" [id=0, type=input]; -"1 x_0_0_nncf_smooth_quant_0" [id=1, type="call_module"]; -"2 quantize_per_tensor_0" [id=2, type="quantize_per_tensor"]; -"3 dequantize_per_tensor_1" [id=3, 
type="dequantize_per_tensor"]; -"4 _frozen_param0" [id=4, type="get_attr"]; -"5 dequantize_per_tensor_2" [id=5, type="dequantize_per_tensor"]; -"6 linear" [id=6, type=linear]; -"7 quantize_per_tensor_3" [id=7, type="quantize_per_tensor"]; -"8 dequantize_per_tensor_4" [id=8, type="dequantize_per_tensor"]; -"9 dequantize_per_tensor_5" [id=9, type="dequantize_per_tensor"]; -"10 dequantize_per_tensor_6" [id=10, type="dequantize_per_tensor"]; -"11 slice_1" [id=11, type=slice]; -"12 slice_2" [id=12, type=slice]; -"13 slice_3" [id=13, type=slice]; -"14 slice_4" [id=14, type=slice]; -"15 slice_5" [id=15, type=slice]; -"16 slice_6" [id=16, type=slice]; -"17 slice_7" [id=17, type=slice]; -"18 slice_8" [id=18, type=slice]; -"19 slice_9" [id=19, type=slice]; -"20 transpose" [id=20, type=transpose]; -"21 matmul" [id=21, type=matmul]; -"22 div_" [id=22, type="div_"]; -"23 softmax" [id=23, type=softmax]; -"24 transpose_1" [id=24, type=transpose]; -"25 matmul_1" [id=25, type=matmul]; -"26 output" [id=26, type=output]; -"0 x" -> "1 x_0_0_nncf_smooth_quant_0" [style=solid, label="(1, 2, 4)"]; -"1 x_0_0_nncf_smooth_quant_0" -> "2 quantize_per_tensor_0" [style=solid, label="(1, 2, 4)"]; -"2 quantize_per_tensor_0" -> "3 dequantize_per_tensor_1" [style=solid, label="(1, 2, 4)"]; -"3 dequantize_per_tensor_1" -> "6 linear" [style=solid, label="(1, 2, 4)"]; -"4 _frozen_param0" -> "5 dequantize_per_tensor_2" [style=solid, label="(12, 4)"]; -"5 dequantize_per_tensor_2" -> "6 linear" [style=solid, label="(12, 4)"]; -"6 linear" -> "7 quantize_per_tensor_3" [style=solid, label="(1, 2, 12)"]; -"7 quantize_per_tensor_3" -> "8 dequantize_per_tensor_4" [style=solid, label="(1, 2, 12)"]; -"7 quantize_per_tensor_3" -> "9 dequantize_per_tensor_5" [style=solid, label="(1, 2, 12)"]; -"7 quantize_per_tensor_3" -> "10 dequantize_per_tensor_6" [style=solid, label="(1, 2, 12)"]; -"8 dequantize_per_tensor_4" -> "17 slice_7" [style=solid, label="(1, 2, 12)"]; -"9 dequantize_per_tensor_5" -> "14 slice_4" 
[style=solid, label="(1, 2, 12)"]; -"10 dequantize_per_tensor_6" -> "11 slice_1" [style=solid, label="(1, 2, 12)"]; -"11 slice_1" -> "12 slice_2" [style=solid, label="(1, 2, 12)"]; -"12 slice_2" -> "13 slice_3" [style=solid, label="(1, 2, 12)"]; -"13 slice_3" -> "21 matmul" [style=solid, label="(1, 2, 4)"]; -"14 slice_4" -> "15 slice_5" [style=solid, label="(1, 2, 12)"]; -"15 slice_5" -> "16 slice_6" [style=solid, label="(1, 2, 12)"]; -"16 slice_6" -> "20 transpose" [style=solid, label="(1, 2, 4)"]; -"17 slice_7" -> "18 slice_8" [style=solid, label="(1, 2, 12)"]; -"18 slice_8" -> "19 slice_9" [style=solid, label="(1, 2, 12)"]; -"19 slice_9" -> "25 matmul_1" [style=solid, label="(1, 2, 4)"]; -"20 transpose" -> "21 matmul" [style=solid, label="(1, 4, 2)"]; -"21 matmul" -> "22 div_" [style=solid, label="(1, 2, 2)"]; -"22 div_" -> "23 softmax" [style=solid, label="(1, 2, 2)"]; -"23 softmax" -> "24 transpose_1" [style=solid, label="(1, 2, 2)"]; -"24 transpose_1" -> "25 matmul_1" [style=solid, label="(1, 2, 2)"]; -"25 matmul_1" -> "26 output" [style=solid, label="(1, 2, 4)"]; -} diff --git a/tests/torch2/data/fx/XNNPACKQuantizer/yolo11n_sdpa_block_ref_qconfig.json b/tests/torch2/data/fx/XNNPACKQuantizer/yolo11n_sdpa_block_ref_qconfig.json deleted file mode 100644 index c51f5fc2951..00000000000 --- a/tests/torch2/data/fx/XNNPACKQuantizer/yolo11n_sdpa_block_ref_qconfig.json +++ /dev/null @@ -1,30 +0,0 @@ -{ - "quantization_points": { - "('linear',)_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - }, - "('linear',)_WeightQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "symmetric", - "signedness_to_force": false, - "per_channel": false, - "narrow_range": true, - "dest_dtype": "INT8" - }, - "('slice_1', 'slice_4', 'slice_7')_ActivationQuantizationInsertionPoint": { - "num_bits": 8, - "mode": "asymmetric", - "signedness_to_force": 
false, - "per_channel": false, - "narrow_range": false, - "dest_dtype": "INT8" - } - }, - "unified_scale_groups": {}, - "shared_input_operation_set_groups": {} -} \ No newline at end of file diff --git a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/mobilenet_v3_small.dot b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/mobilenet_v3_small.dot index 5a0bb73d036..7a91c75981d 100644 --- a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/mobilenet_v3_small.dot +++ b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/mobilenet_v3_small.dot @@ -1,11 +1,11 @@ strict digraph { "0 _scale_0" [id=0, type="get_attr"]; "1 _zero_point_0" [id=1, type="get_attr"]; -"2 _frozen_param0" [id=2, type="get_attr"]; +"2 quantize_per_channel_default" [id=2, type="get_attr"]; "3 dequantize_per_channel_default" [id=3, type="dequantize_per_channel"]; "4 _scale_1" [id=4, type="get_attr"]; "5 _zero_point_1" [id=5, type="get_attr"]; -"6 _frozen_param1" [id=6, type="get_attr"]; +"6 quantize_per_channel_default_1" [id=6, type="get_attr"]; "7 dequantize_per_channel_default_1" [id=7, type="dequantize_per_channel"]; "8 features_1_block_1_fc1_weight" [id=8, type="get_attr"]; "9 features_1_block_1_fc1_bias" [id=9, type="get_attr"]; @@ -13,39 +13,39 @@ strict digraph { "11 features_1_block_1_fc2_bias" [id=11, type="get_attr"]; "12 _scale_2" [id=12, type="get_attr"]; "13 _zero_point_2" [id=13, type="get_attr"]; -"14 _frozen_param2" [id=14, type="get_attr"]; +"14 quantize_per_channel_default_2" [id=14, type="get_attr"]; "15 dequantize_per_channel_default_2" [id=15, type="dequantize_per_channel"]; "16 _scale_3" [id=16, type="get_attr"]; "17 _zero_point_3" [id=17, type="get_attr"]; -"18 _frozen_param3" [id=18, type="get_attr"]; +"18 quantize_per_channel_default_3" [id=18, type="get_attr"]; "19 dequantize_per_channel_default_3" [id=19, type="dequantize_per_channel"]; "20 _scale_4" [id=20, type="get_attr"]; "21 _zero_point_4" [id=21, type="get_attr"]; 
-"22 _frozen_param4" [id=22, type="get_attr"]; +"22 quantize_per_channel_default_4" [id=22, type="get_attr"]; "23 dequantize_per_channel_default_4" [id=23, type="dequantize_per_channel"]; "24 _scale_5" [id=24, type="get_attr"]; "25 _zero_point_5" [id=25, type="get_attr"]; -"26 _frozen_param5" [id=26, type="get_attr"]; +"26 quantize_per_channel_default_5" [id=26, type="get_attr"]; "27 dequantize_per_channel_default_5" [id=27, type="dequantize_per_channel"]; "28 _scale_6" [id=28, type="get_attr"]; "29 _zero_point_6" [id=29, type="get_attr"]; -"30 _frozen_param6" [id=30, type="get_attr"]; +"30 quantize_per_channel_default_6" [id=30, type="get_attr"]; "31 dequantize_per_channel_default_6" [id=31, type="dequantize_per_channel"]; "32 _scale_7" [id=32, type="get_attr"]; "33 _zero_point_7" [id=33, type="get_attr"]; -"34 _frozen_param7" [id=34, type="get_attr"]; +"34 quantize_per_channel_default_7" [id=34, type="get_attr"]; "35 dequantize_per_channel_default_7" [id=35, type="dequantize_per_channel"]; "36 _scale_8" [id=36, type="get_attr"]; "37 _zero_point_8" [id=37, type="get_attr"]; -"38 _frozen_param8" [id=38, type="get_attr"]; +"38 quantize_per_channel_default_8" [id=38, type="get_attr"]; "39 dequantize_per_channel_default_8" [id=39, type="dequantize_per_channel"]; "40 _scale_9" [id=40, type="get_attr"]; "41 _zero_point_9" [id=41, type="get_attr"]; -"42 _frozen_param9" [id=42, type="get_attr"]; +"42 quantize_per_channel_default_9" [id=42, type="get_attr"]; "43 dequantize_per_channel_default_9" [id=43, type="dequantize_per_channel"]; "44 _scale_10" [id=44, type="get_attr"]; "45 _zero_point_10" [id=45, type="get_attr"]; -"46 _frozen_param10" [id=46, type="get_attr"]; +"46 quantize_per_channel_default_10" [id=46, type="get_attr"]; "47 dequantize_per_channel_default_10" [id=47, type="dequantize_per_channel"]; "48 features_4_block_2_fc1_weight" [id=48, type="get_attr"]; "49 features_4_block_2_fc1_bias" [id=49, type="get_attr"]; @@ -53,15 +53,15 @@ strict digraph { "51 
features_4_block_2_fc2_bias" [id=51, type="get_attr"]; "52 _scale_11" [id=52, type="get_attr"]; "53 _zero_point_11" [id=53, type="get_attr"]; -"54 _frozen_param11" [id=54, type="get_attr"]; +"54 quantize_per_channel_default_11" [id=54, type="get_attr"]; "55 dequantize_per_channel_default_11" [id=55, type="dequantize_per_channel"]; "56 _scale_12" [id=56, type="get_attr"]; "57 _zero_point_12" [id=57, type="get_attr"]; -"58 _frozen_param12" [id=58, type="get_attr"]; +"58 quantize_per_channel_default_12" [id=58, type="get_attr"]; "59 dequantize_per_channel_default_12" [id=59, type="dequantize_per_channel"]; "60 _scale_13" [id=60, type="get_attr"]; "61 _zero_point_13" [id=61, type="get_attr"]; -"62 _frozen_param13" [id=62, type="get_attr"]; +"62 quantize_per_channel_default_13" [id=62, type="get_attr"]; "63 dequantize_per_channel_default_13" [id=63, type="dequantize_per_channel"]; "64 features_5_block_2_fc1_weight" [id=64, type="get_attr"]; "65 features_5_block_2_fc1_bias" [id=65, type="get_attr"]; @@ -69,15 +69,15 @@ strict digraph { "67 features_5_block_2_fc2_bias" [id=67, type="get_attr"]; "68 _scale_14" [id=68, type="get_attr"]; "69 _zero_point_14" [id=69, type="get_attr"]; -"70 _frozen_param14" [id=70, type="get_attr"]; +"70 quantize_per_channel_default_14" [id=70, type="get_attr"]; "71 dequantize_per_channel_default_14" [id=71, type="dequantize_per_channel"]; "72 _scale_15" [id=72, type="get_attr"]; "73 _zero_point_15" [id=73, type="get_attr"]; -"74 _frozen_param15" [id=74, type="get_attr"]; +"74 quantize_per_channel_default_15" [id=74, type="get_attr"]; "75 dequantize_per_channel_default_15" [id=75, type="dequantize_per_channel"]; "76 _scale_16" [id=76, type="get_attr"]; "77 _zero_point_16" [id=77, type="get_attr"]; -"78 _frozen_param16" [id=78, type="get_attr"]; +"78 quantize_per_channel_default_16" [id=78, type="get_attr"]; "79 dequantize_per_channel_default_16" [id=79, type="dequantize_per_channel"]; "80 features_6_block_2_fc1_weight" [id=80, type="get_attr"]; 
"81 features_6_block_2_fc1_bias" [id=81, type="get_attr"]; @@ -85,15 +85,15 @@ strict digraph { "83 features_6_block_2_fc2_bias" [id=83, type="get_attr"]; "84 _scale_17" [id=84, type="get_attr"]; "85 _zero_point_17" [id=85, type="get_attr"]; -"86 _frozen_param17" [id=86, type="get_attr"]; +"86 quantize_per_channel_default_17" [id=86, type="get_attr"]; "87 dequantize_per_channel_default_17" [id=87, type="dequantize_per_channel"]; "88 _scale_18" [id=88, type="get_attr"]; "89 _zero_point_18" [id=89, type="get_attr"]; -"90 _frozen_param18" [id=90, type="get_attr"]; +"90 quantize_per_channel_default_18" [id=90, type="get_attr"]; "91 dequantize_per_channel_default_18" [id=91, type="dequantize_per_channel"]; "92 _scale_19" [id=92, type="get_attr"]; "93 _zero_point_19" [id=93, type="get_attr"]; -"94 _frozen_param19" [id=94, type="get_attr"]; +"94 quantize_per_channel_default_19" [id=94, type="get_attr"]; "95 dequantize_per_channel_default_19" [id=95, type="dequantize_per_channel"]; "96 features_7_block_2_fc1_weight" [id=96, type="get_attr"]; "97 features_7_block_2_fc1_bias" [id=97, type="get_attr"]; @@ -101,15 +101,15 @@ strict digraph { "99 features_7_block_2_fc2_bias" [id=99, type="get_attr"]; "100 _scale_20" [id=100, type="get_attr"]; "101 _zero_point_20" [id=101, type="get_attr"]; -"102 _frozen_param20" [id=102, type="get_attr"]; +"102 quantize_per_channel_default_20" [id=102, type="get_attr"]; "103 dequantize_per_channel_default_20" [id=103, type="dequantize_per_channel"]; "104 _scale_21" [id=104, type="get_attr"]; "105 _zero_point_21" [id=105, type="get_attr"]; -"106 _frozen_param21" [id=106, type="get_attr"]; +"106 quantize_per_channel_default_21" [id=106, type="get_attr"]; "107 dequantize_per_channel_default_21" [id=107, type="dequantize_per_channel"]; "108 _scale_22" [id=108, type="get_attr"]; "109 _zero_point_22" [id=109, type="get_attr"]; -"110 _frozen_param22" [id=110, type="get_attr"]; +"110 quantize_per_channel_default_22" [id=110, type="get_attr"]; "111 
dequantize_per_channel_default_22" [id=111, type="dequantize_per_channel"]; "112 features_8_block_2_fc1_weight" [id=112, type="get_attr"]; "113 features_8_block_2_fc1_bias" [id=113, type="get_attr"]; @@ -117,15 +117,15 @@ strict digraph { "115 features_8_block_2_fc2_bias" [id=115, type="get_attr"]; "116 _scale_23" [id=116, type="get_attr"]; "117 _zero_point_23" [id=117, type="get_attr"]; -"118 _frozen_param23" [id=118, type="get_attr"]; +"118 quantize_per_channel_default_23" [id=118, type="get_attr"]; "119 dequantize_per_channel_default_23" [id=119, type="dequantize_per_channel"]; "120 _scale_24" [id=120, type="get_attr"]; "121 _zero_point_24" [id=121, type="get_attr"]; -"122 _frozen_param24" [id=122, type="get_attr"]; +"122 quantize_per_channel_default_24" [id=122, type="get_attr"]; "123 dequantize_per_channel_default_24" [id=123, type="dequantize_per_channel"]; "124 _scale_25" [id=124, type="get_attr"]; "125 _zero_point_25" [id=125, type="get_attr"]; -"126 _frozen_param25" [id=126, type="get_attr"]; +"126 quantize_per_channel_default_25" [id=126, type="get_attr"]; "127 dequantize_per_channel_default_25" [id=127, type="dequantize_per_channel"]; "128 features_9_block_2_fc1_weight" [id=128, type="get_attr"]; "129 features_9_block_2_fc1_bias" [id=129, type="get_attr"]; @@ -133,15 +133,15 @@ strict digraph { "131 features_9_block_2_fc2_bias" [id=131, type="get_attr"]; "132 _scale_26" [id=132, type="get_attr"]; "133 _zero_point_26" [id=133, type="get_attr"]; -"134 _frozen_param26" [id=134, type="get_attr"]; +"134 quantize_per_channel_default_26" [id=134, type="get_attr"]; "135 dequantize_per_channel_default_26" [id=135, type="dequantize_per_channel"]; "136 _scale_27" [id=136, type="get_attr"]; "137 _zero_point_27" [id=137, type="get_attr"]; -"138 _frozen_param27" [id=138, type="get_attr"]; +"138 quantize_per_channel_default_27" [id=138, type="get_attr"]; "139 dequantize_per_channel_default_27" [id=139, type="dequantize_per_channel"]; "140 _scale_28" [id=140, 
type="get_attr"]; "141 _zero_point_28" [id=141, type="get_attr"]; -"142 _frozen_param28" [id=142, type="get_attr"]; +"142 quantize_per_channel_default_28" [id=142, type="get_attr"]; "143 dequantize_per_channel_default_28" [id=143, type="dequantize_per_channel"]; "144 features_10_block_2_fc1_weight" [id=144, type="get_attr"]; "145 features_10_block_2_fc1_bias" [id=145, type="get_attr"]; @@ -149,15 +149,15 @@ strict digraph { "147 features_10_block_2_fc2_bias" [id=147, type="get_attr"]; "148 _scale_29" [id=148, type="get_attr"]; "149 _zero_point_29" [id=149, type="get_attr"]; -"150 _frozen_param29" [id=150, type="get_attr"]; +"150 quantize_per_channel_default_29" [id=150, type="get_attr"]; "151 dequantize_per_channel_default_29" [id=151, type="dequantize_per_channel"]; "152 _scale_30" [id=152, type="get_attr"]; "153 _zero_point_30" [id=153, type="get_attr"]; -"154 _frozen_param30" [id=154, type="get_attr"]; +"154 quantize_per_channel_default_30" [id=154, type="get_attr"]; "155 dequantize_per_channel_default_30" [id=155, type="dequantize_per_channel"]; "156 _scale_31" [id=156, type="get_attr"]; "157 _zero_point_31" [id=157, type="get_attr"]; -"158 _frozen_param31" [id=158, type="get_attr"]; +"158 quantize_per_channel_default_31" [id=158, type="get_attr"]; "159 dequantize_per_channel_default_31" [id=159, type="dequantize_per_channel"]; "160 features_11_block_2_fc1_weight" [id=160, type="get_attr"]; "161 features_11_block_2_fc1_bias" [id=161, type="get_attr"]; @@ -165,20 +165,20 @@ strict digraph { "163 features_11_block_2_fc2_bias" [id=163, type="get_attr"]; "164 _scale_32" [id=164, type="get_attr"]; "165 _zero_point_32" [id=165, type="get_attr"]; -"166 _frozen_param32" [id=166, type="get_attr"]; +"166 quantize_per_channel_default_32" [id=166, type="get_attr"]; "167 dequantize_per_channel_default_32" [id=167, type="dequantize_per_channel"]; "168 _scale_33" [id=168, type="get_attr"]; "169 _zero_point_33" [id=169, type="get_attr"]; -"170 _frozen_param33" [id=170, 
type="get_attr"]; +"170 quantize_per_channel_default_33" [id=170, type="get_attr"]; "171 dequantize_per_channel_default_33" [id=171, type="dequantize_per_channel"]; "172 _scale_34" [id=172, type="get_attr"]; "173 _zero_point_34" [id=173, type="get_attr"]; -"174 _frozen_param34" [id=174, type="get_attr"]; +"174 quantize_per_channel_default_34" [id=174, type="get_attr"]; "175 dequantize_per_channel_default_34" [id=175, type="dequantize_per_channel"]; "176 classifier_0_bias" [id=176, type="get_attr"]; "177 _scale_35" [id=177, type="get_attr"]; "178 _zero_point_35" [id=178, type="get_attr"]; -"179 _frozen_param35" [id=179, type="get_attr"]; +"179 quantize_per_channel_default_35" [id=179, type="get_attr"]; "180 dequantize_per_channel_default_35" [id=180, type="dequantize_per_channel"]; "181 classifier_3_bias" [id=181, type="get_attr"]; "182 x" [id=182, type=input]; @@ -501,11 +501,11 @@ strict digraph { "499 output" [id=499, type=output]; "0 _scale_0" -> "3 dequantize_per_channel_default" [style=solid, label="(16,)"]; "1 _zero_point_0" -> "3 dequantize_per_channel_default" [style=solid, label="(16,)"]; -"2 _frozen_param0" -> "3 dequantize_per_channel_default" [style=solid, label="(16, 3, 3, 3)"]; +"2 quantize_per_channel_default" -> "3 dequantize_per_channel_default" [style=solid, label="(16, 3, 3, 3)"]; "3 dequantize_per_channel_default" -> "186 conv2d" [style=solid, label=None]; "4 _scale_1" -> "7 dequantize_per_channel_default_1" [style=solid, label="(16,)"]; "5 _zero_point_1" -> "7 dequantize_per_channel_default_1" [style=solid, label="(16,)"]; -"6 _frozen_param1" -> "7 dequantize_per_channel_default_1" [style=solid, label="(16, 1, 3, 3)"]; +"6 quantize_per_channel_default_1" -> "7 dequantize_per_channel_default_1" [style=solid, label="(16, 1, 3, 3)"]; "7 dequantize_per_channel_default_1" -> "193 conv2d_1" [style=solid, label=None]; "8 features_1_block_1_fc1_weight" -> "199 conv2d_2" [style=solid, label="(8, 16, 1, 1)"]; "9 features_1_block_1_fc1_bias" -> "199 
conv2d_2" [style=solid, label="(8,)"]; @@ -513,39 +513,39 @@ strict digraph { "11 features_1_block_1_fc2_bias" -> "201 conv2d_3" [style=solid, label="(16,)"]; "12 _scale_2" -> "15 dequantize_per_channel_default_2" [style=solid, label="(16,)"]; "13 _zero_point_2" -> "15 dequantize_per_channel_default_2" [style=solid, label="(16,)"]; -"14 _frozen_param2" -> "15 dequantize_per_channel_default_2" [style=solid, label="(16, 16, 1, 1)"]; +"14 quantize_per_channel_default_2" -> "15 dequantize_per_channel_default_2" [style=solid, label="(16, 16, 1, 1)"]; "15 dequantize_per_channel_default_2" -> "209 conv2d_4" [style=solid, label=None]; "16 _scale_3" -> "19 dequantize_per_channel_default_3" [style=solid, label="(72,)"]; "17 _zero_point_3" -> "19 dequantize_per_channel_default_3" [style=solid, label="(72,)"]; -"18 _frozen_param3" -> "19 dequantize_per_channel_default_3" [style=solid, label="(72, 16, 1, 1)"]; +"18 quantize_per_channel_default_3" -> "19 dequantize_per_channel_default_3" [style=solid, label="(72, 16, 1, 1)"]; "19 dequantize_per_channel_default_3" -> "213 conv2d_5" [style=solid, label=None]; "20 _scale_4" -> "23 dequantize_per_channel_default_4" [style=solid, label="(72,)"]; "21 _zero_point_4" -> "23 dequantize_per_channel_default_4" [style=solid, label="(72,)"]; -"22 _frozen_param4" -> "23 dequantize_per_channel_default_4" [style=solid, label="(72, 1, 3, 3)"]; +"22 quantize_per_channel_default_4" -> "23 dequantize_per_channel_default_4" [style=solid, label="(72, 1, 3, 3)"]; "23 dequantize_per_channel_default_4" -> "220 conv2d_6" [style=solid, label=None]; "24 _scale_5" -> "27 dequantize_per_channel_default_5" [style=solid, label="(24,)"]; "25 _zero_point_5" -> "27 dequantize_per_channel_default_5" [style=solid, label="(24,)"]; -"26 _frozen_param5" -> "27 dequantize_per_channel_default_5" [style=solid, label="(24, 72, 1, 1)"]; +"26 quantize_per_channel_default_5" -> "27 dequantize_per_channel_default_5" [style=solid, label="(24, 72, 1, 1)"]; "27 
dequantize_per_channel_default_5" -> "225 conv2d_7" [style=solid, label=None]; "28 _scale_6" -> "31 dequantize_per_channel_default_6" [style=solid, label="(88,)"]; "29 _zero_point_6" -> "31 dequantize_per_channel_default_6" [style=solid, label="(88,)"]; -"30 _frozen_param6" -> "31 dequantize_per_channel_default_6" [style=solid, label="(88, 24, 1, 1)"]; +"30 quantize_per_channel_default_6" -> "31 dequantize_per_channel_default_6" [style=solid, label="(88, 24, 1, 1)"]; "31 dequantize_per_channel_default_6" -> "230 conv2d_8" [style=solid, label=None]; "32 _scale_7" -> "35 dequantize_per_channel_default_7" [style=solid, label="(88,)"]; "33 _zero_point_7" -> "35 dequantize_per_channel_default_7" [style=solid, label="(88,)"]; -"34 _frozen_param7" -> "35 dequantize_per_channel_default_7" [style=solid, label="(88, 1, 3, 3)"]; +"34 quantize_per_channel_default_7" -> "35 dequantize_per_channel_default_7" [style=solid, label="(88, 1, 3, 3)"]; "35 dequantize_per_channel_default_7" -> "237 conv2d_9" [style=solid, label=None]; "36 _scale_8" -> "39 dequantize_per_channel_default_8" [style=solid, label="(24,)"]; "37 _zero_point_8" -> "39 dequantize_per_channel_default_8" [style=solid, label="(24,)"]; -"38 _frozen_param8" -> "39 dequantize_per_channel_default_8" [style=solid, label="(24, 88, 1, 1)"]; +"38 quantize_per_channel_default_8" -> "39 dequantize_per_channel_default_8" [style=solid, label="(24, 88, 1, 1)"]; "39 dequantize_per_channel_default_8" -> "242 conv2d_10" [style=solid, label=None]; "40 _scale_9" -> "43 dequantize_per_channel_default_9" [style=solid, label="(96,)"]; "41 _zero_point_9" -> "43 dequantize_per_channel_default_9" [style=solid, label="(96,)"]; -"42 _frozen_param9" -> "43 dequantize_per_channel_default_9" [style=solid, label="(96, 24, 1, 1)"]; +"42 quantize_per_channel_default_9" -> "43 dequantize_per_channel_default_9" [style=solid, label="(96, 24, 1, 1)"]; "43 dequantize_per_channel_default_9" -> "249 conv2d_11" [style=solid, label=None]; "44 _scale_10" 
-> "47 dequantize_per_channel_default_10" [style=solid, label="(96,)"]; "45 _zero_point_10" -> "47 dequantize_per_channel_default_10" [style=solid, label="(96,)"]; -"46 _frozen_param10" -> "47 dequantize_per_channel_default_10" [style=solid, label="(96, 1, 5, 5)"]; +"46 quantize_per_channel_default_10" -> "47 dequantize_per_channel_default_10" [style=solid, label="(96, 1, 5, 5)"]; "47 dequantize_per_channel_default_10" -> "256 conv2d_12" [style=solid, label=None]; "48 features_4_block_2_fc1_weight" -> "262 conv2d_13" [style=solid, label="(24, 96, 1, 1)"]; "49 features_4_block_2_fc1_bias" -> "262 conv2d_13" [style=solid, label="(24,)"]; @@ -553,15 +553,15 @@ strict digraph { "51 features_4_block_2_fc2_bias" -> "264 conv2d_14" [style=solid, label="(96,)"]; "52 _scale_11" -> "55 dequantize_per_channel_default_11" [style=solid, label="(40,)"]; "53 _zero_point_11" -> "55 dequantize_per_channel_default_11" [style=solid, label="(40,)"]; -"54 _frozen_param11" -> "55 dequantize_per_channel_default_11" [style=solid, label="(40, 96, 1, 1)"]; +"54 quantize_per_channel_default_11" -> "55 dequantize_per_channel_default_11" [style=solid, label="(40, 96, 1, 1)"]; "55 dequantize_per_channel_default_11" -> "272 conv2d_15" [style=solid, label=None]; "56 _scale_12" -> "59 dequantize_per_channel_default_12" [style=solid, label="(240,)"]; "57 _zero_point_12" -> "59 dequantize_per_channel_default_12" [style=solid, label="(240,)"]; -"58 _frozen_param12" -> "59 dequantize_per_channel_default_12" [style=solid, label="(240, 40, 1, 1)"]; +"58 quantize_per_channel_default_12" -> "59 dequantize_per_channel_default_12" [style=solid, label="(240, 40, 1, 1)"]; "59 dequantize_per_channel_default_12" -> "277 conv2d_16" [style=solid, label=None]; "60 _scale_13" -> "63 dequantize_per_channel_default_13" [style=solid, label="(240,)"]; "61 _zero_point_13" -> "63 dequantize_per_channel_default_13" [style=solid, label="(240,)"]; -"62 _frozen_param13" -> "63 dequantize_per_channel_default_13" [style=solid, 
label="(240, 1, 5, 5)"]; +"62 quantize_per_channel_default_13" -> "63 dequantize_per_channel_default_13" [style=solid, label="(240, 1, 5, 5)"]; "63 dequantize_per_channel_default_13" -> "284 conv2d_17" [style=solid, label=None]; "64 features_5_block_2_fc1_weight" -> "290 conv2d_18" [style=solid, label="(64, 240, 1, 1)"]; "65 features_5_block_2_fc1_bias" -> "290 conv2d_18" [style=solid, label="(64,)"]; @@ -569,15 +569,15 @@ strict digraph { "67 features_5_block_2_fc2_bias" -> "292 conv2d_19" [style=solid, label="(240,)"]; "68 _scale_14" -> "71 dequantize_per_channel_default_14" [style=solid, label="(40,)"]; "69 _zero_point_14" -> "71 dequantize_per_channel_default_14" [style=solid, label="(40,)"]; -"70 _frozen_param14" -> "71 dequantize_per_channel_default_14" [style=solid, label="(40, 240, 1, 1)"]; +"70 quantize_per_channel_default_14" -> "71 dequantize_per_channel_default_14" [style=solid, label="(40, 240, 1, 1)"]; "71 dequantize_per_channel_default_14" -> "300 conv2d_20" [style=solid, label=None]; "72 _scale_15" -> "75 dequantize_per_channel_default_15" [style=solid, label="(240,)"]; "73 _zero_point_15" -> "75 dequantize_per_channel_default_15" [style=solid, label="(240,)"]; -"74 _frozen_param15" -> "75 dequantize_per_channel_default_15" [style=solid, label="(240, 40, 1, 1)"]; +"74 quantize_per_channel_default_15" -> "75 dequantize_per_channel_default_15" [style=solid, label="(240, 40, 1, 1)"]; "75 dequantize_per_channel_default_15" -> "308 conv2d_21" [style=solid, label=None]; "76 _scale_16" -> "79 dequantize_per_channel_default_16" [style=solid, label="(240,)"]; "77 _zero_point_16" -> "79 dequantize_per_channel_default_16" [style=solid, label="(240,)"]; -"78 _frozen_param16" -> "79 dequantize_per_channel_default_16" [style=solid, label="(240, 1, 5, 5)"]; +"78 quantize_per_channel_default_16" -> "79 dequantize_per_channel_default_16" [style=solid, label="(240, 1, 5, 5)"]; "79 dequantize_per_channel_default_16" -> "315 conv2d_22" [style=solid, label=None]; "80 
features_6_block_2_fc1_weight" -> "321 conv2d_23" [style=solid, label="(64, 240, 1, 1)"]; "81 features_6_block_2_fc1_bias" -> "321 conv2d_23" [style=solid, label="(64,)"]; @@ -585,15 +585,15 @@ strict digraph { "83 features_6_block_2_fc2_bias" -> "323 conv2d_24" [style=solid, label="(240,)"]; "84 _scale_17" -> "87 dequantize_per_channel_default_17" [style=solid, label="(40,)"]; "85 _zero_point_17" -> "87 dequantize_per_channel_default_17" [style=solid, label="(40,)"]; -"86 _frozen_param17" -> "87 dequantize_per_channel_default_17" [style=solid, label="(40, 240, 1, 1)"]; +"86 quantize_per_channel_default_17" -> "87 dequantize_per_channel_default_17" [style=solid, label="(40, 240, 1, 1)"]; "87 dequantize_per_channel_default_17" -> "331 conv2d_25" [style=solid, label=None]; "88 _scale_18" -> "91 dequantize_per_channel_default_18" [style=solid, label="(120,)"]; "89 _zero_point_18" -> "91 dequantize_per_channel_default_18" [style=solid, label="(120,)"]; -"90 _frozen_param18" -> "91 dequantize_per_channel_default_18" [style=solid, label="(120, 40, 1, 1)"]; +"90 quantize_per_channel_default_18" -> "91 dequantize_per_channel_default_18" [style=solid, label="(120, 40, 1, 1)"]; "91 dequantize_per_channel_default_18" -> "338 conv2d_26" [style=solid, label=None]; "92 _scale_19" -> "95 dequantize_per_channel_default_19" [style=solid, label="(120,)"]; "93 _zero_point_19" -> "95 dequantize_per_channel_default_19" [style=solid, label="(120,)"]; -"94 _frozen_param19" -> "95 dequantize_per_channel_default_19" [style=solid, label="(120, 1, 5, 5)"]; +"94 quantize_per_channel_default_19" -> "95 dequantize_per_channel_default_19" [style=solid, label="(120, 1, 5, 5)"]; "95 dequantize_per_channel_default_19" -> "345 conv2d_27" [style=solid, label=None]; "96 features_7_block_2_fc1_weight" -> "351 conv2d_28" [style=solid, label="(32, 120, 1, 1)"]; "97 features_7_block_2_fc1_bias" -> "351 conv2d_28" [style=solid, label="(32,)"]; @@ -601,15 +601,15 @@ strict digraph { "99 
features_7_block_2_fc2_bias" -> "353 conv2d_29" [style=solid, label="(120,)"]; "100 _scale_20" -> "103 dequantize_per_channel_default_20" [style=solid, label="(48,)"]; "101 _zero_point_20" -> "103 dequantize_per_channel_default_20" [style=solid, label="(48,)"]; -"102 _frozen_param20" -> "103 dequantize_per_channel_default_20" [style=solid, label="(48, 120, 1, 1)"]; +"102 quantize_per_channel_default_20" -> "103 dequantize_per_channel_default_20" [style=solid, label="(48, 120, 1, 1)"]; "103 dequantize_per_channel_default_20" -> "361 conv2d_30" [style=solid, label=None]; "104 _scale_21" -> "107 dequantize_per_channel_default_21" [style=solid, label="(144,)"]; "105 _zero_point_21" -> "107 dequantize_per_channel_default_21" [style=solid, label="(144,)"]; -"106 _frozen_param21" -> "107 dequantize_per_channel_default_21" [style=solid, label="(144, 48, 1, 1)"]; +"106 quantize_per_channel_default_21" -> "107 dequantize_per_channel_default_21" [style=solid, label="(144, 48, 1, 1)"]; "107 dequantize_per_channel_default_21" -> "366 conv2d_31" [style=solid, label=None]; "108 _scale_22" -> "111 dequantize_per_channel_default_22" [style=solid, label="(144,)"]; "109 _zero_point_22" -> "111 dequantize_per_channel_default_22" [style=solid, label="(144,)"]; -"110 _frozen_param22" -> "111 dequantize_per_channel_default_22" [style=solid, label="(144, 1, 5, 5)"]; +"110 quantize_per_channel_default_22" -> "111 dequantize_per_channel_default_22" [style=solid, label="(144, 1, 5, 5)"]; "111 dequantize_per_channel_default_22" -> "373 conv2d_32" [style=solid, label=None]; "112 features_8_block_2_fc1_weight" -> "379 conv2d_33" [style=solid, label="(40, 144, 1, 1)"]; "113 features_8_block_2_fc1_bias" -> "379 conv2d_33" [style=solid, label="(40,)"]; @@ -617,15 +617,15 @@ strict digraph { "115 features_8_block_2_fc2_bias" -> "381 conv2d_34" [style=solid, label="(144,)"]; "116 _scale_23" -> "119 dequantize_per_channel_default_23" [style=solid, label="(48,)"]; "117 _zero_point_23" -> "119 
dequantize_per_channel_default_23" [style=solid, label="(48,)"]; -"118 _frozen_param23" -> "119 dequantize_per_channel_default_23" [style=solid, label="(48, 144, 1, 1)"]; +"118 quantize_per_channel_default_23" -> "119 dequantize_per_channel_default_23" [style=solid, label="(48, 144, 1, 1)"]; "119 dequantize_per_channel_default_23" -> "389 conv2d_35" [style=solid, label=None]; "120 _scale_24" -> "123 dequantize_per_channel_default_24" [style=solid, label="(288,)"]; "121 _zero_point_24" -> "123 dequantize_per_channel_default_24" [style=solid, label="(288,)"]; -"122 _frozen_param24" -> "123 dequantize_per_channel_default_24" [style=solid, label="(288, 48, 1, 1)"]; +"122 quantize_per_channel_default_24" -> "123 dequantize_per_channel_default_24" [style=solid, label="(288, 48, 1, 1)"]; "123 dequantize_per_channel_default_24" -> "396 conv2d_36" [style=solid, label=None]; "124 _scale_25" -> "127 dequantize_per_channel_default_25" [style=solid, label="(288,)"]; "125 _zero_point_25" -> "127 dequantize_per_channel_default_25" [style=solid, label="(288,)"]; -"126 _frozen_param25" -> "127 dequantize_per_channel_default_25" [style=solid, label="(288, 1, 5, 5)"]; +"126 quantize_per_channel_default_25" -> "127 dequantize_per_channel_default_25" [style=solid, label="(288, 1, 5, 5)"]; "127 dequantize_per_channel_default_25" -> "403 conv2d_37" [style=solid, label=None]; "128 features_9_block_2_fc1_weight" -> "409 conv2d_38" [style=solid, label="(72, 288, 1, 1)"]; "129 features_9_block_2_fc1_bias" -> "409 conv2d_38" [style=solid, label="(72,)"]; @@ -633,15 +633,15 @@ strict digraph { "131 features_9_block_2_fc2_bias" -> "411 conv2d_39" [style=solid, label="(288,)"]; "132 _scale_26" -> "135 dequantize_per_channel_default_26" [style=solid, label="(96,)"]; "133 _zero_point_26" -> "135 dequantize_per_channel_default_26" [style=solid, label="(96,)"]; -"134 _frozen_param26" -> "135 dequantize_per_channel_default_26" [style=solid, label="(96, 288, 1, 1)"]; +"134 
quantize_per_channel_default_26" -> "135 dequantize_per_channel_default_26" [style=solid, label="(96, 288, 1, 1)"]; "135 dequantize_per_channel_default_26" -> "419 conv2d_40" [style=solid, label=None]; "136 _scale_27" -> "139 dequantize_per_channel_default_27" [style=solid, label="(576,)"]; "137 _zero_point_27" -> "139 dequantize_per_channel_default_27" [style=solid, label="(576,)"]; -"138 _frozen_param27" -> "139 dequantize_per_channel_default_27" [style=solid, label="(576, 96, 1, 1)"]; +"138 quantize_per_channel_default_27" -> "139 dequantize_per_channel_default_27" [style=solid, label="(576, 96, 1, 1)"]; "139 dequantize_per_channel_default_27" -> "424 conv2d_41" [style=solid, label=None]; "140 _scale_28" -> "143 dequantize_per_channel_default_28" [style=solid, label="(576,)"]; "141 _zero_point_28" -> "143 dequantize_per_channel_default_28" [style=solid, label="(576,)"]; -"142 _frozen_param28" -> "143 dequantize_per_channel_default_28" [style=solid, label="(576, 1, 5, 5)"]; +"142 quantize_per_channel_default_28" -> "143 dequantize_per_channel_default_28" [style=solid, label="(576, 1, 5, 5)"]; "143 dequantize_per_channel_default_28" -> "431 conv2d_42" [style=solid, label=None]; "144 features_10_block_2_fc1_weight" -> "437 conv2d_43" [style=solid, label="(144, 576, 1, 1)"]; "145 features_10_block_2_fc1_bias" -> "437 conv2d_43" [style=solid, label="(144,)"]; @@ -649,15 +649,15 @@ strict digraph { "147 features_10_block_2_fc2_bias" -> "439 conv2d_44" [style=solid, label="(576,)"]; "148 _scale_29" -> "151 dequantize_per_channel_default_29" [style=solid, label="(96,)"]; "149 _zero_point_29" -> "151 dequantize_per_channel_default_29" [style=solid, label="(96,)"]; -"150 _frozen_param29" -> "151 dequantize_per_channel_default_29" [style=solid, label="(96, 576, 1, 1)"]; +"150 quantize_per_channel_default_29" -> "151 dequantize_per_channel_default_29" [style=solid, label="(96, 576, 1, 1)"]; "151 dequantize_per_channel_default_29" -> "447 conv2d_45" [style=solid, 
label=None]; "152 _scale_30" -> "155 dequantize_per_channel_default_30" [style=solid, label="(576,)"]; "153 _zero_point_30" -> "155 dequantize_per_channel_default_30" [style=solid, label="(576,)"]; -"154 _frozen_param30" -> "155 dequantize_per_channel_default_30" [style=solid, label="(576, 96, 1, 1)"]; +"154 quantize_per_channel_default_30" -> "155 dequantize_per_channel_default_30" [style=solid, label="(576, 96, 1, 1)"]; "155 dequantize_per_channel_default_30" -> "455 conv2d_46" [style=solid, label=None]; "156 _scale_31" -> "159 dequantize_per_channel_default_31" [style=solid, label="(576,)"]; "157 _zero_point_31" -> "159 dequantize_per_channel_default_31" [style=solid, label="(576,)"]; -"158 _frozen_param31" -> "159 dequantize_per_channel_default_31" [style=solid, label="(576, 1, 5, 5)"]; +"158 quantize_per_channel_default_31" -> "159 dequantize_per_channel_default_31" [style=solid, label="(576, 1, 5, 5)"]; "159 dequantize_per_channel_default_31" -> "462 conv2d_47" [style=solid, label=None]; "160 features_11_block_2_fc1_weight" -> "468 conv2d_48" [style=solid, label="(144, 576, 1, 1)"]; "161 features_11_block_2_fc1_bias" -> "468 conv2d_48" [style=solid, label="(144,)"]; @@ -665,20 +665,20 @@ strict digraph { "163 features_11_block_2_fc2_bias" -> "470 conv2d_49" [style=solid, label="(576,)"]; "164 _scale_32" -> "167 dequantize_per_channel_default_32" [style=solid, label="(96,)"]; "165 _zero_point_32" -> "167 dequantize_per_channel_default_32" [style=solid, label="(96,)"]; -"166 _frozen_param32" -> "167 dequantize_per_channel_default_32" [style=solid, label="(96, 576, 1, 1)"]; +"166 quantize_per_channel_default_32" -> "167 dequantize_per_channel_default_32" [style=solid, label="(96, 576, 1, 1)"]; "167 dequantize_per_channel_default_32" -> "478 conv2d_50" [style=solid, label=None]; "168 _scale_33" -> "171 dequantize_per_channel_default_33" [style=solid, label="(576,)"]; "169 _zero_point_33" -> "171 dequantize_per_channel_default_33" [style=solid, label="(576,)"]; 
-"170 _frozen_param33" -> "171 dequantize_per_channel_default_33" [style=solid, label="(576, 96, 1, 1)"]; +"170 quantize_per_channel_default_33" -> "171 dequantize_per_channel_default_33" [style=solid, label="(576, 96, 1, 1)"]; "171 dequantize_per_channel_default_33" -> "485 conv2d_51" [style=solid, label=None]; "172 _scale_34" -> "175 dequantize_per_channel_default_34" [style=solid, label="(1024,)"]; "173 _zero_point_34" -> "175 dequantize_per_channel_default_34" [style=solid, label="(1024,)"]; -"174 _frozen_param34" -> "175 dequantize_per_channel_default_34" [style=solid, label="(1024, 576)"]; +"174 quantize_per_channel_default_34" -> "175 dequantize_per_channel_default_34" [style=solid, label="(1024, 576)"]; "175 dequantize_per_channel_default_34" -> "493 linear" [style=solid, label=None]; "176 classifier_0_bias" -> "493 linear" [style=solid, label="(1024,)"]; "177 _scale_35" -> "180 dequantize_per_channel_default_35" [style=solid, label="(1000,)"]; "178 _zero_point_35" -> "180 dequantize_per_channel_default_35" [style=solid, label="(1000,)"]; -"179 _frozen_param35" -> "180 dequantize_per_channel_default_35" [style=solid, label="(1000, 1024)"]; +"179 quantize_per_channel_default_35" -> "180 dequantize_per_channel_default_35" [style=solid, label="(1000, 1024)"]; "180 dequantize_per_channel_default_35" -> "498 linear_1" [style=solid, label=None]; "181 classifier_3_bias" -> "498 linear_1" [style=solid, label="(1000,)"]; "182 x" -> "183 quantize_per_tensor_default" [style=solid, label="(1, 3, 224, 224)"]; diff --git a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/resnet18.dot b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/resnet18.dot index d04fa19316d..93e6cf7748a 100644 --- a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/resnet18.dot +++ b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/resnet18.dot @@ -1,87 +1,87 @@ strict digraph { "0 _scale_0" [id=0, type="get_attr"]; "1 _zero_point_0" [id=1, 
type="get_attr"]; -"2 _frozen_param0" [id=2, type="get_attr"]; +"2 quantize_per_channel_default" [id=2, type="get_attr"]; "3 dequantize_per_channel_default" [id=3, type="dequantize_per_channel"]; "4 _scale_1" [id=4, type="get_attr"]; "5 _zero_point_1" [id=5, type="get_attr"]; -"6 _frozen_param1" [id=6, type="get_attr"]; +"6 quantize_per_channel_default_1" [id=6, type="get_attr"]; "7 dequantize_per_channel_default_1" [id=7, type="dequantize_per_channel"]; "8 _scale_2" [id=8, type="get_attr"]; "9 _zero_point_2" [id=9, type="get_attr"]; -"10 _frozen_param2" [id=10, type="get_attr"]; +"10 quantize_per_channel_default_2" [id=10, type="get_attr"]; "11 dequantize_per_channel_default_2" [id=11, type="dequantize_per_channel"]; "12 _scale_3" [id=12, type="get_attr"]; "13 _zero_point_3" [id=13, type="get_attr"]; -"14 _frozen_param3" [id=14, type="get_attr"]; +"14 quantize_per_channel_default_3" [id=14, type="get_attr"]; "15 dequantize_per_channel_default_3" [id=15, type="dequantize_per_channel"]; "16 _scale_4" [id=16, type="get_attr"]; "17 _zero_point_4" [id=17, type="get_attr"]; -"18 _frozen_param4" [id=18, type="get_attr"]; +"18 quantize_per_channel_default_4" [id=18, type="get_attr"]; "19 dequantize_per_channel_default_4" [id=19, type="dequantize_per_channel"]; "20 _scale_5" [id=20, type="get_attr"]; "21 _zero_point_5" [id=21, type="get_attr"]; -"22 _frozen_param5" [id=22, type="get_attr"]; +"22 quantize_per_channel_default_5" [id=22, type="get_attr"]; "23 dequantize_per_channel_default_5" [id=23, type="dequantize_per_channel"]; "24 _scale_6" [id=24, type="get_attr"]; "25 _zero_point_6" [id=25, type="get_attr"]; -"26 _frozen_param6" [id=26, type="get_attr"]; +"26 quantize_per_channel_default_6" [id=26, type="get_attr"]; "27 dequantize_per_channel_default_6" [id=27, type="dequantize_per_channel"]; "28 _scale_7" [id=28, type="get_attr"]; "29 _zero_point_7" [id=29, type="get_attr"]; -"30 _frozen_param7" [id=30, type="get_attr"]; +"30 quantize_per_channel_default_7" [id=30, 
type="get_attr"]; "31 dequantize_per_channel_default_7" [id=31, type="dequantize_per_channel"]; "32 _scale_8" [id=32, type="get_attr"]; "33 _zero_point_8" [id=33, type="get_attr"]; -"34 _frozen_param8" [id=34, type="get_attr"]; +"34 quantize_per_channel_default_8" [id=34, type="get_attr"]; "35 dequantize_per_channel_default_8" [id=35, type="dequantize_per_channel"]; "36 _scale_9" [id=36, type="get_attr"]; "37 _zero_point_9" [id=37, type="get_attr"]; -"38 _frozen_param9" [id=38, type="get_attr"]; +"38 quantize_per_channel_default_9" [id=38, type="get_attr"]; "39 dequantize_per_channel_default_9" [id=39, type="dequantize_per_channel"]; "40 _scale_10" [id=40, type="get_attr"]; "41 _zero_point_10" [id=41, type="get_attr"]; -"42 _frozen_param10" [id=42, type="get_attr"]; +"42 quantize_per_channel_default_10" [id=42, type="get_attr"]; "43 dequantize_per_channel_default_10" [id=43, type="dequantize_per_channel"]; "44 _scale_11" [id=44, type="get_attr"]; "45 _zero_point_11" [id=45, type="get_attr"]; -"46 _frozen_param11" [id=46, type="get_attr"]; +"46 quantize_per_channel_default_11" [id=46, type="get_attr"]; "47 dequantize_per_channel_default_11" [id=47, type="dequantize_per_channel"]; "48 _scale_12" [id=48, type="get_attr"]; "49 _zero_point_12" [id=49, type="get_attr"]; -"50 _frozen_param12" [id=50, type="get_attr"]; +"50 quantize_per_channel_default_12" [id=50, type="get_attr"]; "51 dequantize_per_channel_default_12" [id=51, type="dequantize_per_channel"]; "52 _scale_13" [id=52, type="get_attr"]; "53 _zero_point_13" [id=53, type="get_attr"]; -"54 _frozen_param13" [id=54, type="get_attr"]; +"54 quantize_per_channel_default_13" [id=54, type="get_attr"]; "55 dequantize_per_channel_default_13" [id=55, type="dequantize_per_channel"]; "56 _scale_14" [id=56, type="get_attr"]; "57 _zero_point_14" [id=57, type="get_attr"]; -"58 _frozen_param14" [id=58, type="get_attr"]; +"58 quantize_per_channel_default_14" [id=58, type="get_attr"]; "59 dequantize_per_channel_default_14" [id=59, 
type="dequantize_per_channel"]; "60 _scale_15" [id=60, type="get_attr"]; "61 _zero_point_15" [id=61, type="get_attr"]; -"62 _frozen_param15" [id=62, type="get_attr"]; +"62 quantize_per_channel_default_15" [id=62, type="get_attr"]; "63 dequantize_per_channel_default_15" [id=63, type="dequantize_per_channel"]; "64 _scale_16" [id=64, type="get_attr"]; "65 _zero_point_16" [id=65, type="get_attr"]; -"66 _frozen_param16" [id=66, type="get_attr"]; +"66 quantize_per_channel_default_16" [id=66, type="get_attr"]; "67 dequantize_per_channel_default_16" [id=67, type="dequantize_per_channel"]; "68 _scale_17" [id=68, type="get_attr"]; "69 _zero_point_17" [id=69, type="get_attr"]; -"70 _frozen_param17" [id=70, type="get_attr"]; +"70 quantize_per_channel_default_17" [id=70, type="get_attr"]; "71 dequantize_per_channel_default_17" [id=71, type="dequantize_per_channel"]; "72 _scale_18" [id=72, type="get_attr"]; "73 _zero_point_18" [id=73, type="get_attr"]; -"74 _frozen_param18" [id=74, type="get_attr"]; +"74 quantize_per_channel_default_18" [id=74, type="get_attr"]; "75 dequantize_per_channel_default_18" [id=75, type="dequantize_per_channel"]; "76 _scale_19" [id=76, type="get_attr"]; "77 _zero_point_19" [id=77, type="get_attr"]; -"78 _frozen_param19" [id=78, type="get_attr"]; +"78 quantize_per_channel_default_19" [id=78, type="get_attr"]; "79 dequantize_per_channel_default_19" [id=79, type="dequantize_per_channel"]; "80 _scale_20" [id=80, type="get_attr"]; "81 _zero_point_20" [id=81, type="get_attr"]; -"82 _frozen_param20" [id=82, type="get_attr"]; +"82 quantize_per_channel_default_20" [id=82, type="get_attr"]; "83 dequantize_per_channel_default_20" [id=83, type="dequantize_per_channel"]; "84 fc_bias" [id=84, type="get_attr"]; "85 x" [id=85, type=input]; @@ -224,87 +224,87 @@ strict digraph { "222 output" [id=222, type=output]; "0 _scale_0" -> "3 dequantize_per_channel_default" [style=solid, label="(64,)"]; "1 _zero_point_0" -> "3 dequantize_per_channel_default" [style=solid, 
label="(64,)"]; -"2 _frozen_param0" -> "3 dequantize_per_channel_default" [style=solid, label="(64, 3, 7, 7)"]; +"2 quantize_per_channel_default" -> "3 dequantize_per_channel_default" [style=solid, label="(64, 3, 7, 7)"]; "3 dequantize_per_channel_default" -> "89 conv2d" [style=solid, label=None]; "4 _scale_1" -> "7 dequantize_per_channel_default_1" [style=solid, label="(64,)"]; "5 _zero_point_1" -> "7 dequantize_per_channel_default_1" [style=solid, label="(64,)"]; -"6 _frozen_param1" -> "7 dequantize_per_channel_default_1" [style=solid, label="(64, 64, 3, 3)"]; +"6 quantize_per_channel_default_1" -> "7 dequantize_per_channel_default_1" [style=solid, label="(64, 64, 3, 3)"]; "7 dequantize_per_channel_default_1" -> "95 conv2d_1" [style=solid, label=None]; "8 _scale_2" -> "11 dequantize_per_channel_default_2" [style=solid, label="(64,)"]; "9 _zero_point_2" -> "11 dequantize_per_channel_default_2" [style=solid, label="(64,)"]; -"10 _frozen_param2" -> "11 dequantize_per_channel_default_2" [style=solid, label="(64, 64, 3, 3)"]; +"10 quantize_per_channel_default_2" -> "11 dequantize_per_channel_default_2" [style=solid, label="(64, 64, 3, 3)"]; "11 dequantize_per_channel_default_2" -> "100 conv2d_2" [style=solid, label=None]; "12 _scale_3" -> "15 dequantize_per_channel_default_3" [style=solid, label="(64,)"]; "13 _zero_point_3" -> "15 dequantize_per_channel_default_3" [style=solid, label="(64,)"]; -"14 _frozen_param3" -> "15 dequantize_per_channel_default_3" [style=solid, label="(64, 64, 3, 3)"]; +"14 quantize_per_channel_default_3" -> "15 dequantize_per_channel_default_3" [style=solid, label="(64, 64, 3, 3)"]; "15 dequantize_per_channel_default_3" -> "109 conv2d_3" [style=solid, label=None]; "16 _scale_4" -> "19 dequantize_per_channel_default_4" [style=solid, label="(64,)"]; "17 _zero_point_4" -> "19 dequantize_per_channel_default_4" [style=solid, label="(64,)"]; -"18 _frozen_param4" -> "19 dequantize_per_channel_default_4" [style=solid, label="(64, 64, 3, 3)"]; +"18 
quantize_per_channel_default_4" -> "19 dequantize_per_channel_default_4" [style=solid, label="(64, 64, 3, 3)"]; "19 dequantize_per_channel_default_4" -> "114 conv2d_4" [style=solid, label=None]; "20 _scale_5" -> "23 dequantize_per_channel_default_5" [style=solid, label="(128,)"]; "21 _zero_point_5" -> "23 dequantize_per_channel_default_5" [style=solid, label="(128,)"]; -"22 _frozen_param5" -> "23 dequantize_per_channel_default_5" [style=solid, label="(128, 64, 3, 3)"]; +"22 quantize_per_channel_default_5" -> "23 dequantize_per_channel_default_5" [style=solid, label="(128, 64, 3, 3)"]; "23 dequantize_per_channel_default_5" -> "123 conv2d_5" [style=solid, label=None]; "24 _scale_6" -> "27 dequantize_per_channel_default_6" [style=solid, label="(128,)"]; "25 _zero_point_6" -> "27 dequantize_per_channel_default_6" [style=solid, label="(128,)"]; -"26 _frozen_param6" -> "27 dequantize_per_channel_default_6" [style=solid, label="(128, 128, 3, 3)"]; +"26 quantize_per_channel_default_6" -> "27 dequantize_per_channel_default_6" [style=solid, label="(128, 128, 3, 3)"]; "27 dequantize_per_channel_default_6" -> "128 conv2d_6" [style=solid, label=None]; "28 _scale_7" -> "31 dequantize_per_channel_default_7" [style=solid, label="(128,)"]; "29 _zero_point_7" -> "31 dequantize_per_channel_default_7" [style=solid, label="(128,)"]; -"30 _frozen_param7" -> "31 dequantize_per_channel_default_7" [style=solid, label="(128, 64, 1, 1)"]; +"30 quantize_per_channel_default_7" -> "31 dequantize_per_channel_default_7" [style=solid, label="(128, 64, 1, 1)"]; "31 dequantize_per_channel_default_7" -> "132 conv2d_7" [style=solid, label=None]; "32 _scale_8" -> "35 dequantize_per_channel_default_8" [style=solid, label="(128,)"]; "33 _zero_point_8" -> "35 dequantize_per_channel_default_8" [style=solid, label="(128,)"]; -"34 _frozen_param8" -> "35 dequantize_per_channel_default_8" [style=solid, label="(128, 128, 3, 3)"]; +"34 quantize_per_channel_default_8" -> "35 dequantize_per_channel_default_8" 
[style=solid, label="(128, 128, 3, 3)"]; "35 dequantize_per_channel_default_8" -> "141 conv2d_8" [style=solid, label=None]; "36 _scale_9" -> "39 dequantize_per_channel_default_9" [style=solid, label="(128,)"]; "37 _zero_point_9" -> "39 dequantize_per_channel_default_9" [style=solid, label="(128,)"]; -"38 _frozen_param9" -> "39 dequantize_per_channel_default_9" [style=solid, label="(128, 128, 3, 3)"]; +"38 quantize_per_channel_default_9" -> "39 dequantize_per_channel_default_9" [style=solid, label="(128, 128, 3, 3)"]; "39 dequantize_per_channel_default_9" -> "146 conv2d_9" [style=solid, label=None]; "40 _scale_10" -> "43 dequantize_per_channel_default_10" [style=solid, label="(256,)"]; "41 _zero_point_10" -> "43 dequantize_per_channel_default_10" [style=solid, label="(256,)"]; -"42 _frozen_param10" -> "43 dequantize_per_channel_default_10" [style=solid, label="(256, 128, 3, 3)"]; +"42 quantize_per_channel_default_10" -> "43 dequantize_per_channel_default_10" [style=solid, label="(256, 128, 3, 3)"]; "43 dequantize_per_channel_default_10" -> "155 conv2d_10" [style=solid, label=None]; "44 _scale_11" -> "47 dequantize_per_channel_default_11" [style=solid, label="(256,)"]; "45 _zero_point_11" -> "47 dequantize_per_channel_default_11" [style=solid, label="(256,)"]; -"46 _frozen_param11" -> "47 dequantize_per_channel_default_11" [style=solid, label="(256, 256, 3, 3)"]; +"46 quantize_per_channel_default_11" -> "47 dequantize_per_channel_default_11" [style=solid, label="(256, 256, 3, 3)"]; "47 dequantize_per_channel_default_11" -> "160 conv2d_11" [style=solid, label=None]; "48 _scale_12" -> "51 dequantize_per_channel_default_12" [style=solid, label="(256,)"]; "49 _zero_point_12" -> "51 dequantize_per_channel_default_12" [style=solid, label="(256,)"]; -"50 _frozen_param12" -> "51 dequantize_per_channel_default_12" [style=solid, label="(256, 128, 1, 1)"]; +"50 quantize_per_channel_default_12" -> "51 dequantize_per_channel_default_12" [style=solid, label="(256, 128, 1, 1)"]; 
"51 dequantize_per_channel_default_12" -> "164 conv2d_12" [style=solid, label=None]; "52 _scale_13" -> "55 dequantize_per_channel_default_13" [style=solid, label="(256,)"]; "53 _zero_point_13" -> "55 dequantize_per_channel_default_13" [style=solid, label="(256,)"]; -"54 _frozen_param13" -> "55 dequantize_per_channel_default_13" [style=solid, label="(256, 256, 3, 3)"]; +"54 quantize_per_channel_default_13" -> "55 dequantize_per_channel_default_13" [style=solid, label="(256, 256, 3, 3)"]; "55 dequantize_per_channel_default_13" -> "173 conv2d_13" [style=solid, label=None]; "56 _scale_14" -> "59 dequantize_per_channel_default_14" [style=solid, label="(256,)"]; "57 _zero_point_14" -> "59 dequantize_per_channel_default_14" [style=solid, label="(256,)"]; -"58 _frozen_param14" -> "59 dequantize_per_channel_default_14" [style=solid, label="(256, 256, 3, 3)"]; +"58 quantize_per_channel_default_14" -> "59 dequantize_per_channel_default_14" [style=solid, label="(256, 256, 3, 3)"]; "59 dequantize_per_channel_default_14" -> "178 conv2d_14" [style=solid, label=None]; "60 _scale_15" -> "63 dequantize_per_channel_default_15" [style=solid, label="(512,)"]; "61 _zero_point_15" -> "63 dequantize_per_channel_default_15" [style=solid, label="(512,)"]; -"62 _frozen_param15" -> "63 dequantize_per_channel_default_15" [style=solid, label="(512, 256, 3, 3)"]; +"62 quantize_per_channel_default_15" -> "63 dequantize_per_channel_default_15" [style=solid, label="(512, 256, 3, 3)"]; "63 dequantize_per_channel_default_15" -> "187 conv2d_15" [style=solid, label=None]; "64 _scale_16" -> "67 dequantize_per_channel_default_16" [style=solid, label="(512,)"]; "65 _zero_point_16" -> "67 dequantize_per_channel_default_16" [style=solid, label="(512,)"]; -"66 _frozen_param16" -> "67 dequantize_per_channel_default_16" [style=solid, label="(512, 512, 3, 3)"]; +"66 quantize_per_channel_default_16" -> "67 dequantize_per_channel_default_16" [style=solid, label="(512, 512, 3, 3)"]; "67 
dequantize_per_channel_default_16" -> "192 conv2d_16" [style=solid, label=None]; "68 _scale_17" -> "71 dequantize_per_channel_default_17" [style=solid, label="(512,)"]; "69 _zero_point_17" -> "71 dequantize_per_channel_default_17" [style=solid, label="(512,)"]; -"70 _frozen_param17" -> "71 dequantize_per_channel_default_17" [style=solid, label="(512, 256, 1, 1)"]; +"70 quantize_per_channel_default_17" -> "71 dequantize_per_channel_default_17" [style=solid, label="(512, 256, 1, 1)"]; "71 dequantize_per_channel_default_17" -> "196 conv2d_17" [style=solid, label=None]; "72 _scale_18" -> "75 dequantize_per_channel_default_18" [style=solid, label="(512,)"]; "73 _zero_point_18" -> "75 dequantize_per_channel_default_18" [style=solid, label="(512,)"]; -"74 _frozen_param18" -> "75 dequantize_per_channel_default_18" [style=solid, label="(512, 512, 3, 3)"]; +"74 quantize_per_channel_default_18" -> "75 dequantize_per_channel_default_18" [style=solid, label="(512, 512, 3, 3)"]; "75 dequantize_per_channel_default_18" -> "205 conv2d_18" [style=solid, label=None]; "76 _scale_19" -> "79 dequantize_per_channel_default_19" [style=solid, label="(512,)"]; "77 _zero_point_19" -> "79 dequantize_per_channel_default_19" [style=solid, label="(512,)"]; -"78 _frozen_param19" -> "79 dequantize_per_channel_default_19" [style=solid, label="(512, 512, 3, 3)"]; +"78 quantize_per_channel_default_19" -> "79 dequantize_per_channel_default_19" [style=solid, label="(512, 512, 3, 3)"]; "79 dequantize_per_channel_default_19" -> "210 conv2d_19" [style=solid, label=None]; "80 _scale_20" -> "83 dequantize_per_channel_default_20" [style=solid, label="(1000,)"]; "81 _zero_point_20" -> "83 dequantize_per_channel_default_20" [style=solid, label="(1000,)"]; -"82 _frozen_param20" -> "83 dequantize_per_channel_default_20" [style=solid, label="(1000, 512)"]; +"82 quantize_per_channel_default_20" -> "83 dequantize_per_channel_default_20" [style=solid, label="(1000, 512)"]; "83 dequantize_per_channel_default_20" -> 
"221 linear" [style=solid, label=None]; "84 fc_bias" -> "221 linear" [style=solid, label="(1000,)"]; "85 x" -> "86 quantize_per_tensor_default" [style=solid, label="(1, 3, 224, 224)"]; diff --git a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/swin_v2_t.dot b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/swin_v2_t.dot index fde703676ea..0adada9f3a7 100644 --- a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/swin_v2_t.dot +++ b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/swin_v2_t.dot @@ -1,139 +1,139 @@ strict digraph { "0 _scale_0" [id=0, type="get_attr"]; "1 _zero_point_0" [id=1, type="get_attr"]; -"2 _frozen_param0" [id=2, type="get_attr"]; +"2 quantize_per_channel_default" [id=2, type="get_attr"]; "3 dequantize_per_channel_default" [id=3, type="dequantize_per_channel"]; "4 _scale_1" [id=4, type="get_attr"]; "5 _zero_point_1" [id=5, type="get_attr"]; -"6 _frozen_param1" [id=6, type="get_attr"]; +"6 quantize_per_channel_default_1" [id=6, type="get_attr"]; "7 dequantize_per_channel_default_1" [id=7, type="dequantize_per_channel"]; "8 features_1_0_attn_qkv_bias" [id=8, type="get_attr"]; "9 features_1_0_attn_proj_bias" [id=9, type="get_attr"]; "10 features_1_0_attn_logit_scale" [id=10, type="get_attr"]; "11 _scale_2" [id=11, type="get_attr"]; "12 _zero_point_2" [id=12, type="get_attr"]; -"13 _frozen_param2" [id=13, type="get_attr"]; +"13 quantize_per_channel_default_2" [id=13, type="get_attr"]; "14 dequantize_per_channel_default_2" [id=14, type="dequantize_per_channel"]; "15 _scale_3" [id=15, type="get_attr"]; "16 _zero_point_3" [id=16, type="get_attr"]; -"17 _frozen_param3" [id=17, type="get_attr"]; +"17 quantize_per_channel_default_3" [id=17, type="get_attr"]; "18 dequantize_per_channel_default_3" [id=18, type="dequantize_per_channel"]; "19 features_1_1_attn_qkv_bias" [id=19, type="get_attr"]; "20 features_1_1_attn_proj_bias" [id=20, type="get_attr"]; "21 features_1_1_attn_logit_scale" [id=21, 
type="get_attr"]; "22 _scale_4" [id=22, type="get_attr"]; "23 _zero_point_4" [id=23, type="get_attr"]; -"24 _frozen_param4" [id=24, type="get_attr"]; +"24 quantize_per_channel_default_4" [id=24, type="get_attr"]; "25 dequantize_per_channel_default_4" [id=25, type="dequantize_per_channel"]; "26 _scale_5" [id=26, type="get_attr"]; "27 _zero_point_5" [id=27, type="get_attr"]; -"28 _frozen_param5" [id=28, type="get_attr"]; +"28 quantize_per_channel_default_5" [id=28, type="get_attr"]; "29 dequantize_per_channel_default_5" [id=29, type="dequantize_per_channel"]; "30 features_3_0_attn_qkv_bias" [id=30, type="get_attr"]; "31 features_3_0_attn_proj_bias" [id=31, type="get_attr"]; "32 features_3_0_attn_logit_scale" [id=32, type="get_attr"]; "33 _scale_6" [id=33, type="get_attr"]; "34 _zero_point_6" [id=34, type="get_attr"]; -"35 _frozen_param6" [id=35, type="get_attr"]; +"35 quantize_per_channel_default_6" [id=35, type="get_attr"]; "36 dequantize_per_channel_default_6" [id=36, type="dequantize_per_channel"]; "37 _scale_7" [id=37, type="get_attr"]; "38 _zero_point_7" [id=38, type="get_attr"]; -"39 _frozen_param7" [id=39, type="get_attr"]; +"39 quantize_per_channel_default_7" [id=39, type="get_attr"]; "40 dequantize_per_channel_default_7" [id=40, type="dequantize_per_channel"]; "41 features_3_1_attn_qkv_bias" [id=41, type="get_attr"]; "42 features_3_1_attn_proj_bias" [id=42, type="get_attr"]; "43 features_3_1_attn_logit_scale" [id=43, type="get_attr"]; "44 _scale_8" [id=44, type="get_attr"]; "45 _zero_point_8" [id=45, type="get_attr"]; -"46 _frozen_param8" [id=46, type="get_attr"]; +"46 quantize_per_channel_default_8" [id=46, type="get_attr"]; "47 dequantize_per_channel_default_8" [id=47, type="dequantize_per_channel"]; "48 _scale_9" [id=48, type="get_attr"]; "49 _zero_point_9" [id=49, type="get_attr"]; -"50 _frozen_param9" [id=50, type="get_attr"]; +"50 quantize_per_channel_default_9" [id=50, type="get_attr"]; "51 dequantize_per_channel_default_9" [id=51, 
type="dequantize_per_channel"]; "52 features_5_0_attn_qkv_bias" [id=52, type="get_attr"]; "53 features_5_0_attn_proj_bias" [id=53, type="get_attr"]; "54 features_5_0_attn_logit_scale" [id=54, type="get_attr"]; "55 _scale_10" [id=55, type="get_attr"]; "56 _zero_point_10" [id=56, type="get_attr"]; -"57 _frozen_param10" [id=57, type="get_attr"]; +"57 quantize_per_channel_default_10" [id=57, type="get_attr"]; "58 dequantize_per_channel_default_10" [id=58, type="dequantize_per_channel"]; "59 _scale_11" [id=59, type="get_attr"]; "60 _zero_point_11" [id=60, type="get_attr"]; -"61 _frozen_param11" [id=61, type="get_attr"]; +"61 quantize_per_channel_default_11" [id=61, type="get_attr"]; "62 dequantize_per_channel_default_11" [id=62, type="dequantize_per_channel"]; "63 features_5_1_attn_qkv_bias" [id=63, type="get_attr"]; "64 features_5_1_attn_proj_bias" [id=64, type="get_attr"]; "65 features_5_1_attn_logit_scale" [id=65, type="get_attr"]; "66 _scale_12" [id=66, type="get_attr"]; "67 _zero_point_12" [id=67, type="get_attr"]; -"68 _frozen_param12" [id=68, type="get_attr"]; +"68 quantize_per_channel_default_12" [id=68, type="get_attr"]; "69 dequantize_per_channel_default_12" [id=69, type="dequantize_per_channel"]; "70 _scale_13" [id=70, type="get_attr"]; "71 _zero_point_13" [id=71, type="get_attr"]; -"72 _frozen_param13" [id=72, type="get_attr"]; +"72 quantize_per_channel_default_13" [id=72, type="get_attr"]; "73 dequantize_per_channel_default_13" [id=73, type="dequantize_per_channel"]; "74 features_5_2_attn_qkv_bias" [id=74, type="get_attr"]; "75 features_5_2_attn_proj_bias" [id=75, type="get_attr"]; "76 features_5_2_attn_logit_scale" [id=76, type="get_attr"]; "77 _scale_14" [id=77, type="get_attr"]; "78 _zero_point_14" [id=78, type="get_attr"]; -"79 _frozen_param14" [id=79, type="get_attr"]; +"79 quantize_per_channel_default_14" [id=79, type="get_attr"]; "80 dequantize_per_channel_default_14" [id=80, type="dequantize_per_channel"]; "81 _scale_15" [id=81, type="get_attr"]; 
"82 _zero_point_15" [id=82, type="get_attr"]; -"83 _frozen_param15" [id=83, type="get_attr"]; +"83 quantize_per_channel_default_15" [id=83, type="get_attr"]; "84 dequantize_per_channel_default_15" [id=84, type="dequantize_per_channel"]; "85 features_5_3_attn_qkv_bias" [id=85, type="get_attr"]; "86 features_5_3_attn_proj_bias" [id=86, type="get_attr"]; "87 features_5_3_attn_logit_scale" [id=87, type="get_attr"]; "88 _scale_16" [id=88, type="get_attr"]; "89 _zero_point_16" [id=89, type="get_attr"]; -"90 _frozen_param16" [id=90, type="get_attr"]; +"90 quantize_per_channel_default_16" [id=90, type="get_attr"]; "91 dequantize_per_channel_default_16" [id=91, type="dequantize_per_channel"]; "92 _scale_17" [id=92, type="get_attr"]; "93 _zero_point_17" [id=93, type="get_attr"]; -"94 _frozen_param17" [id=94, type="get_attr"]; +"94 quantize_per_channel_default_17" [id=94, type="get_attr"]; "95 dequantize_per_channel_default_17" [id=95, type="dequantize_per_channel"]; "96 features_5_4_attn_qkv_bias" [id=96, type="get_attr"]; "97 features_5_4_attn_proj_bias" [id=97, type="get_attr"]; "98 features_5_4_attn_logit_scale" [id=98, type="get_attr"]; "99 _scale_18" [id=99, type="get_attr"]; "100 _zero_point_18" [id=100, type="get_attr"]; -"101 _frozen_param18" [id=101, type="get_attr"]; +"101 quantize_per_channel_default_18" [id=101, type="get_attr"]; "102 dequantize_per_channel_default_18" [id=102, type="dequantize_per_channel"]; "103 _scale_19" [id=103, type="get_attr"]; "104 _zero_point_19" [id=104, type="get_attr"]; -"105 _frozen_param19" [id=105, type="get_attr"]; +"105 quantize_per_channel_default_19" [id=105, type="get_attr"]; "106 dequantize_per_channel_default_19" [id=106, type="dequantize_per_channel"]; "107 features_5_5_attn_qkv_bias" [id=107, type="get_attr"]; "108 features_5_5_attn_proj_bias" [id=108, type="get_attr"]; "109 features_5_5_attn_logit_scale" [id=109, type="get_attr"]; "110 _scale_20" [id=110, type="get_attr"]; "111 _zero_point_20" [id=111, type="get_attr"]; 
-"112 _frozen_param20" [id=112, type="get_attr"]; +"112 quantize_per_channel_default_20" [id=112, type="get_attr"]; "113 dequantize_per_channel_default_20" [id=113, type="dequantize_per_channel"]; "114 _scale_21" [id=114, type="get_attr"]; "115 _zero_point_21" [id=115, type="get_attr"]; -"116 _frozen_param21" [id=116, type="get_attr"]; +"116 quantize_per_channel_default_21" [id=116, type="get_attr"]; "117 dequantize_per_channel_default_21" [id=117, type="dequantize_per_channel"]; "118 features_7_0_attn_qkv_bias" [id=118, type="get_attr"]; "119 features_7_0_attn_proj_bias" [id=119, type="get_attr"]; "120 features_7_0_attn_logit_scale" [id=120, type="get_attr"]; "121 _scale_22" [id=121, type="get_attr"]; "122 _zero_point_22" [id=122, type="get_attr"]; -"123 _frozen_param22" [id=123, type="get_attr"]; +"123 quantize_per_channel_default_22" [id=123, type="get_attr"]; "124 dequantize_per_channel_default_22" [id=124, type="dequantize_per_channel"]; "125 _scale_23" [id=125, type="get_attr"]; "126 _zero_point_23" [id=126, type="get_attr"]; -"127 _frozen_param23" [id=127, type="get_attr"]; +"127 quantize_per_channel_default_23" [id=127, type="get_attr"]; "128 dequantize_per_channel_default_23" [id=128, type="dequantize_per_channel"]; "129 features_7_1_attn_qkv_bias" [id=129, type="get_attr"]; "130 features_7_1_attn_proj_bias" [id=130, type="get_attr"]; "131 features_7_1_attn_logit_scale" [id=131, type="get_attr"]; "132 _scale_24" [id=132, type="get_attr"]; "133 _zero_point_24" [id=133, type="get_attr"]; -"134 _frozen_param24" [id=134, type="get_attr"]; +"134 quantize_per_channel_default_24" [id=134, type="get_attr"]; "135 dequantize_per_channel_default_24" [id=135, type="dequantize_per_channel"]; "136 features_0_0_bias" [id=136, type="get_attr"]; "137 features_0_2_weight" [id=137, type="get_attr"]; @@ -145,12 +145,12 @@ strict digraph { "143 features_1_0_norm1_bias" [id=143, type="get_attr"]; "144 _scale_25" [id=144, type="get_attr"]; "145 _zero_point_25" [id=145, 
type="get_attr"]; -"146 _frozen_param25" [id=146, type="get_attr"]; +"146 quantize_per_channel_default_25" [id=146, type="get_attr"]; "147 dequantize_per_channel_default_25" [id=147, type="dequantize_per_channel"]; "148 features_1_0_mlp_0_bias" [id=148, type="get_attr"]; "149 _scale_26" [id=149, type="get_attr"]; "150 _zero_point_26" [id=150, type="get_attr"]; -"151 _frozen_param26" [id=151, type="get_attr"]; +"151 quantize_per_channel_default_26" [id=151, type="get_attr"]; "152 dequantize_per_channel_default_26" [id=152, type="dequantize_per_channel"]; "153 features_1_0_mlp_3_bias" [id=153, type="get_attr"]; "154 features_1_0_norm2_weight" [id=154, type="get_attr"]; @@ -162,19 +162,19 @@ strict digraph { "160 features_1_1_norm1_bias" [id=160, type="get_attr"]; "161 _scale_27" [id=161, type="get_attr"]; "162 _zero_point_27" [id=162, type="get_attr"]; -"163 _frozen_param27" [id=163, type="get_attr"]; +"163 quantize_per_channel_default_27" [id=163, type="get_attr"]; "164 dequantize_per_channel_default_27" [id=164, type="dequantize_per_channel"]; "165 features_1_1_mlp_0_bias" [id=165, type="get_attr"]; "166 _scale_28" [id=166, type="get_attr"]; "167 _zero_point_28" [id=167, type="get_attr"]; -"168 _frozen_param28" [id=168, type="get_attr"]; +"168 quantize_per_channel_default_28" [id=168, type="get_attr"]; "169 dequantize_per_channel_default_28" [id=169, type="dequantize_per_channel"]; "170 features_1_1_mlp_3_bias" [id=170, type="get_attr"]; "171 features_1_1_norm2_weight" [id=171, type="get_attr"]; "172 features_1_1_norm2_bias" [id=172, type="get_attr"]; "173 _scale_29" [id=173, type="get_attr"]; "174 _zero_point_29" [id=174, type="get_attr"]; -"175 _frozen_param29" [id=175, type="get_attr"]; +"175 quantize_per_channel_default_29" [id=175, type="get_attr"]; "176 dequantize_per_channel_default_29" [id=176, type="dequantize_per_channel"]; "177 features_2_norm_weight" [id=177, type="get_attr"]; "178 features_2_norm_bias" [id=178, type="get_attr"]; @@ -185,12 +185,12 @@ 
strict digraph { "183 features_3_0_norm1_bias" [id=183, type="get_attr"]; "184 _scale_30" [id=184, type="get_attr"]; "185 _zero_point_30" [id=185, type="get_attr"]; -"186 _frozen_param30" [id=186, type="get_attr"]; +"186 quantize_per_channel_default_30" [id=186, type="get_attr"]; "187 dequantize_per_channel_default_30" [id=187, type="dequantize_per_channel"]; "188 features_3_0_mlp_0_bias" [id=188, type="get_attr"]; "189 _scale_31" [id=189, type="get_attr"]; "190 _zero_point_31" [id=190, type="get_attr"]; -"191 _frozen_param31" [id=191, type="get_attr"]; +"191 quantize_per_channel_default_31" [id=191, type="get_attr"]; "192 dequantize_per_channel_default_31" [id=192, type="dequantize_per_channel"]; "193 features_3_0_mlp_3_bias" [id=193, type="get_attr"]; "194 features_3_0_norm2_weight" [id=194, type="get_attr"]; @@ -202,19 +202,19 @@ strict digraph { "200 features_3_1_norm1_bias" [id=200, type="get_attr"]; "201 _scale_32" [id=201, type="get_attr"]; "202 _zero_point_32" [id=202, type="get_attr"]; -"203 _frozen_param32" [id=203, type="get_attr"]; +"203 quantize_per_channel_default_32" [id=203, type="get_attr"]; "204 dequantize_per_channel_default_32" [id=204, type="dequantize_per_channel"]; "205 features_3_1_mlp_0_bias" [id=205, type="get_attr"]; "206 _scale_33" [id=206, type="get_attr"]; "207 _zero_point_33" [id=207, type="get_attr"]; -"208 _frozen_param33" [id=208, type="get_attr"]; +"208 quantize_per_channel_default_33" [id=208, type="get_attr"]; "209 dequantize_per_channel_default_33" [id=209, type="dequantize_per_channel"]; "210 features_3_1_mlp_3_bias" [id=210, type="get_attr"]; "211 features_3_1_norm2_weight" [id=211, type="get_attr"]; "212 features_3_1_norm2_bias" [id=212, type="get_attr"]; "213 _scale_34" [id=213, type="get_attr"]; "214 _zero_point_34" [id=214, type="get_attr"]; -"215 _frozen_param34" [id=215, type="get_attr"]; +"215 quantize_per_channel_default_34" [id=215, type="get_attr"]; "216 dequantize_per_channel_default_34" [id=216, 
type="dequantize_per_channel"]; "217 features_4_norm_weight" [id=217, type="get_attr"]; "218 features_4_norm_bias" [id=218, type="get_attr"]; @@ -225,12 +225,12 @@ strict digraph { "223 features_5_0_norm1_bias" [id=223, type="get_attr"]; "224 _scale_35" [id=224, type="get_attr"]; "225 _zero_point_35" [id=225, type="get_attr"]; -"226 _frozen_param35" [id=226, type="get_attr"]; +"226 quantize_per_channel_default_35" [id=226, type="get_attr"]; "227 dequantize_per_channel_default_35" [id=227, type="dequantize_per_channel"]; "228 features_5_0_mlp_0_bias" [id=228, type="get_attr"]; "229 _scale_36" [id=229, type="get_attr"]; "230 _zero_point_36" [id=230, type="get_attr"]; -"231 _frozen_param36" [id=231, type="get_attr"]; +"231 quantize_per_channel_default_36" [id=231, type="get_attr"]; "232 dequantize_per_channel_default_36" [id=232, type="dequantize_per_channel"]; "233 features_5_0_mlp_3_bias" [id=233, type="get_attr"]; "234 features_5_0_norm2_weight" [id=234, type="get_attr"]; @@ -242,12 +242,12 @@ strict digraph { "240 features_5_1_norm1_bias" [id=240, type="get_attr"]; "241 _scale_37" [id=241, type="get_attr"]; "242 _zero_point_37" [id=242, type="get_attr"]; -"243 _frozen_param37" [id=243, type="get_attr"]; +"243 quantize_per_channel_default_37" [id=243, type="get_attr"]; "244 dequantize_per_channel_default_37" [id=244, type="dequantize_per_channel"]; "245 features_5_1_mlp_0_bias" [id=245, type="get_attr"]; "246 _scale_38" [id=246, type="get_attr"]; "247 _zero_point_38" [id=247, type="get_attr"]; -"248 _frozen_param38" [id=248, type="get_attr"]; +"248 quantize_per_channel_default_38" [id=248, type="get_attr"]; "249 dequantize_per_channel_default_38" [id=249, type="dequantize_per_channel"]; "250 features_5_1_mlp_3_bias" [id=250, type="get_attr"]; "251 features_5_1_norm2_weight" [id=251, type="get_attr"]; @@ -259,12 +259,12 @@ strict digraph { "257 features_5_2_norm1_bias" [id=257, type="get_attr"]; "258 _scale_39" [id=258, type="get_attr"]; "259 _zero_point_39" 
[id=259, type="get_attr"]; -"260 _frozen_param39" [id=260, type="get_attr"]; +"260 quantize_per_channel_default_39" [id=260, type="get_attr"]; "261 dequantize_per_channel_default_39" [id=261, type="dequantize_per_channel"]; "262 features_5_2_mlp_0_bias" [id=262, type="get_attr"]; "263 _scale_40" [id=263, type="get_attr"]; "264 _zero_point_40" [id=264, type="get_attr"]; -"265 _frozen_param40" [id=265, type="get_attr"]; +"265 quantize_per_channel_default_40" [id=265, type="get_attr"]; "266 dequantize_per_channel_default_40" [id=266, type="dequantize_per_channel"]; "267 features_5_2_mlp_3_bias" [id=267, type="get_attr"]; "268 features_5_2_norm2_weight" [id=268, type="get_attr"]; @@ -276,12 +276,12 @@ strict digraph { "274 features_5_3_norm1_bias" [id=274, type="get_attr"]; "275 _scale_41" [id=275, type="get_attr"]; "276 _zero_point_41" [id=276, type="get_attr"]; -"277 _frozen_param41" [id=277, type="get_attr"]; +"277 quantize_per_channel_default_41" [id=277, type="get_attr"]; "278 dequantize_per_channel_default_41" [id=278, type="dequantize_per_channel"]; "279 features_5_3_mlp_0_bias" [id=279, type="get_attr"]; "280 _scale_42" [id=280, type="get_attr"]; "281 _zero_point_42" [id=281, type="get_attr"]; -"282 _frozen_param42" [id=282, type="get_attr"]; +"282 quantize_per_channel_default_42" [id=282, type="get_attr"]; "283 dequantize_per_channel_default_42" [id=283, type="dequantize_per_channel"]; "284 features_5_3_mlp_3_bias" [id=284, type="get_attr"]; "285 features_5_3_norm2_weight" [id=285, type="get_attr"]; @@ -293,12 +293,12 @@ strict digraph { "291 features_5_4_norm1_bias" [id=291, type="get_attr"]; "292 _scale_43" [id=292, type="get_attr"]; "293 _zero_point_43" [id=293, type="get_attr"]; -"294 _frozen_param43" [id=294, type="get_attr"]; +"294 quantize_per_channel_default_43" [id=294, type="get_attr"]; "295 dequantize_per_channel_default_43" [id=295, type="dequantize_per_channel"]; "296 features_5_4_mlp_0_bias" [id=296, type="get_attr"]; "297 _scale_44" [id=297, 
type="get_attr"]; "298 _zero_point_44" [id=298, type="get_attr"]; -"299 _frozen_param44" [id=299, type="get_attr"]; +"299 quantize_per_channel_default_44" [id=299, type="get_attr"]; "300 dequantize_per_channel_default_44" [id=300, type="dequantize_per_channel"]; "301 features_5_4_mlp_3_bias" [id=301, type="get_attr"]; "302 features_5_4_norm2_weight" [id=302, type="get_attr"]; @@ -310,19 +310,19 @@ strict digraph { "308 features_5_5_norm1_bias" [id=308, type="get_attr"]; "309 _scale_45" [id=309, type="get_attr"]; "310 _zero_point_45" [id=310, type="get_attr"]; -"311 _frozen_param45" [id=311, type="get_attr"]; +"311 quantize_per_channel_default_45" [id=311, type="get_attr"]; "312 dequantize_per_channel_default_45" [id=312, type="dequantize_per_channel"]; "313 features_5_5_mlp_0_bias" [id=313, type="get_attr"]; "314 _scale_46" [id=314, type="get_attr"]; "315 _zero_point_46" [id=315, type="get_attr"]; -"316 _frozen_param46" [id=316, type="get_attr"]; +"316 quantize_per_channel_default_46" [id=316, type="get_attr"]; "317 dequantize_per_channel_default_46" [id=317, type="dequantize_per_channel"]; "318 features_5_5_mlp_3_bias" [id=318, type="get_attr"]; "319 features_5_5_norm2_weight" [id=319, type="get_attr"]; "320 features_5_5_norm2_bias" [id=320, type="get_attr"]; "321 _scale_47" [id=321, type="get_attr"]; "322 _zero_point_47" [id=322, type="get_attr"]; -"323 _frozen_param47" [id=323, type="get_attr"]; +"323 quantize_per_channel_default_47" [id=323, type="get_attr"]; "324 dequantize_per_channel_default_47" [id=324, type="dequantize_per_channel"]; "325 features_6_norm_weight" [id=325, type="get_attr"]; "326 features_6_norm_bias" [id=326, type="get_attr"]; @@ -333,12 +333,12 @@ strict digraph { "331 features_7_0_norm1_bias" [id=331, type="get_attr"]; "332 _scale_48" [id=332, type="get_attr"]; "333 _zero_point_48" [id=333, type="get_attr"]; -"334 _frozen_param48" [id=334, type="get_attr"]; +"334 quantize_per_channel_default_48" [id=334, type="get_attr"]; "335 
dequantize_per_channel_default_48" [id=335, type="dequantize_per_channel"]; "336 features_7_0_mlp_0_bias" [id=336, type="get_attr"]; "337 _scale_49" [id=337, type="get_attr"]; "338 _zero_point_49" [id=338, type="get_attr"]; -"339 _frozen_param49" [id=339, type="get_attr"]; +"339 quantize_per_channel_default_49" [id=339, type="get_attr"]; "340 dequantize_per_channel_default_49" [id=340, type="dequantize_per_channel"]; "341 features_7_0_mlp_3_bias" [id=341, type="get_attr"]; "342 features_7_0_norm2_weight" [id=342, type="get_attr"]; @@ -350,12 +350,12 @@ strict digraph { "348 features_7_1_norm1_bias" [id=348, type="get_attr"]; "349 _scale_50" [id=349, type="get_attr"]; "350 _zero_point_50" [id=350, type="get_attr"]; -"351 _frozen_param50" [id=351, type="get_attr"]; +"351 quantize_per_channel_default_50" [id=351, type="get_attr"]; "352 dequantize_per_channel_default_50" [id=352, type="dequantize_per_channel"]; "353 features_7_1_mlp_0_bias" [id=353, type="get_attr"]; "354 _scale_51" [id=354, type="get_attr"]; "355 _zero_point_51" [id=355, type="get_attr"]; -"356 _frozen_param51" [id=356, type="get_attr"]; +"356 quantize_per_channel_default_51" [id=356, type="get_attr"]; "357 dequantize_per_channel_default_51" [id=357, type="dequantize_per_channel"]; "358 features_7_1_mlp_3_bias" [id=358, type="get_attr"]; "359 features_7_1_norm2_weight" [id=359, type="get_attr"]; @@ -364,7 +364,7 @@ strict digraph { "362 norm_bias" [id=362, type="get_attr"]; "363 _scale_52" [id=363, type="get_attr"]; "364 _zero_point_52" [id=364, type="get_attr"]; -"365 _frozen_param52" [id=365, type="get_attr"]; +"365 quantize_per_channel_default_52" [id=365, type="get_attr"]; "366 dequantize_per_channel_default_52" [id=366, type="dequantize_per_channel"]; "367 head_bias" [id=367, type="get_attr"]; "368 features_1_0_attn_relative_coords_table" [id=368, type="get_attr"]; @@ -1658,139 +1658,139 @@ strict digraph { "1656 output" [id=1656, type=output]; "0 _scale_0" -> "3 dequantize_per_channel_default" 
[style=solid, label="(288,)"]; "1 _zero_point_0" -> "3 dequantize_per_channel_default" [style=solid, label="(288,)"]; -"2 _frozen_param0" -> "3 dequantize_per_channel_default" [style=solid, label="(288, 96)"]; +"2 quantize_per_channel_default" -> "3 dequantize_per_channel_default" [style=solid, label="(288, 96)"]; "3 dequantize_per_channel_default" -> "463 linear_2" [style=solid, label=None]; "4 _scale_1" -> "7 dequantize_per_channel_default_1" [style=solid, label="(96,)"]; "5 _zero_point_1" -> "7 dequantize_per_channel_default_1" [style=solid, label="(96,)"]; -"6 _frozen_param1" -> "7 dequantize_per_channel_default_1" [style=solid, label="(96, 96)"]; +"6 quantize_per_channel_default_1" -> "7 dequantize_per_channel_default_1" [style=solid, label="(96, 96)"]; "7 dequantize_per_channel_default_1" -> "494 linear_3" [style=solid, label=None]; "8 features_1_0_attn_qkv_bias" -> "460 clone" [style=solid, label="(288,)"]; "9 features_1_0_attn_proj_bias" -> "494 linear_3" [style=solid, label="(96,)"]; "10 features_1_0_attn_logit_scale" -> "483 clamp" [style=solid, label="(3, 1, 1)"]; "11 _scale_2" -> "14 dequantize_per_channel_default_2" [style=solid, label="(288,)"]; "12 _zero_point_2" -> "14 dequantize_per_channel_default_2" [style=solid, label="(288,)"]; -"13 _frozen_param2" -> "14 dequantize_per_channel_default_2" [style=solid, label="(288, 96)"]; +"13 quantize_per_channel_default_2" -> "14 dequantize_per_channel_default_2" [style=solid, label="(288, 96)"]; "14 dequantize_per_channel_default_2" -> "535 linear_8" [style=solid, label=None]; "15 _scale_3" -> "18 dequantize_per_channel_default_3" [style=solid, label="(96,)"]; "16 _zero_point_3" -> "18 dequantize_per_channel_default_3" [style=solid, label="(96,)"]; -"17 _frozen_param3" -> "18 dequantize_per_channel_default_3" [style=solid, label="(96, 96)"]; +"17 quantize_per_channel_default_3" -> "18 dequantize_per_channel_default_3" [style=solid, label="(96, 96)"]; "18 dequantize_per_channel_default_3" -> "618 linear_9" 
[style=solid, label=None]; "19 features_1_1_attn_qkv_bias" -> "532 clone_1" [style=solid, label="(288,)"]; "20 features_1_1_attn_proj_bias" -> "618 linear_9" [style=solid, label="(96,)"]; "21 features_1_1_attn_logit_scale" -> "555 clamp_1" [style=solid, label="(3, 1, 1)"]; "22 _scale_4" -> "25 dequantize_per_channel_default_4" [style=solid, label="(576,)"]; "23 _zero_point_4" -> "25 dequantize_per_channel_default_4" [style=solid, label="(576,)"]; -"24 _frozen_param4" -> "25 dequantize_per_channel_default_4" [style=solid, label="(576, 192)"]; +"24 quantize_per_channel_default_4" -> "25 dequantize_per_channel_default_4" [style=solid, label="(576, 192)"]; "25 dequantize_per_channel_default_4" -> "677 linear_15" [style=solid, label=None]; "26 _scale_5" -> "29 dequantize_per_channel_default_5" [style=solid, label="(192,)"]; "27 _zero_point_5" -> "29 dequantize_per_channel_default_5" [style=solid, label="(192,)"]; -"28 _frozen_param5" -> "29 dequantize_per_channel_default_5" [style=solid, label="(192, 192)"]; +"28 quantize_per_channel_default_5" -> "29 dequantize_per_channel_default_5" [style=solid, label="(192, 192)"]; "29 dequantize_per_channel_default_5" -> "708 linear_16" [style=solid, label=None]; "30 features_3_0_attn_qkv_bias" -> "674 clone_2" [style=solid, label="(576,)"]; "31 features_3_0_attn_proj_bias" -> "708 linear_16" [style=solid, label="(192,)"]; "32 features_3_0_attn_logit_scale" -> "697 clamp_2" [style=solid, label="(6, 1, 1)"]; "33 _scale_6" -> "36 dequantize_per_channel_default_6" [style=solid, label="(576,)"]; "34 _zero_point_6" -> "36 dequantize_per_channel_default_6" [style=solid, label="(576,)"]; -"35 _frozen_param6" -> "36 dequantize_per_channel_default_6" [style=solid, label="(576, 192)"]; +"35 quantize_per_channel_default_6" -> "36 dequantize_per_channel_default_6" [style=solid, label="(576, 192)"]; "36 dequantize_per_channel_default_6" -> "752 linear_21" [style=solid, label=None]; "37 _scale_7" -> "40 dequantize_per_channel_default_7" 
[style=solid, label="(192,)"]; "38 _zero_point_7" -> "40 dequantize_per_channel_default_7" [style=solid, label="(192,)"]; -"39 _frozen_param7" -> "40 dequantize_per_channel_default_7" [style=solid, label="(192, 192)"]; +"39 quantize_per_channel_default_7" -> "40 dequantize_per_channel_default_7" [style=solid, label="(192, 192)"]; "40 dequantize_per_channel_default_7" -> "835 linear_22" [style=solid, label=None]; "41 features_3_1_attn_qkv_bias" -> "749 clone_3" [style=solid, label="(576,)"]; "42 features_3_1_attn_proj_bias" -> "835 linear_22" [style=solid, label="(192,)"]; "43 features_3_1_attn_logit_scale" -> "772 clamp_3" [style=solid, label="(6, 1, 1)"]; "44 _scale_8" -> "47 dequantize_per_channel_default_8" [style=solid, label="(1152,)"]; "45 _zero_point_8" -> "47 dequantize_per_channel_default_8" [style=solid, label="(1152,)"]; -"46 _frozen_param8" -> "47 dequantize_per_channel_default_8" [style=solid, label="(1152, 384)"]; +"46 quantize_per_channel_default_8" -> "47 dequantize_per_channel_default_8" [style=solid, label="(1152, 384)"]; "47 dequantize_per_channel_default_8" -> "897 linear_28" [style=solid, label=None]; "48 _scale_9" -> "51 dequantize_per_channel_default_9" [style=solid, label="(384,)"]; "49 _zero_point_9" -> "51 dequantize_per_channel_default_9" [style=solid, label="(384,)"]; -"50 _frozen_param9" -> "51 dequantize_per_channel_default_9" [style=solid, label="(384, 384)"]; +"50 quantize_per_channel_default_9" -> "51 dequantize_per_channel_default_9" [style=solid, label="(384, 384)"]; "51 dequantize_per_channel_default_9" -> "928 linear_29" [style=solid, label=None]; "52 features_5_0_attn_qkv_bias" -> "894 clone_4" [style=solid, label="(1152,)"]; "53 features_5_0_attn_proj_bias" -> "928 linear_29" [style=solid, label="(384,)"]; "54 features_5_0_attn_logit_scale" -> "917 clamp_4" [style=solid, label="(12, 1, 1)"]; "55 _scale_10" -> "58 dequantize_per_channel_default_10" [style=solid, label="(1152,)"]; "56 _zero_point_10" -> "58 
dequantize_per_channel_default_10" [style=solid, label="(1152,)"]; -"57 _frozen_param10" -> "58 dequantize_per_channel_default_10" [style=solid, label="(1152, 384)"]; +"57 quantize_per_channel_default_10" -> "58 dequantize_per_channel_default_10" [style=solid, label="(1152, 384)"]; "58 dequantize_per_channel_default_10" -> "972 linear_34" [style=solid, label=None]; "59 _scale_11" -> "62 dequantize_per_channel_default_11" [style=solid, label="(384,)"]; "60 _zero_point_11" -> "62 dequantize_per_channel_default_11" [style=solid, label="(384,)"]; -"61 _frozen_param11" -> "62 dequantize_per_channel_default_11" [style=solid, label="(384, 384)"]; +"61 quantize_per_channel_default_11" -> "62 dequantize_per_channel_default_11" [style=solid, label="(384, 384)"]; "62 dequantize_per_channel_default_11" -> "1055 linear_35" [style=solid, label=None]; "63 features_5_1_attn_qkv_bias" -> "969 clone_5" [style=solid, label="(1152,)"]; "64 features_5_1_attn_proj_bias" -> "1055 linear_35" [style=solid, label="(384,)"]; "65 features_5_1_attn_logit_scale" -> "992 clamp_5" [style=solid, label="(12, 1, 1)"]; "66 _scale_12" -> "69 dequantize_per_channel_default_12" [style=solid, label="(1152,)"]; "67 _zero_point_12" -> "69 dequantize_per_channel_default_12" [style=solid, label="(1152,)"]; -"68 _frozen_param12" -> "69 dequantize_per_channel_default_12" [style=solid, label="(1152, 384)"]; +"68 quantize_per_channel_default_12" -> "69 dequantize_per_channel_default_12" [style=solid, label="(1152, 384)"]; "69 dequantize_per_channel_default_12" -> "1099 linear_40" [style=solid, label=None]; "70 _scale_13" -> "73 dequantize_per_channel_default_13" [style=solid, label="(384,)"]; "71 _zero_point_13" -> "73 dequantize_per_channel_default_13" [style=solid, label="(384,)"]; -"72 _frozen_param13" -> "73 dequantize_per_channel_default_13" [style=solid, label="(384, 384)"]; +"72 quantize_per_channel_default_13" -> "73 dequantize_per_channel_default_13" [style=solid, label="(384, 384)"]; "73 
dequantize_per_channel_default_13" -> "1130 linear_41" [style=solid, label=None]; "74 features_5_2_attn_qkv_bias" -> "1096 clone_6" [style=solid, label="(1152,)"]; "75 features_5_2_attn_proj_bias" -> "1130 linear_41" [style=solid, label="(384,)"]; "76 features_5_2_attn_logit_scale" -> "1119 clamp_6" [style=solid, label="(12, 1, 1)"]; "77 _scale_14" -> "80 dequantize_per_channel_default_14" [style=solid, label="(1152,)"]; "78 _zero_point_14" -> "80 dequantize_per_channel_default_14" [style=solid, label="(1152,)"]; -"79 _frozen_param14" -> "80 dequantize_per_channel_default_14" [style=solid, label="(1152, 384)"]; +"79 quantize_per_channel_default_14" -> "80 dequantize_per_channel_default_14" [style=solid, label="(1152, 384)"]; "80 dequantize_per_channel_default_14" -> "1174 linear_46" [style=solid, label=None]; "81 _scale_15" -> "84 dequantize_per_channel_default_15" [style=solid, label="(384,)"]; "82 _zero_point_15" -> "84 dequantize_per_channel_default_15" [style=solid, label="(384,)"]; -"83 _frozen_param15" -> "84 dequantize_per_channel_default_15" [style=solid, label="(384, 384)"]; +"83 quantize_per_channel_default_15" -> "84 dequantize_per_channel_default_15" [style=solid, label="(384, 384)"]; "84 dequantize_per_channel_default_15" -> "1257 linear_47" [style=solid, label=None]; "85 features_5_3_attn_qkv_bias" -> "1171 clone_7" [style=solid, label="(1152,)"]; "86 features_5_3_attn_proj_bias" -> "1257 linear_47" [style=solid, label="(384,)"]; "87 features_5_3_attn_logit_scale" -> "1194 clamp_7" [style=solid, label="(12, 1, 1)"]; "88 _scale_16" -> "91 dequantize_per_channel_default_16" [style=solid, label="(1152,)"]; "89 _zero_point_16" -> "91 dequantize_per_channel_default_16" [style=solid, label="(1152,)"]; -"90 _frozen_param16" -> "91 dequantize_per_channel_default_16" [style=solid, label="(1152, 384)"]; +"90 quantize_per_channel_default_16" -> "91 dequantize_per_channel_default_16" [style=solid, label="(1152, 384)"]; "91 dequantize_per_channel_default_16" -> 
"1301 linear_52" [style=solid, label=None]; "92 _scale_17" -> "95 dequantize_per_channel_default_17" [style=solid, label="(384,)"]; "93 _zero_point_17" -> "95 dequantize_per_channel_default_17" [style=solid, label="(384,)"]; -"94 _frozen_param17" -> "95 dequantize_per_channel_default_17" [style=solid, label="(384, 384)"]; +"94 quantize_per_channel_default_17" -> "95 dequantize_per_channel_default_17" [style=solid, label="(384, 384)"]; "95 dequantize_per_channel_default_17" -> "1332 linear_53" [style=solid, label=None]; "96 features_5_4_attn_qkv_bias" -> "1298 clone_8" [style=solid, label="(1152,)"]; "97 features_5_4_attn_proj_bias" -> "1332 linear_53" [style=solid, label="(384,)"]; "98 features_5_4_attn_logit_scale" -> "1321 clamp_8" [style=solid, label="(12, 1, 1)"]; "99 _scale_18" -> "102 dequantize_per_channel_default_18" [style=solid, label="(1152,)"]; "100 _zero_point_18" -> "102 dequantize_per_channel_default_18" [style=solid, label="(1152,)"]; -"101 _frozen_param18" -> "102 dequantize_per_channel_default_18" [style=solid, label="(1152, 384)"]; +"101 quantize_per_channel_default_18" -> "102 dequantize_per_channel_default_18" [style=solid, label="(1152, 384)"]; "102 dequantize_per_channel_default_18" -> "1376 linear_58" [style=solid, label=None]; "103 _scale_19" -> "106 dequantize_per_channel_default_19" [style=solid, label="(384,)"]; "104 _zero_point_19" -> "106 dequantize_per_channel_default_19" [style=solid, label="(384,)"]; -"105 _frozen_param19" -> "106 dequantize_per_channel_default_19" [style=solid, label="(384, 384)"]; +"105 quantize_per_channel_default_19" -> "106 dequantize_per_channel_default_19" [style=solid, label="(384, 384)"]; "106 dequantize_per_channel_default_19" -> "1459 linear_59" [style=solid, label=None]; "107 features_5_5_attn_qkv_bias" -> "1373 clone_9" [style=solid, label="(1152,)"]; "108 features_5_5_attn_proj_bias" -> "1459 linear_59" [style=solid, label="(384,)"]; "109 features_5_5_attn_logit_scale" -> "1396 clamp_9" [style=solid, 
label="(12, 1, 1)"]; "110 _scale_20" -> "113 dequantize_per_channel_default_20" [style=solid, label="(2304,)"]; "111 _zero_point_20" -> "113 dequantize_per_channel_default_20" [style=solid, label="(2304,)"]; -"112 _frozen_param20" -> "113 dequantize_per_channel_default_20" [style=solid, label="(2304, 768)"]; +"112 quantize_per_channel_default_20" -> "113 dequantize_per_channel_default_20" [style=solid, label="(2304, 768)"]; "113 dequantize_per_channel_default_20" -> "1521 linear_65" [style=solid, label=None]; "114 _scale_21" -> "117 dequantize_per_channel_default_21" [style=solid, label="(768,)"]; "115 _zero_point_21" -> "117 dequantize_per_channel_default_21" [style=solid, label="(768,)"]; -"116 _frozen_param21" -> "117 dequantize_per_channel_default_21" [style=solid, label="(768, 768)"]; +"116 quantize_per_channel_default_21" -> "117 dequantize_per_channel_default_21" [style=solid, label="(768, 768)"]; "117 dequantize_per_channel_default_21" -> "1552 linear_66" [style=solid, label=None]; "118 features_7_0_attn_qkv_bias" -> "1518 clone_10" [style=solid, label="(2304,)"]; "119 features_7_0_attn_proj_bias" -> "1552 linear_66" [style=solid, label="(768,)"]; "120 features_7_0_attn_logit_scale" -> "1541 clamp_10" [style=solid, label="(24, 1, 1)"]; "121 _scale_22" -> "124 dequantize_per_channel_default_22" [style=solid, label="(2304,)"]; "122 _zero_point_22" -> "124 dequantize_per_channel_default_22" [style=solid, label="(2304,)"]; -"123 _frozen_param22" -> "124 dequantize_per_channel_default_22" [style=solid, label="(2304, 768)"]; +"123 quantize_per_channel_default_22" -> "124 dequantize_per_channel_default_22" [style=solid, label="(2304, 768)"]; "124 dequantize_per_channel_default_22" -> "1595 linear_71" [style=solid, label=None]; "125 _scale_23" -> "128 dequantize_per_channel_default_23" [style=solid, label="(768,)"]; "126 _zero_point_23" -> "128 dequantize_per_channel_default_23" [style=solid, label="(768,)"]; -"127 _frozen_param23" -> "128 
dequantize_per_channel_default_23" [style=solid, label="(768, 768)"]; +"127 quantize_per_channel_default_23" -> "128 dequantize_per_channel_default_23" [style=solid, label="(768, 768)"]; "128 dequantize_per_channel_default_23" -> "1626 linear_72" [style=solid, label=None]; "129 features_7_1_attn_qkv_bias" -> "1592 clone_11" [style=solid, label="(2304,)"]; "130 features_7_1_attn_proj_bias" -> "1626 linear_72" [style=solid, label="(768,)"]; "131 features_7_1_attn_logit_scale" -> "1615 clamp_11" [style=solid, label="(24, 1, 1)"]; "132 _scale_24" -> "135 dequantize_per_channel_default_24" [style=solid, label="(96,)"]; "133 _zero_point_24" -> "135 dequantize_per_channel_default_24" [style=solid, label="(96,)"]; -"134 _frozen_param24" -> "135 dequantize_per_channel_default_24" [style=solid, label="(96, 3, 4, 4)"]; +"134 quantize_per_channel_default_24" -> "135 dequantize_per_channel_default_24" [style=solid, label="(96, 3, 4, 4)"]; "135 dequantize_per_channel_default_24" -> "440 conv2d" [style=solid, label=None]; "136 features_0_0_bias" -> "440 conv2d" [style=solid, label="(96,)"]; "137 features_0_2_weight" -> "442 layer_norm" [style=solid, label="(96,)"]; @@ -1802,12 +1802,12 @@ strict digraph { "143 features_1_0_norm1_bias" -> "501 layer_norm_1" [style=solid, label="(96,)"]; "144 _scale_25" -> "147 dequantize_per_channel_default_25" [style=solid, label="(384,)"]; "145 _zero_point_25" -> "147 dequantize_per_channel_default_25" [style=solid, label="(384,)"]; -"146 _frozen_param25" -> "147 dequantize_per_channel_default_25" [style=solid, label="(384, 96)"]; +"146 quantize_per_channel_default_25" -> "147 dequantize_per_channel_default_25" [style=solid, label="(384, 96)"]; "147 dequantize_per_channel_default_25" -> "505 linear_4" [style=solid, label=None]; "148 features_1_0_mlp_0_bias" -> "505 linear_4" [style=solid, label="(384,)"]; "149 _scale_26" -> "152 dequantize_per_channel_default_26" [style=solid, label="(96,)"]; "150 _zero_point_26" -> "152 
dequantize_per_channel_default_26" [style=solid, label="(96,)"]; -"151 _frozen_param26" -> "152 dequantize_per_channel_default_26" [style=solid, label="(96, 384)"]; +"151 quantize_per_channel_default_26" -> "152 dequantize_per_channel_default_26" [style=solid, label="(96, 384)"]; "152 dequantize_per_channel_default_26" -> "510 linear_5" [style=solid, label=None]; "153 features_1_0_mlp_3_bias" -> "510 linear_5" [style=solid, label="(96,)"]; "154 features_1_0_norm2_weight" -> "512 layer_norm_2" [style=solid, label="(96,)"]; @@ -1819,19 +1819,19 @@ strict digraph { "160 features_1_1_norm1_bias" -> "626 layer_norm_3" [style=solid, label="(96,)"]; "161 _scale_27" -> "164 dequantize_per_channel_default_27" [style=solid, label="(384,)"]; "162 _zero_point_27" -> "164 dequantize_per_channel_default_27" [style=solid, label="(384,)"]; -"163 _frozen_param27" -> "164 dequantize_per_channel_default_27" [style=solid, label="(384, 96)"]; +"163 quantize_per_channel_default_27" -> "164 dequantize_per_channel_default_27" [style=solid, label="(384, 96)"]; "164 dequantize_per_channel_default_27" -> "630 linear_10" [style=solid, label=None]; "165 features_1_1_mlp_0_bias" -> "630 linear_10" [style=solid, label="(384,)"]; "166 _scale_28" -> "169 dequantize_per_channel_default_28" [style=solid, label="(96,)"]; "167 _zero_point_28" -> "169 dequantize_per_channel_default_28" [style=solid, label="(96,)"]; -"168 _frozen_param28" -> "169 dequantize_per_channel_default_28" [style=solid, label="(96, 384)"]; +"168 quantize_per_channel_default_28" -> "169 dequantize_per_channel_default_28" [style=solid, label="(96, 384)"]; "169 dequantize_per_channel_default_28" -> "635 linear_11" [style=solid, label=None]; "170 features_1_1_mlp_3_bias" -> "635 linear_11" [style=solid, label="(96,)"]; "171 features_1_1_norm2_weight" -> "637 layer_norm_4" [style=solid, label="(96,)"]; "172 features_1_1_norm2_bias" -> "637 layer_norm_4" [style=solid, label="(96,)"]; "173 _scale_29" -> "176 
dequantize_per_channel_default_29" [style=solid, label="(192,)"]; "174 _zero_point_29" -> "176 dequantize_per_channel_default_29" [style=solid, label="(192,)"]; -"175 _frozen_param29" -> "176 dequantize_per_channel_default_29" [style=solid, label="(192, 384)"]; +"175 quantize_per_channel_default_29" -> "176 dequantize_per_channel_default_29" [style=solid, label="(192, 384)"]; "176 dequantize_per_channel_default_29" -> "655 linear_12" [style=solid, label=None]; "177 features_2_norm_weight" -> "656 layer_norm_5" [style=solid, label="(192,)"]; "178 features_2_norm_bias" -> "656 layer_norm_5" [style=solid, label="(192,)"]; @@ -1842,12 +1842,12 @@ strict digraph { "183 features_3_0_norm1_bias" -> "718 layer_norm_6" [style=solid, label="(192,)"]; "184 _scale_30" -> "187 dequantize_per_channel_default_30" [style=solid, label="(768,)"]; "185 _zero_point_30" -> "187 dequantize_per_channel_default_30" [style=solid, label="(768,)"]; -"186 _frozen_param30" -> "187 dequantize_per_channel_default_30" [style=solid, label="(768, 192)"]; +"186 quantize_per_channel_default_30" -> "187 dequantize_per_channel_default_30" [style=solid, label="(768, 192)"]; "187 dequantize_per_channel_default_30" -> "722 linear_17" [style=solid, label=None]; "188 features_3_0_mlp_0_bias" -> "722 linear_17" [style=solid, label="(768,)"]; "189 _scale_31" -> "192 dequantize_per_channel_default_31" [style=solid, label="(192,)"]; "190 _zero_point_31" -> "192 dequantize_per_channel_default_31" [style=solid, label="(192,)"]; -"191 _frozen_param31" -> "192 dequantize_per_channel_default_31" [style=solid, label="(192, 768)"]; +"191 quantize_per_channel_default_31" -> "192 dequantize_per_channel_default_31" [style=solid, label="(192, 768)"]; "192 dequantize_per_channel_default_31" -> "727 linear_18" [style=solid, label=None]; "193 features_3_0_mlp_3_bias" -> "727 linear_18" [style=solid, label="(192,)"]; "194 features_3_0_norm2_weight" -> "729 layer_norm_7" [style=solid, label="(192,)"]; @@ -1859,19 +1859,19 @@ 
strict digraph { "200 features_3_1_norm1_bias" -> "846 layer_norm_8" [style=solid, label="(192,)"]; "201 _scale_32" -> "204 dequantize_per_channel_default_32" [style=solid, label="(768,)"]; "202 _zero_point_32" -> "204 dequantize_per_channel_default_32" [style=solid, label="(768,)"]; -"203 _frozen_param32" -> "204 dequantize_per_channel_default_32" [style=solid, label="(768, 192)"]; +"203 quantize_per_channel_default_32" -> "204 dequantize_per_channel_default_32" [style=solid, label="(768, 192)"]; "204 dequantize_per_channel_default_32" -> "850 linear_23" [style=solid, label=None]; "205 features_3_1_mlp_0_bias" -> "850 linear_23" [style=solid, label="(768,)"]; "206 _scale_33" -> "209 dequantize_per_channel_default_33" [style=solid, label="(192,)"]; "207 _zero_point_33" -> "209 dequantize_per_channel_default_33" [style=solid, label="(192,)"]; -"208 _frozen_param33" -> "209 dequantize_per_channel_default_33" [style=solid, label="(192, 768)"]; +"208 quantize_per_channel_default_33" -> "209 dequantize_per_channel_default_33" [style=solid, label="(192, 768)"]; "209 dequantize_per_channel_default_33" -> "855 linear_24" [style=solid, label=None]; "210 features_3_1_mlp_3_bias" -> "855 linear_24" [style=solid, label="(192,)"]; "211 features_3_1_norm2_weight" -> "857 layer_norm_9" [style=solid, label="(192,)"]; "212 features_3_1_norm2_bias" -> "857 layer_norm_9" [style=solid, label="(192,)"]; "213 _scale_34" -> "216 dequantize_per_channel_default_34" [style=solid, label="(384,)"]; "214 _zero_point_34" -> "216 dequantize_per_channel_default_34" [style=solid, label="(384,)"]; -"215 _frozen_param34" -> "216 dequantize_per_channel_default_34" [style=solid, label="(384, 768)"]; +"215 quantize_per_channel_default_34" -> "216 dequantize_per_channel_default_34" [style=solid, label="(384, 768)"]; "216 dequantize_per_channel_default_34" -> "875 linear_25" [style=solid, label=None]; "217 features_4_norm_weight" -> "876 layer_norm_10" [style=solid, label="(384,)"]; "218 
features_4_norm_bias" -> "876 layer_norm_10" [style=solid, label="(384,)"]; @@ -1882,12 +1882,12 @@ strict digraph { "223 features_5_0_norm1_bias" -> "938 layer_norm_11" [style=solid, label="(384,)"]; "224 _scale_35" -> "227 dequantize_per_channel_default_35" [style=solid, label="(1536,)"]; "225 _zero_point_35" -> "227 dequantize_per_channel_default_35" [style=solid, label="(1536,)"]; -"226 _frozen_param35" -> "227 dequantize_per_channel_default_35" [style=solid, label="(1536, 384)"]; +"226 quantize_per_channel_default_35" -> "227 dequantize_per_channel_default_35" [style=solid, label="(1536, 384)"]; "227 dequantize_per_channel_default_35" -> "942 linear_30" [style=solid, label=None]; "228 features_5_0_mlp_0_bias" -> "942 linear_30" [style=solid, label="(1536,)"]; "229 _scale_36" -> "232 dequantize_per_channel_default_36" [style=solid, label="(384,)"]; "230 _zero_point_36" -> "232 dequantize_per_channel_default_36" [style=solid, label="(384,)"]; -"231 _frozen_param36" -> "232 dequantize_per_channel_default_36" [style=solid, label="(384, 1536)"]; +"231 quantize_per_channel_default_36" -> "232 dequantize_per_channel_default_36" [style=solid, label="(384, 1536)"]; "232 dequantize_per_channel_default_36" -> "947 linear_31" [style=solid, label=None]; "233 features_5_0_mlp_3_bias" -> "947 linear_31" [style=solid, label="(384,)"]; "234 features_5_0_norm2_weight" -> "949 layer_norm_12" [style=solid, label="(384,)"]; @@ -1899,12 +1899,12 @@ strict digraph { "240 features_5_1_norm1_bias" -> "1066 layer_norm_13" [style=solid, label="(384,)"]; "241 _scale_37" -> "244 dequantize_per_channel_default_37" [style=solid, label="(1536,)"]; "242 _zero_point_37" -> "244 dequantize_per_channel_default_37" [style=solid, label="(1536,)"]; -"243 _frozen_param37" -> "244 dequantize_per_channel_default_37" [style=solid, label="(1536, 384)"]; +"243 quantize_per_channel_default_37" -> "244 dequantize_per_channel_default_37" [style=solid, label="(1536, 384)"]; "244 
dequantize_per_channel_default_37" -> "1070 linear_36" [style=solid, label=None]; "245 features_5_1_mlp_0_bias" -> "1070 linear_36" [style=solid, label="(1536,)"]; "246 _scale_38" -> "249 dequantize_per_channel_default_38" [style=solid, label="(384,)"]; "247 _zero_point_38" -> "249 dequantize_per_channel_default_38" [style=solid, label="(384,)"]; -"248 _frozen_param38" -> "249 dequantize_per_channel_default_38" [style=solid, label="(384, 1536)"]; +"248 quantize_per_channel_default_38" -> "249 dequantize_per_channel_default_38" [style=solid, label="(384, 1536)"]; "249 dequantize_per_channel_default_38" -> "1075 linear_37" [style=solid, label=None]; "250 features_5_1_mlp_3_bias" -> "1075 linear_37" [style=solid, label="(384,)"]; "251 features_5_1_norm2_weight" -> "1077 layer_norm_14" [style=solid, label="(384,)"]; @@ -1916,12 +1916,12 @@ strict digraph { "257 features_5_2_norm1_bias" -> "1140 layer_norm_15" [style=solid, label="(384,)"]; "258 _scale_39" -> "261 dequantize_per_channel_default_39" [style=solid, label="(1536,)"]; "259 _zero_point_39" -> "261 dequantize_per_channel_default_39" [style=solid, label="(1536,)"]; -"260 _frozen_param39" -> "261 dequantize_per_channel_default_39" [style=solid, label="(1536, 384)"]; +"260 quantize_per_channel_default_39" -> "261 dequantize_per_channel_default_39" [style=solid, label="(1536, 384)"]; "261 dequantize_per_channel_default_39" -> "1144 linear_42" [style=solid, label=None]; "262 features_5_2_mlp_0_bias" -> "1144 linear_42" [style=solid, label="(1536,)"]; "263 _scale_40" -> "266 dequantize_per_channel_default_40" [style=solid, label="(384,)"]; "264 _zero_point_40" -> "266 dequantize_per_channel_default_40" [style=solid, label="(384,)"]; -"265 _frozen_param40" -> "266 dequantize_per_channel_default_40" [style=solid, label="(384, 1536)"]; +"265 quantize_per_channel_default_40" -> "266 dequantize_per_channel_default_40" [style=solid, label="(384, 1536)"]; "266 dequantize_per_channel_default_40" -> "1149 linear_43" 
[style=solid, label=None]; "267 features_5_2_mlp_3_bias" -> "1149 linear_43" [style=solid, label="(384,)"]; "268 features_5_2_norm2_weight" -> "1151 layer_norm_16" [style=solid, label="(384,)"]; @@ -1933,12 +1933,12 @@ strict digraph { "274 features_5_3_norm1_bias" -> "1268 layer_norm_17" [style=solid, label="(384,)"]; "275 _scale_41" -> "278 dequantize_per_channel_default_41" [style=solid, label="(1536,)"]; "276 _zero_point_41" -> "278 dequantize_per_channel_default_41" [style=solid, label="(1536,)"]; -"277 _frozen_param41" -> "278 dequantize_per_channel_default_41" [style=solid, label="(1536, 384)"]; +"277 quantize_per_channel_default_41" -> "278 dequantize_per_channel_default_41" [style=solid, label="(1536, 384)"]; "278 dequantize_per_channel_default_41" -> "1272 linear_48" [style=solid, label=None]; "279 features_5_3_mlp_0_bias" -> "1272 linear_48" [style=solid, label="(1536,)"]; "280 _scale_42" -> "283 dequantize_per_channel_default_42" [style=solid, label="(384,)"]; "281 _zero_point_42" -> "283 dequantize_per_channel_default_42" [style=solid, label="(384,)"]; -"282 _frozen_param42" -> "283 dequantize_per_channel_default_42" [style=solid, label="(384, 1536)"]; +"282 quantize_per_channel_default_42" -> "283 dequantize_per_channel_default_42" [style=solid, label="(384, 1536)"]; "283 dequantize_per_channel_default_42" -> "1277 linear_49" [style=solid, label=None]; "284 features_5_3_mlp_3_bias" -> "1277 linear_49" [style=solid, label="(384,)"]; "285 features_5_3_norm2_weight" -> "1279 layer_norm_18" [style=solid, label="(384,)"]; @@ -1950,12 +1950,12 @@ strict digraph { "291 features_5_4_norm1_bias" -> "1342 layer_norm_19" [style=solid, label="(384,)"]; "292 _scale_43" -> "295 dequantize_per_channel_default_43" [style=solid, label="(1536,)"]; "293 _zero_point_43" -> "295 dequantize_per_channel_default_43" [style=solid, label="(1536,)"]; -"294 _frozen_param43" -> "295 dequantize_per_channel_default_43" [style=solid, label="(1536, 384)"]; +"294 
quantize_per_channel_default_43" -> "295 dequantize_per_channel_default_43" [style=solid, label="(1536, 384)"]; "295 dequantize_per_channel_default_43" -> "1346 linear_54" [style=solid, label=None]; "296 features_5_4_mlp_0_bias" -> "1346 linear_54" [style=solid, label="(1536,)"]; "297 _scale_44" -> "300 dequantize_per_channel_default_44" [style=solid, label="(384,)"]; "298 _zero_point_44" -> "300 dequantize_per_channel_default_44" [style=solid, label="(384,)"]; -"299 _frozen_param44" -> "300 dequantize_per_channel_default_44" [style=solid, label="(384, 1536)"]; +"299 quantize_per_channel_default_44" -> "300 dequantize_per_channel_default_44" [style=solid, label="(384, 1536)"]; "300 dequantize_per_channel_default_44" -> "1351 linear_55" [style=solid, label=None]; "301 features_5_4_mlp_3_bias" -> "1351 linear_55" [style=solid, label="(384,)"]; "302 features_5_4_norm2_weight" -> "1353 layer_norm_20" [style=solid, label="(384,)"]; @@ -1967,19 +1967,19 @@ strict digraph { "308 features_5_5_norm1_bias" -> "1470 layer_norm_21" [style=solid, label="(384,)"]; "309 _scale_45" -> "312 dequantize_per_channel_default_45" [style=solid, label="(1536,)"]; "310 _zero_point_45" -> "312 dequantize_per_channel_default_45" [style=solid, label="(1536,)"]; -"311 _frozen_param45" -> "312 dequantize_per_channel_default_45" [style=solid, label="(1536, 384)"]; +"311 quantize_per_channel_default_45" -> "312 dequantize_per_channel_default_45" [style=solid, label="(1536, 384)"]; "312 dequantize_per_channel_default_45" -> "1474 linear_60" [style=solid, label=None]; "313 features_5_5_mlp_0_bias" -> "1474 linear_60" [style=solid, label="(1536,)"]; "314 _scale_46" -> "317 dequantize_per_channel_default_46" [style=solid, label="(384,)"]; "315 _zero_point_46" -> "317 dequantize_per_channel_default_46" [style=solid, label="(384,)"]; -"316 _frozen_param46" -> "317 dequantize_per_channel_default_46" [style=solid, label="(384, 1536)"]; +"316 quantize_per_channel_default_46" -> "317 
dequantize_per_channel_default_46" [style=solid, label="(384, 1536)"]; "317 dequantize_per_channel_default_46" -> "1479 linear_61" [style=solid, label=None]; "318 features_5_5_mlp_3_bias" -> "1479 linear_61" [style=solid, label="(384,)"]; "319 features_5_5_norm2_weight" -> "1481 layer_norm_22" [style=solid, label="(384,)"]; "320 features_5_5_norm2_bias" -> "1481 layer_norm_22" [style=solid, label="(384,)"]; "321 _scale_47" -> "324 dequantize_per_channel_default_47" [style=solid, label="(768,)"]; "322 _zero_point_47" -> "324 dequantize_per_channel_default_47" [style=solid, label="(768,)"]; -"323 _frozen_param47" -> "324 dequantize_per_channel_default_47" [style=solid, label="(768, 1536)"]; +"323 quantize_per_channel_default_47" -> "324 dequantize_per_channel_default_47" [style=solid, label="(768, 1536)"]; "324 dequantize_per_channel_default_47" -> "1499 linear_62" [style=solid, label=None]; "325 features_6_norm_weight" -> "1500 layer_norm_23" [style=solid, label="(768,)"]; "326 features_6_norm_bias" -> "1500 layer_norm_23" [style=solid, label="(768,)"]; @@ -1990,12 +1990,12 @@ strict digraph { "331 features_7_0_norm1_bias" -> "1562 layer_norm_24" [style=solid, label="(768,)"]; "332 _scale_48" -> "335 dequantize_per_channel_default_48" [style=solid, label="(3072,)"]; "333 _zero_point_48" -> "335 dequantize_per_channel_default_48" [style=solid, label="(3072,)"]; -"334 _frozen_param48" -> "335 dequantize_per_channel_default_48" [style=solid, label="(3072, 768)"]; +"334 quantize_per_channel_default_48" -> "335 dequantize_per_channel_default_48" [style=solid, label="(3072, 768)"]; "335 dequantize_per_channel_default_48" -> "1566 linear_67" [style=solid, label=None]; "336 features_7_0_mlp_0_bias" -> "1566 linear_67" [style=solid, label="(3072,)"]; "337 _scale_49" -> "340 dequantize_per_channel_default_49" [style=solid, label="(768,)"]; "338 _zero_point_49" -> "340 dequantize_per_channel_default_49" [style=solid, label="(768,)"]; -"339 _frozen_param49" -> "340 
dequantize_per_channel_default_49" [style=solid, label="(768, 3072)"]; +"339 quantize_per_channel_default_49" -> "340 dequantize_per_channel_default_49" [style=solid, label="(768, 3072)"]; "340 dequantize_per_channel_default_49" -> "1571 linear_68" [style=solid, label=None]; "341 features_7_0_mlp_3_bias" -> "1571 linear_68" [style=solid, label="(768,)"]; "342 features_7_0_norm2_weight" -> "1573 layer_norm_25" [style=solid, label="(768,)"]; @@ -2007,12 +2007,12 @@ strict digraph { "348 features_7_1_norm1_bias" -> "1636 layer_norm_26" [style=solid, label="(768,)"]; "349 _scale_50" -> "352 dequantize_per_channel_default_50" [style=solid, label="(3072,)"]; "350 _zero_point_50" -> "352 dequantize_per_channel_default_50" [style=solid, label="(3072,)"]; -"351 _frozen_param50" -> "352 dequantize_per_channel_default_50" [style=solid, label="(3072, 768)"]; +"351 quantize_per_channel_default_50" -> "352 dequantize_per_channel_default_50" [style=solid, label="(3072, 768)"]; "352 dequantize_per_channel_default_50" -> "1640 linear_73" [style=solid, label=None]; "353 features_7_1_mlp_0_bias" -> "1640 linear_73" [style=solid, label="(3072,)"]; "354 _scale_51" -> "357 dequantize_per_channel_default_51" [style=solid, label="(768,)"]; "355 _zero_point_51" -> "357 dequantize_per_channel_default_51" [style=solid, label="(768,)"]; -"356 _frozen_param51" -> "357 dequantize_per_channel_default_51" [style=solid, label="(768, 3072)"]; +"356 quantize_per_channel_default_51" -> "357 dequantize_per_channel_default_51" [style=solid, label="(768, 3072)"]; "357 dequantize_per_channel_default_51" -> "1645 linear_74" [style=solid, label=None]; "358 features_7_1_mlp_3_bias" -> "1645 linear_74" [style=solid, label="(768,)"]; "359 features_7_1_norm2_weight" -> "1647 layer_norm_27" [style=solid, label="(768,)"]; @@ -2021,7 +2021,7 @@ strict digraph { "362 norm_bias" -> "1649 layer_norm_28" [style=solid, label="(768,)"]; "363 _scale_52" -> "366 dequantize_per_channel_default_52" [style=solid, 
label="(1000,)"]; "364 _zero_point_52" -> "366 dequantize_per_channel_default_52" [style=solid, label="(1000,)"]; -"365 _frozen_param52" -> "366 dequantize_per_channel_default_52" [style=solid, label="(1000, 768)"]; +"365 quantize_per_channel_default_52" -> "366 dequantize_per_channel_default_52" [style=solid, label="(1000, 768)"]; "366 dequantize_per_channel_default_52" -> "1655 linear_75" [style=solid, label=None]; "367 head_bias" -> "1655 linear_75" [style=solid, label="(1000,)"]; "368 features_1_0_attn_relative_coords_table" -> "445 linear" [style=solid, label="(1, 15, 15, 2)"]; diff --git a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/synthetic_transformer.dot b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/synthetic_transformer.dot index 3dacdab8518..0e714c2c9a2 100644 --- a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/synthetic_transformer.dot +++ b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/synthetic_transformer.dot @@ -2,12 +2,12 @@ strict digraph { "0 wte_weight" [id=0, type="get_attr"]; "1 _scale_0" [id=1, type="get_attr"]; "2 _zero_point_0" [id=2, type="get_attr"]; -"3 _frozen_param0" [id=3, type="get_attr"]; +"3 quantize_per_channel_default" [id=3, type="get_attr"]; "4 dequantize_per_channel_default" [id=4, type="dequantize_per_channel"]; "5 linear_bias" [id=5, type="get_attr"]; "6 _scale_1" [id=6, type="get_attr"]; "7 _zero_point_1" [id=7, type="get_attr"]; -"8 _frozen_param1" [id=8, type="get_attr"]; +"8 quantize_per_channel_default_1" [id=8, type="get_attr"]; "9 dequantize_per_channel_default_1" [id=9, type="dequantize_per_channel"]; "10 lm_head_bias" [id=10, type="get_attr"]; "11 input_ids" [id=11, type=input]; @@ -22,12 +22,12 @@ strict digraph { "0 wte_weight" -> "12 embedding" [style=solid, label="(10, 5)"]; "1 _scale_0" -> "4 dequantize_per_channel_default" [style=solid, label="(5,)"]; "2 _zero_point_0" -> "4 dequantize_per_channel_default" [style=solid, label="(5,)"]; -"3 
_frozen_param0" -> "4 dequantize_per_channel_default" [style=solid, label="(5, 5)"]; +"3 quantize_per_channel_default" -> "4 dequantize_per_channel_default" [style=solid, label="(5, 5)"]; "4 dequantize_per_channel_default" -> "15 linear" [style=solid, label=None]; "5 linear_bias" -> "15 linear" [style=solid, label="(5,)"]; "6 _scale_1" -> "9 dequantize_per_channel_default_1" [style=solid, label="(10,)"]; "7 _zero_point_1" -> "9 dequantize_per_channel_default_1" [style=solid, label="(10,)"]; -"8 _frozen_param1" -> "9 dequantize_per_channel_default_1" [style=solid, label="(10, 5)"]; +"8 quantize_per_channel_default_1" -> "9 dequantize_per_channel_default_1" [style=solid, label="(10, 5)"]; "9 dequantize_per_channel_default_1" -> "18 linear_1" [style=solid, label=None]; "10 lm_head_bias" -> "18 linear_1" [style=solid, label="(10,)"]; "11 input_ids" -> "12 embedding" [style=solid, label="(5,)"]; diff --git a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/unet.dot b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/unet.dot index 252a3178e4f..53fcf8b1309 100644 --- a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/unet.dot +++ b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/unet.dot @@ -1,117 +1,117 @@ strict digraph { "0 _scale_0" [id=0, type="get_attr"]; "1 _zero_point_0" [id=1, type="get_attr"]; -"2 _frozen_param0" [id=2, type="get_attr"]; +"2 quantize_per_channel_default" [id=2, type="get_attr"]; "3 dequantize_per_channel_default" [id=3, type="dequantize_per_channel"]; "4 down_path_0_block_0_bias" [id=4, type="get_attr"]; "5 _scale_1" [id=5, type="get_attr"]; "6 _zero_point_1" [id=6, type="get_attr"]; -"7 _frozen_param1" [id=7, type="get_attr"]; +"7 quantize_per_channel_default_1" [id=7, type="get_attr"]; "8 dequantize_per_channel_default_1" [id=8, type="dequantize_per_channel"]; "9 down_path_0_block_3_bias" [id=9, type="get_attr"]; "10 _scale_2" [id=10, type="get_attr"]; "11 _zero_point_2" [id=11, 
type="get_attr"]; -"12 _frozen_param2" [id=12, type="get_attr"]; +"12 quantize_per_channel_default_2" [id=12, type="get_attr"]; "13 dequantize_per_channel_default_2" [id=13, type="dequantize_per_channel"]; "14 down_path_1_block_0_bias" [id=14, type="get_attr"]; "15 _scale_3" [id=15, type="get_attr"]; "16 _zero_point_3" [id=16, type="get_attr"]; -"17 _frozen_param3" [id=17, type="get_attr"]; +"17 quantize_per_channel_default_3" [id=17, type="get_attr"]; "18 dequantize_per_channel_default_3" [id=18, type="dequantize_per_channel"]; "19 down_path_1_block_3_bias" [id=19, type="get_attr"]; "20 _scale_4" [id=20, type="get_attr"]; "21 _zero_point_4" [id=21, type="get_attr"]; -"22 _frozen_param4" [id=22, type="get_attr"]; +"22 quantize_per_channel_default_4" [id=22, type="get_attr"]; "23 dequantize_per_channel_default_4" [id=23, type="dequantize_per_channel"]; "24 down_path_2_block_0_bias" [id=24, type="get_attr"]; "25 _scale_5" [id=25, type="get_attr"]; "26 _zero_point_5" [id=26, type="get_attr"]; -"27 _frozen_param5" [id=27, type="get_attr"]; +"27 quantize_per_channel_default_5" [id=27, type="get_attr"]; "28 dequantize_per_channel_default_5" [id=28, type="dequantize_per_channel"]; "29 down_path_2_block_3_bias" [id=29, type="get_attr"]; "30 _scale_6" [id=30, type="get_attr"]; "31 _zero_point_6" [id=31, type="get_attr"]; -"32 _frozen_param6" [id=32, type="get_attr"]; +"32 quantize_per_channel_default_6" [id=32, type="get_attr"]; "33 dequantize_per_channel_default_6" [id=33, type="dequantize_per_channel"]; "34 down_path_3_block_0_bias" [id=34, type="get_attr"]; "35 _scale_7" [id=35, type="get_attr"]; "36 _zero_point_7" [id=36, type="get_attr"]; -"37 _frozen_param7" [id=37, type="get_attr"]; +"37 quantize_per_channel_default_7" [id=37, type="get_attr"]; "38 dequantize_per_channel_default_7" [id=38, type="dequantize_per_channel"]; "39 down_path_3_block_3_bias" [id=39, type="get_attr"]; "40 _scale_8" [id=40, type="get_attr"]; "41 _zero_point_8" [id=41, type="get_attr"]; -"42 
_frozen_param8" [id=42, type="get_attr"]; +"42 quantize_per_channel_default_8" [id=42, type="get_attr"]; "43 dequantize_per_channel_default_8" [id=43, type="dequantize_per_channel"]; "44 down_path_4_block_0_bias" [id=44, type="get_attr"]; "45 _scale_9" [id=45, type="get_attr"]; "46 _zero_point_9" [id=46, type="get_attr"]; -"47 _frozen_param9" [id=47, type="get_attr"]; +"47 quantize_per_channel_default_9" [id=47, type="get_attr"]; "48 dequantize_per_channel_default_9" [id=48, type="dequantize_per_channel"]; "49 down_path_4_block_3_bias" [id=49, type="get_attr"]; "50 _scale_10" [id=50, type="get_attr"]; "51 _zero_point_10" [id=51, type="get_attr"]; -"52 _frozen_param10" [id=52, type="get_attr"]; +"52 quantize_per_channel_default_10" [id=52, type="get_attr"]; "53 dequantize_per_channel_default_10" [id=53, type="dequantize_per_channel"]; "54 up_path_0_up_bias" [id=54, type="get_attr"]; "55 _scale_11" [id=55, type="get_attr"]; "56 _zero_point_11" [id=56, type="get_attr"]; -"57 _frozen_param11" [id=57, type="get_attr"]; +"57 quantize_per_channel_default_11" [id=57, type="get_attr"]; "58 dequantize_per_channel_default_11" [id=58, type="dequantize_per_channel"]; "59 up_path_0_conv_block_block_0_bias" [id=59, type="get_attr"]; "60 _scale_12" [id=60, type="get_attr"]; "61 _zero_point_12" [id=61, type="get_attr"]; -"62 _frozen_param12" [id=62, type="get_attr"]; +"62 quantize_per_channel_default_12" [id=62, type="get_attr"]; "63 dequantize_per_channel_default_12" [id=63, type="dequantize_per_channel"]; "64 up_path_0_conv_block_block_3_bias" [id=64, type="get_attr"]; "65 _scale_13" [id=65, type="get_attr"]; "66 _zero_point_13" [id=66, type="get_attr"]; -"67 _frozen_param13" [id=67, type="get_attr"]; +"67 quantize_per_channel_default_13" [id=67, type="get_attr"]; "68 dequantize_per_channel_default_13" [id=68, type="dequantize_per_channel"]; "69 up_path_1_up_bias" [id=69, type="get_attr"]; "70 _scale_14" [id=70, type="get_attr"]; "71 _zero_point_14" [id=71, type="get_attr"]; -"72 
_frozen_param14" [id=72, type="get_attr"]; +"72 quantize_per_channel_default_14" [id=72, type="get_attr"]; "73 dequantize_per_channel_default_14" [id=73, type="dequantize_per_channel"]; "74 up_path_1_conv_block_block_0_bias" [id=74, type="get_attr"]; "75 _scale_15" [id=75, type="get_attr"]; "76 _zero_point_15" [id=76, type="get_attr"]; -"77 _frozen_param15" [id=77, type="get_attr"]; +"77 quantize_per_channel_default_15" [id=77, type="get_attr"]; "78 dequantize_per_channel_default_15" [id=78, type="dequantize_per_channel"]; "79 up_path_1_conv_block_block_3_bias" [id=79, type="get_attr"]; "80 _scale_16" [id=80, type="get_attr"]; "81 _zero_point_16" [id=81, type="get_attr"]; -"82 _frozen_param16" [id=82, type="get_attr"]; +"82 quantize_per_channel_default_16" [id=82, type="get_attr"]; "83 dequantize_per_channel_default_16" [id=83, type="dequantize_per_channel"]; "84 up_path_2_up_bias" [id=84, type="get_attr"]; "85 _scale_17" [id=85, type="get_attr"]; "86 _zero_point_17" [id=86, type="get_attr"]; -"87 _frozen_param17" [id=87, type="get_attr"]; +"87 quantize_per_channel_default_17" [id=87, type="get_attr"]; "88 dequantize_per_channel_default_17" [id=88, type="dequantize_per_channel"]; "89 up_path_2_conv_block_block_0_bias" [id=89, type="get_attr"]; "90 _scale_18" [id=90, type="get_attr"]; "91 _zero_point_18" [id=91, type="get_attr"]; -"92 _frozen_param18" [id=92, type="get_attr"]; +"92 quantize_per_channel_default_18" [id=92, type="get_attr"]; "93 dequantize_per_channel_default_18" [id=93, type="dequantize_per_channel"]; "94 up_path_2_conv_block_block_3_bias" [id=94, type="get_attr"]; "95 _scale_19" [id=95, type="get_attr"]; "96 _zero_point_19" [id=96, type="get_attr"]; -"97 _frozen_param19" [id=97, type="get_attr"]; +"97 quantize_per_channel_default_19" [id=97, type="get_attr"]; "98 dequantize_per_channel_default_19" [id=98, type="dequantize_per_channel"]; "99 up_path_3_up_bias" [id=99, type="get_attr"]; "100 _scale_20" [id=100, type="get_attr"]; "101 _zero_point_20" 
[id=101, type="get_attr"]; -"102 _frozen_param20" [id=102, type="get_attr"]; +"102 quantize_per_channel_default_20" [id=102, type="get_attr"]; "103 dequantize_per_channel_default_20" [id=103, type="dequantize_per_channel"]; "104 up_path_3_conv_block_block_0_bias" [id=104, type="get_attr"]; "105 _scale_21" [id=105, type="get_attr"]; "106 _zero_point_21" [id=106, type="get_attr"]; -"107 _frozen_param21" [id=107, type="get_attr"]; +"107 quantize_per_channel_default_21" [id=107, type="get_attr"]; "108 dequantize_per_channel_default_21" [id=108, type="dequantize_per_channel"]; "109 up_path_3_conv_block_block_3_bias" [id=109, type="get_attr"]; "110 _scale_22" [id=110, type="get_attr"]; "111 _zero_point_22" [id=111, type="get_attr"]; -"112 _frozen_param22" [id=112, type="get_attr"]; +"112 quantize_per_channel_default_22" [id=112, type="get_attr"]; "113 dequantize_per_channel_default_22" [id=113, type="dequantize_per_channel"]; "114 last_bias" [id=114, type="get_attr"]; "115 x" [id=115, type=input]; @@ -229,117 +229,117 @@ strict digraph { "227 output" [id=227, type=output]; "0 _scale_0" -> "3 dequantize_per_channel_default" [style=solid, label="(64,)"]; "1 _zero_point_0" -> "3 dequantize_per_channel_default" [style=solid, label="(64,)"]; -"2 _frozen_param0" -> "3 dequantize_per_channel_default" [style=solid, label="(64, 3, 3, 3)"]; +"2 quantize_per_channel_default" -> "3 dequantize_per_channel_default" [style=solid, label="(64, 3, 3, 3)"]; "3 dequantize_per_channel_default" -> "118 conv2d" [style=solid, label=None]; "4 down_path_0_block_0_bias" -> "118 conv2d" [style=solid, label="(64,)"]; "5 _scale_1" -> "8 dequantize_per_channel_default_1" [style=solid, label="(64,)"]; "6 _zero_point_1" -> "8 dequantize_per_channel_default_1" [style=solid, label="(64,)"]; -"7 _frozen_param1" -> "8 dequantize_per_channel_default_1" [style=solid, label="(64, 64, 3, 3)"]; +"7 quantize_per_channel_default_1" -> "8 dequantize_per_channel_default_1" [style=solid, label="(64, 64, 3, 3)"]; "8 
dequantize_per_channel_default_1" -> "122 conv2d_1" [style=solid, label=None]; "9 down_path_0_block_3_bias" -> "122 conv2d_1" [style=solid, label="(64,)"]; "10 _scale_2" -> "13 dequantize_per_channel_default_2" [style=solid, label="(128,)"]; "11 _zero_point_2" -> "13 dequantize_per_channel_default_2" [style=solid, label="(128,)"]; -"12 _frozen_param2" -> "13 dequantize_per_channel_default_2" [style=solid, label="(128, 64, 3, 3)"]; +"12 quantize_per_channel_default_2" -> "13 dequantize_per_channel_default_2" [style=solid, label="(128, 64, 3, 3)"]; "13 dequantize_per_channel_default_2" -> "127 conv2d_2" [style=solid, label=None]; "14 down_path_1_block_0_bias" -> "127 conv2d_2" [style=solid, label="(128,)"]; "15 _scale_3" -> "18 dequantize_per_channel_default_3" [style=solid, label="(128,)"]; "16 _zero_point_3" -> "18 dequantize_per_channel_default_3" [style=solid, label="(128,)"]; -"17 _frozen_param3" -> "18 dequantize_per_channel_default_3" [style=solid, label="(128, 128, 3, 3)"]; +"17 quantize_per_channel_default_3" -> "18 dequantize_per_channel_default_3" [style=solid, label="(128, 128, 3, 3)"]; "18 dequantize_per_channel_default_3" -> "131 conv2d_3" [style=solid, label=None]; "19 down_path_1_block_3_bias" -> "131 conv2d_3" [style=solid, label="(128,)"]; "20 _scale_4" -> "23 dequantize_per_channel_default_4" [style=solid, label="(256,)"]; "21 _zero_point_4" -> "23 dequantize_per_channel_default_4" [style=solid, label="(256,)"]; -"22 _frozen_param4" -> "23 dequantize_per_channel_default_4" [style=solid, label="(256, 128, 3, 3)"]; +"22 quantize_per_channel_default_4" -> "23 dequantize_per_channel_default_4" [style=solid, label="(256, 128, 3, 3)"]; "23 dequantize_per_channel_default_4" -> "136 conv2d_4" [style=solid, label=None]; "24 down_path_2_block_0_bias" -> "136 conv2d_4" [style=solid, label="(256,)"]; "25 _scale_5" -> "28 dequantize_per_channel_default_5" [style=solid, label="(256,)"]; "26 _zero_point_5" -> "28 dequantize_per_channel_default_5" [style=solid, 
label="(256,)"]; -"27 _frozen_param5" -> "28 dequantize_per_channel_default_5" [style=solid, label="(256, 256, 3, 3)"]; +"27 quantize_per_channel_default_5" -> "28 dequantize_per_channel_default_5" [style=solid, label="(256, 256, 3, 3)"]; "28 dequantize_per_channel_default_5" -> "140 conv2d_5" [style=solid, label=None]; "29 down_path_2_block_3_bias" -> "140 conv2d_5" [style=solid, label="(256,)"]; "30 _scale_6" -> "33 dequantize_per_channel_default_6" [style=solid, label="(512,)"]; "31 _zero_point_6" -> "33 dequantize_per_channel_default_6" [style=solid, label="(512,)"]; -"32 _frozen_param6" -> "33 dequantize_per_channel_default_6" [style=solid, label="(512, 256, 3, 3)"]; +"32 quantize_per_channel_default_6" -> "33 dequantize_per_channel_default_6" [style=solid, label="(512, 256, 3, 3)"]; "33 dequantize_per_channel_default_6" -> "145 conv2d_6" [style=solid, label=None]; "34 down_path_3_block_0_bias" -> "145 conv2d_6" [style=solid, label="(512,)"]; "35 _scale_7" -> "38 dequantize_per_channel_default_7" [style=solid, label="(512,)"]; "36 _zero_point_7" -> "38 dequantize_per_channel_default_7" [style=solid, label="(512,)"]; -"37 _frozen_param7" -> "38 dequantize_per_channel_default_7" [style=solid, label="(512, 512, 3, 3)"]; +"37 quantize_per_channel_default_7" -> "38 dequantize_per_channel_default_7" [style=solid, label="(512, 512, 3, 3)"]; "38 dequantize_per_channel_default_7" -> "149 conv2d_7" [style=solid, label=None]; "39 down_path_3_block_3_bias" -> "149 conv2d_7" [style=solid, label="(512,)"]; "40 _scale_8" -> "43 dequantize_per_channel_default_8" [style=solid, label="(1024,)"]; "41 _zero_point_8" -> "43 dequantize_per_channel_default_8" [style=solid, label="(1024,)"]; -"42 _frozen_param8" -> "43 dequantize_per_channel_default_8" [style=solid, label="(1024, 512, 3, 3)"]; +"42 quantize_per_channel_default_8" -> "43 dequantize_per_channel_default_8" [style=solid, label="(1024, 512, 3, 3)"]; "43 dequantize_per_channel_default_8" -> "154 conv2d_8" [style=solid, 
label=None]; "44 down_path_4_block_0_bias" -> "154 conv2d_8" [style=solid, label="(1024,)"]; "45 _scale_9" -> "48 dequantize_per_channel_default_9" [style=solid, label="(1024,)"]; "46 _zero_point_9" -> "48 dequantize_per_channel_default_9" [style=solid, label="(1024,)"]; -"47 _frozen_param9" -> "48 dequantize_per_channel_default_9" [style=solid, label="(1024, 1024, 3, 3)"]; +"47 quantize_per_channel_default_9" -> "48 dequantize_per_channel_default_9" [style=solid, label="(1024, 1024, 3, 3)"]; "48 dequantize_per_channel_default_9" -> "158 conv2d_9" [style=solid, label=None]; "49 down_path_4_block_3_bias" -> "158 conv2d_9" [style=solid, label="(1024,)"]; "50 _scale_10" -> "53 dequantize_per_channel_default_10" [style=solid, label="(1024,)"]; "51 _zero_point_10" -> "53 dequantize_per_channel_default_10" [style=solid, label="(1024,)"]; -"52 _frozen_param10" -> "53 dequantize_per_channel_default_10" [style=solid, label="(1024, 512, 2, 2)"]; +"52 quantize_per_channel_default_10" -> "53 dequantize_per_channel_default_10" [style=solid, label="(1024, 512, 2, 2)"]; "53 dequantize_per_channel_default_10" -> "162 conv_transpose2d" [style=solid, label=None]; "54 up_path_0_up_bias" -> "162 conv_transpose2d" [style=solid, label="(512,)"]; "55 _scale_11" -> "58 dequantize_per_channel_default_11" [style=solid, label="(512,)"]; "56 _zero_point_11" -> "58 dequantize_per_channel_default_11" [style=solid, label="(512,)"]; -"57 _frozen_param11" -> "58 dequantize_per_channel_default_11" [style=solid, label="(512, 1024, 3, 3)"]; +"57 quantize_per_channel_default_11" -> "58 dequantize_per_channel_default_11" [style=solid, label="(512, 1024, 3, 3)"]; "58 dequantize_per_channel_default_11" -> "170 conv2d_10" [style=solid, label=None]; "59 up_path_0_conv_block_block_0_bias" -> "170 conv2d_10" [style=solid, label="(512,)"]; "60 _scale_12" -> "63 dequantize_per_channel_default_12" [style=solid, label="(512,)"]; "61 _zero_point_12" -> "63 dequantize_per_channel_default_12" [style=solid, 
label="(512,)"]; -"62 _frozen_param12" -> "63 dequantize_per_channel_default_12" [style=solid, label="(512, 512, 3, 3)"]; +"62 quantize_per_channel_default_12" -> "63 dequantize_per_channel_default_12" [style=solid, label="(512, 512, 3, 3)"]; "63 dequantize_per_channel_default_12" -> "174 conv2d_11" [style=solid, label=None]; "64 up_path_0_conv_block_block_3_bias" -> "174 conv2d_11" [style=solid, label="(512,)"]; "65 _scale_13" -> "68 dequantize_per_channel_default_13" [style=solid, label="(512,)"]; "66 _zero_point_13" -> "68 dequantize_per_channel_default_13" [style=solid, label="(512,)"]; -"67 _frozen_param13" -> "68 dequantize_per_channel_default_13" [style=solid, label="(512, 256, 2, 2)"]; +"67 quantize_per_channel_default_13" -> "68 dequantize_per_channel_default_13" [style=solid, label="(512, 256, 2, 2)"]; "68 dequantize_per_channel_default_13" -> "178 conv_transpose2d_1" [style=solid, label=None]; "69 up_path_1_up_bias" -> "178 conv_transpose2d_1" [style=solid, label="(256,)"]; "70 _scale_14" -> "73 dequantize_per_channel_default_14" [style=solid, label="(256,)"]; "71 _zero_point_14" -> "73 dequantize_per_channel_default_14" [style=solid, label="(256,)"]; -"72 _frozen_param14" -> "73 dequantize_per_channel_default_14" [style=solid, label="(256, 512, 3, 3)"]; +"72 quantize_per_channel_default_14" -> "73 dequantize_per_channel_default_14" [style=solid, label="(256, 512, 3, 3)"]; "73 dequantize_per_channel_default_14" -> "186 conv2d_12" [style=solid, label=None]; "74 up_path_1_conv_block_block_0_bias" -> "186 conv2d_12" [style=solid, label="(256,)"]; "75 _scale_15" -> "78 dequantize_per_channel_default_15" [style=solid, label="(256,)"]; "76 _zero_point_15" -> "78 dequantize_per_channel_default_15" [style=solid, label="(256,)"]; -"77 _frozen_param15" -> "78 dequantize_per_channel_default_15" [style=solid, label="(256, 256, 3, 3)"]; +"77 quantize_per_channel_default_15" -> "78 dequantize_per_channel_default_15" [style=solid, label="(256, 256, 3, 3)"]; "78 
dequantize_per_channel_default_15" -> "190 conv2d_13" [style=solid, label=None]; "79 up_path_1_conv_block_block_3_bias" -> "190 conv2d_13" [style=solid, label="(256,)"]; "80 _scale_16" -> "83 dequantize_per_channel_default_16" [style=solid, label="(256,)"]; "81 _zero_point_16" -> "83 dequantize_per_channel_default_16" [style=solid, label="(256,)"]; -"82 _frozen_param16" -> "83 dequantize_per_channel_default_16" [style=solid, label="(256, 128, 2, 2)"]; +"82 quantize_per_channel_default_16" -> "83 dequantize_per_channel_default_16" [style=solid, label="(256, 128, 2, 2)"]; "83 dequantize_per_channel_default_16" -> "194 conv_transpose2d_2" [style=solid, label=None]; "84 up_path_2_up_bias" -> "194 conv_transpose2d_2" [style=solid, label="(128,)"]; "85 _scale_17" -> "88 dequantize_per_channel_default_17" [style=solid, label="(128,)"]; "86 _zero_point_17" -> "88 dequantize_per_channel_default_17" [style=solid, label="(128,)"]; -"87 _frozen_param17" -> "88 dequantize_per_channel_default_17" [style=solid, label="(128, 256, 3, 3)"]; +"87 quantize_per_channel_default_17" -> "88 dequantize_per_channel_default_17" [style=solid, label="(128, 256, 3, 3)"]; "88 dequantize_per_channel_default_17" -> "202 conv2d_14" [style=solid, label=None]; "89 up_path_2_conv_block_block_0_bias" -> "202 conv2d_14" [style=solid, label="(128,)"]; "90 _scale_18" -> "93 dequantize_per_channel_default_18" [style=solid, label="(128,)"]; "91 _zero_point_18" -> "93 dequantize_per_channel_default_18" [style=solid, label="(128,)"]; -"92 _frozen_param18" -> "93 dequantize_per_channel_default_18" [style=solid, label="(128, 128, 3, 3)"]; +"92 quantize_per_channel_default_18" -> "93 dequantize_per_channel_default_18" [style=solid, label="(128, 128, 3, 3)"]; "93 dequantize_per_channel_default_18" -> "206 conv2d_15" [style=solid, label=None]; "94 up_path_2_conv_block_block_3_bias" -> "206 conv2d_15" [style=solid, label="(128,)"]; "95 _scale_19" -> "98 dequantize_per_channel_default_19" [style=solid, 
label="(128,)"]; "96 _zero_point_19" -> "98 dequantize_per_channel_default_19" [style=solid, label="(128,)"]; -"97 _frozen_param19" -> "98 dequantize_per_channel_default_19" [style=solid, label="(128, 64, 2, 2)"]; +"97 quantize_per_channel_default_19" -> "98 dequantize_per_channel_default_19" [style=solid, label="(128, 64, 2, 2)"]; "98 dequantize_per_channel_default_19" -> "210 conv_transpose2d_3" [style=solid, label=None]; "99 up_path_3_up_bias" -> "210 conv_transpose2d_3" [style=solid, label="(64,)"]; "100 _scale_20" -> "103 dequantize_per_channel_default_20" [style=solid, label="(64,)"]; "101 _zero_point_20" -> "103 dequantize_per_channel_default_20" [style=solid, label="(64,)"]; -"102 _frozen_param20" -> "103 dequantize_per_channel_default_20" [style=solid, label="(64, 128, 3, 3)"]; +"102 quantize_per_channel_default_20" -> "103 dequantize_per_channel_default_20" [style=solid, label="(64, 128, 3, 3)"]; "103 dequantize_per_channel_default_20" -> "218 conv2d_16" [style=solid, label=None]; "104 up_path_3_conv_block_block_0_bias" -> "218 conv2d_16" [style=solid, label="(64,)"]; "105 _scale_21" -> "108 dequantize_per_channel_default_21" [style=solid, label="(64,)"]; "106 _zero_point_21" -> "108 dequantize_per_channel_default_21" [style=solid, label="(64,)"]; -"107 _frozen_param21" -> "108 dequantize_per_channel_default_21" [style=solid, label="(64, 64, 3, 3)"]; +"107 quantize_per_channel_default_21" -> "108 dequantize_per_channel_default_21" [style=solid, label="(64, 64, 3, 3)"]; "108 dequantize_per_channel_default_21" -> "222 conv2d_17" [style=solid, label=None]; "109 up_path_3_conv_block_block_3_bias" -> "222 conv2d_17" [style=solid, label="(64,)"]; "110 _scale_22" -> "113 dequantize_per_channel_default_22" [style=solid, label="(12,)"]; "111 _zero_point_22" -> "113 dequantize_per_channel_default_22" [style=solid, label="(12,)"]; -"112 _frozen_param22" -> "113 dequantize_per_channel_default_22" [style=solid, label="(12, 64, 1, 1)"]; +"112 
quantize_per_channel_default_22" -> "113 dequantize_per_channel_default_22" [style=solid, label="(12, 64, 1, 1)"]; "113 dequantize_per_channel_default_22" -> "226 conv2d_18" [style=solid, label=None]; "114 last_bias" -> "226 conv2d_18" [style=solid, label="(12,)"]; "115 x" -> "116 quantize_per_tensor_default" [style=solid, label="(1, 3, 224, 224)"]; diff --git a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/vit_b_16.dot b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/vit_b_16.dot index 5051830b542..7e5a3aa0c54 100644 --- a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/vit_b_16.dot +++ b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/vit_b_16.dot @@ -3,302 +3,302 @@ strict digraph { "1 encoder_pos_embedding" [id=1, type="get_attr"]; "2 _scale_0" [id=2, type="get_attr"]; "3 _zero_point_0" [id=3, type="get_attr"]; -"4 _frozen_param0" [id=4, type="get_attr"]; +"4 quantize_per_channel_default" [id=4, type="get_attr"]; "5 dequantize_per_channel_default" [id=5, type="dequantize_per_channel"]; "6 conv_proj_bias" [id=6, type="get_attr"]; "7 encoder_layers_encoder_layer_0_ln_1_weight" [id=7, type="get_attr"]; "8 encoder_layers_encoder_layer_0_ln_1_bias" [id=8, type="get_attr"]; "9 _scale_1" [id=9, type="get_attr"]; "10 _zero_point_1" [id=10, type="get_attr"]; -"11 _frozen_param1" [id=11, type="get_attr"]; +"11 quantize_per_channel_default_1" [id=11, type="get_attr"]; "12 dequantize_per_channel_default_1" [id=12, type="dequantize_per_channel"]; "13 encoder_layers_encoder_layer_0_self_attention_in_proj_bias" [id=13, type="get_attr"]; "14 _scale_2" [id=14, type="get_attr"]; "15 _zero_point_2" [id=15, type="get_attr"]; -"16 _frozen_param2" [id=16, type="get_attr"]; +"16 quantize_per_channel_default_2" [id=16, type="get_attr"]; "17 dequantize_per_channel_default_2" [id=17, type="dequantize_per_channel"]; "18 encoder_layers_encoder_layer_0_self_attention_out_proj_bias" [id=18, type="get_attr"]; "19 
encoder_layers_encoder_layer_0_ln_2_weight" [id=19, type="get_attr"]; "20 encoder_layers_encoder_layer_0_ln_2_bias" [id=20, type="get_attr"]; "21 _scale_3" [id=21, type="get_attr"]; "22 _zero_point_3" [id=22, type="get_attr"]; -"23 _frozen_param3" [id=23, type="get_attr"]; +"23 quantize_per_channel_default_3" [id=23, type="get_attr"]; "24 dequantize_per_channel_default_3" [id=24, type="dequantize_per_channel"]; "25 encoder_layers_encoder_layer_0_mlp_0_bias" [id=25, type="get_attr"]; "26 _scale_4" [id=26, type="get_attr"]; "27 _zero_point_4" [id=27, type="get_attr"]; -"28 _frozen_param4" [id=28, type="get_attr"]; +"28 quantize_per_channel_default_4" [id=28, type="get_attr"]; "29 dequantize_per_channel_default_4" [id=29, type="dequantize_per_channel"]; "30 encoder_layers_encoder_layer_0_mlp_3_bias" [id=30, type="get_attr"]; "31 encoder_layers_encoder_layer_1_ln_1_weight" [id=31, type="get_attr"]; "32 encoder_layers_encoder_layer_1_ln_1_bias" [id=32, type="get_attr"]; "33 _scale_5" [id=33, type="get_attr"]; "34 _zero_point_5" [id=34, type="get_attr"]; -"35 _frozen_param5" [id=35, type="get_attr"]; +"35 quantize_per_channel_default_5" [id=35, type="get_attr"]; "36 dequantize_per_channel_default_5" [id=36, type="dequantize_per_channel"]; "37 encoder_layers_encoder_layer_1_self_attention_in_proj_bias" [id=37, type="get_attr"]; "38 _scale_6" [id=38, type="get_attr"]; "39 _zero_point_6" [id=39, type="get_attr"]; -"40 _frozen_param6" [id=40, type="get_attr"]; +"40 quantize_per_channel_default_6" [id=40, type="get_attr"]; "41 dequantize_per_channel_default_6" [id=41, type="dequantize_per_channel"]; "42 encoder_layers_encoder_layer_1_self_attention_out_proj_bias" [id=42, type="get_attr"]; "43 encoder_layers_encoder_layer_1_ln_2_weight" [id=43, type="get_attr"]; "44 encoder_layers_encoder_layer_1_ln_2_bias" [id=44, type="get_attr"]; "45 _scale_7" [id=45, type="get_attr"]; "46 _zero_point_7" [id=46, type="get_attr"]; -"47 _frozen_param7" [id=47, type="get_attr"]; +"47 
quantize_per_channel_default_7" [id=47, type="get_attr"]; "48 dequantize_per_channel_default_7" [id=48, type="dequantize_per_channel"]; "49 encoder_layers_encoder_layer_1_mlp_0_bias" [id=49, type="get_attr"]; "50 _scale_8" [id=50, type="get_attr"]; "51 _zero_point_8" [id=51, type="get_attr"]; -"52 _frozen_param8" [id=52, type="get_attr"]; +"52 quantize_per_channel_default_8" [id=52, type="get_attr"]; "53 dequantize_per_channel_default_8" [id=53, type="dequantize_per_channel"]; "54 encoder_layers_encoder_layer_1_mlp_3_bias" [id=54, type="get_attr"]; "55 encoder_layers_encoder_layer_2_ln_1_weight" [id=55, type="get_attr"]; "56 encoder_layers_encoder_layer_2_ln_1_bias" [id=56, type="get_attr"]; "57 _scale_9" [id=57, type="get_attr"]; "58 _zero_point_9" [id=58, type="get_attr"]; -"59 _frozen_param9" [id=59, type="get_attr"]; +"59 quantize_per_channel_default_9" [id=59, type="get_attr"]; "60 dequantize_per_channel_default_9" [id=60, type="dequantize_per_channel"]; "61 encoder_layers_encoder_layer_2_self_attention_in_proj_bias" [id=61, type="get_attr"]; "62 _scale_10" [id=62, type="get_attr"]; "63 _zero_point_10" [id=63, type="get_attr"]; -"64 _frozen_param10" [id=64, type="get_attr"]; +"64 quantize_per_channel_default_10" [id=64, type="get_attr"]; "65 dequantize_per_channel_default_10" [id=65, type="dequantize_per_channel"]; "66 encoder_layers_encoder_layer_2_self_attention_out_proj_bias" [id=66, type="get_attr"]; "67 encoder_layers_encoder_layer_2_ln_2_weight" [id=67, type="get_attr"]; "68 encoder_layers_encoder_layer_2_ln_2_bias" [id=68, type="get_attr"]; "69 _scale_11" [id=69, type="get_attr"]; "70 _zero_point_11" [id=70, type="get_attr"]; -"71 _frozen_param11" [id=71, type="get_attr"]; +"71 quantize_per_channel_default_11" [id=71, type="get_attr"]; "72 dequantize_per_channel_default_11" [id=72, type="dequantize_per_channel"]; "73 encoder_layers_encoder_layer_2_mlp_0_bias" [id=73, type="get_attr"]; "74 _scale_12" [id=74, type="get_attr"]; "75 _zero_point_12" [id=75, 
type="get_attr"]; -"76 _frozen_param12" [id=76, type="get_attr"]; +"76 quantize_per_channel_default_12" [id=76, type="get_attr"]; "77 dequantize_per_channel_default_12" [id=77, type="dequantize_per_channel"]; "78 encoder_layers_encoder_layer_2_mlp_3_bias" [id=78, type="get_attr"]; "79 encoder_layers_encoder_layer_3_ln_1_weight" [id=79, type="get_attr"]; "80 encoder_layers_encoder_layer_3_ln_1_bias" [id=80, type="get_attr"]; "81 _scale_13" [id=81, type="get_attr"]; "82 _zero_point_13" [id=82, type="get_attr"]; -"83 _frozen_param13" [id=83, type="get_attr"]; +"83 quantize_per_channel_default_13" [id=83, type="get_attr"]; "84 dequantize_per_channel_default_13" [id=84, type="dequantize_per_channel"]; "85 encoder_layers_encoder_layer_3_self_attention_in_proj_bias" [id=85, type="get_attr"]; "86 _scale_14" [id=86, type="get_attr"]; "87 _zero_point_14" [id=87, type="get_attr"]; -"88 _frozen_param14" [id=88, type="get_attr"]; +"88 quantize_per_channel_default_14" [id=88, type="get_attr"]; "89 dequantize_per_channel_default_14" [id=89, type="dequantize_per_channel"]; "90 encoder_layers_encoder_layer_3_self_attention_out_proj_bias" [id=90, type="get_attr"]; "91 encoder_layers_encoder_layer_3_ln_2_weight" [id=91, type="get_attr"]; "92 encoder_layers_encoder_layer_3_ln_2_bias" [id=92, type="get_attr"]; "93 _scale_15" [id=93, type="get_attr"]; "94 _zero_point_15" [id=94, type="get_attr"]; -"95 _frozen_param15" [id=95, type="get_attr"]; +"95 quantize_per_channel_default_15" [id=95, type="get_attr"]; "96 dequantize_per_channel_default_15" [id=96, type="dequantize_per_channel"]; "97 encoder_layers_encoder_layer_3_mlp_0_bias" [id=97, type="get_attr"]; "98 _scale_16" [id=98, type="get_attr"]; "99 _zero_point_16" [id=99, type="get_attr"]; -"100 _frozen_param16" [id=100, type="get_attr"]; +"100 quantize_per_channel_default_16" [id=100, type="get_attr"]; "101 dequantize_per_channel_default_16" [id=101, type="dequantize_per_channel"]; "102 encoder_layers_encoder_layer_3_mlp_3_bias" 
[id=102, type="get_attr"]; "103 encoder_layers_encoder_layer_4_ln_1_weight" [id=103, type="get_attr"]; "104 encoder_layers_encoder_layer_4_ln_1_bias" [id=104, type="get_attr"]; "105 _scale_17" [id=105, type="get_attr"]; "106 _zero_point_17" [id=106, type="get_attr"]; -"107 _frozen_param17" [id=107, type="get_attr"]; +"107 quantize_per_channel_default_17" [id=107, type="get_attr"]; "108 dequantize_per_channel_default_17" [id=108, type="dequantize_per_channel"]; "109 encoder_layers_encoder_layer_4_self_attention_in_proj_bias" [id=109, type="get_attr"]; "110 _scale_18" [id=110, type="get_attr"]; "111 _zero_point_18" [id=111, type="get_attr"]; -"112 _frozen_param18" [id=112, type="get_attr"]; +"112 quantize_per_channel_default_18" [id=112, type="get_attr"]; "113 dequantize_per_channel_default_18" [id=113, type="dequantize_per_channel"]; "114 encoder_layers_encoder_layer_4_self_attention_out_proj_bias" [id=114, type="get_attr"]; "115 encoder_layers_encoder_layer_4_ln_2_weight" [id=115, type="get_attr"]; "116 encoder_layers_encoder_layer_4_ln_2_bias" [id=116, type="get_attr"]; "117 _scale_19" [id=117, type="get_attr"]; "118 _zero_point_19" [id=118, type="get_attr"]; -"119 _frozen_param19" [id=119, type="get_attr"]; +"119 quantize_per_channel_default_19" [id=119, type="get_attr"]; "120 dequantize_per_channel_default_19" [id=120, type="dequantize_per_channel"]; "121 encoder_layers_encoder_layer_4_mlp_0_bias" [id=121, type="get_attr"]; "122 _scale_20" [id=122, type="get_attr"]; "123 _zero_point_20" [id=123, type="get_attr"]; -"124 _frozen_param20" [id=124, type="get_attr"]; +"124 quantize_per_channel_default_20" [id=124, type="get_attr"]; "125 dequantize_per_channel_default_20" [id=125, type="dequantize_per_channel"]; "126 encoder_layers_encoder_layer_4_mlp_3_bias" [id=126, type="get_attr"]; "127 encoder_layers_encoder_layer_5_ln_1_weight" [id=127, type="get_attr"]; "128 encoder_layers_encoder_layer_5_ln_1_bias" [id=128, type="get_attr"]; "129 _scale_21" [id=129, 
type="get_attr"]; "130 _zero_point_21" [id=130, type="get_attr"]; -"131 _frozen_param21" [id=131, type="get_attr"]; +"131 quantize_per_channel_default_21" [id=131, type="get_attr"]; "132 dequantize_per_channel_default_21" [id=132, type="dequantize_per_channel"]; "133 encoder_layers_encoder_layer_5_self_attention_in_proj_bias" [id=133, type="get_attr"]; "134 _scale_22" [id=134, type="get_attr"]; "135 _zero_point_22" [id=135, type="get_attr"]; -"136 _frozen_param22" [id=136, type="get_attr"]; +"136 quantize_per_channel_default_22" [id=136, type="get_attr"]; "137 dequantize_per_channel_default_22" [id=137, type="dequantize_per_channel"]; "138 encoder_layers_encoder_layer_5_self_attention_out_proj_bias" [id=138, type="get_attr"]; "139 encoder_layers_encoder_layer_5_ln_2_weight" [id=139, type="get_attr"]; "140 encoder_layers_encoder_layer_5_ln_2_bias" [id=140, type="get_attr"]; "141 _scale_23" [id=141, type="get_attr"]; "142 _zero_point_23" [id=142, type="get_attr"]; -"143 _frozen_param23" [id=143, type="get_attr"]; +"143 quantize_per_channel_default_23" [id=143, type="get_attr"]; "144 dequantize_per_channel_default_23" [id=144, type="dequantize_per_channel"]; "145 encoder_layers_encoder_layer_5_mlp_0_bias" [id=145, type="get_attr"]; "146 _scale_24" [id=146, type="get_attr"]; "147 _zero_point_24" [id=147, type="get_attr"]; -"148 _frozen_param24" [id=148, type="get_attr"]; +"148 quantize_per_channel_default_24" [id=148, type="get_attr"]; "149 dequantize_per_channel_default_24" [id=149, type="dequantize_per_channel"]; "150 encoder_layers_encoder_layer_5_mlp_3_bias" [id=150, type="get_attr"]; "151 encoder_layers_encoder_layer_6_ln_1_weight" [id=151, type="get_attr"]; "152 encoder_layers_encoder_layer_6_ln_1_bias" [id=152, type="get_attr"]; "153 _scale_25" [id=153, type="get_attr"]; "154 _zero_point_25" [id=154, type="get_attr"]; -"155 _frozen_param25" [id=155, type="get_attr"]; +"155 quantize_per_channel_default_25" [id=155, type="get_attr"]; "156 
dequantize_per_channel_default_25" [id=156, type="dequantize_per_channel"]; "157 encoder_layers_encoder_layer_6_self_attention_in_proj_bias" [id=157, type="get_attr"]; "158 _scale_26" [id=158, type="get_attr"]; "159 _zero_point_26" [id=159, type="get_attr"]; -"160 _frozen_param26" [id=160, type="get_attr"]; +"160 quantize_per_channel_default_26" [id=160, type="get_attr"]; "161 dequantize_per_channel_default_26" [id=161, type="dequantize_per_channel"]; "162 encoder_layers_encoder_layer_6_self_attention_out_proj_bias" [id=162, type="get_attr"]; "163 encoder_layers_encoder_layer_6_ln_2_weight" [id=163, type="get_attr"]; "164 encoder_layers_encoder_layer_6_ln_2_bias" [id=164, type="get_attr"]; "165 _scale_27" [id=165, type="get_attr"]; "166 _zero_point_27" [id=166, type="get_attr"]; -"167 _frozen_param27" [id=167, type="get_attr"]; +"167 quantize_per_channel_default_27" [id=167, type="get_attr"]; "168 dequantize_per_channel_default_27" [id=168, type="dequantize_per_channel"]; "169 encoder_layers_encoder_layer_6_mlp_0_bias" [id=169, type="get_attr"]; "170 _scale_28" [id=170, type="get_attr"]; "171 _zero_point_28" [id=171, type="get_attr"]; -"172 _frozen_param28" [id=172, type="get_attr"]; +"172 quantize_per_channel_default_28" [id=172, type="get_attr"]; "173 dequantize_per_channel_default_28" [id=173, type="dequantize_per_channel"]; "174 encoder_layers_encoder_layer_6_mlp_3_bias" [id=174, type="get_attr"]; "175 encoder_layers_encoder_layer_7_ln_1_weight" [id=175, type="get_attr"]; "176 encoder_layers_encoder_layer_7_ln_1_bias" [id=176, type="get_attr"]; "177 _scale_29" [id=177, type="get_attr"]; "178 _zero_point_29" [id=178, type="get_attr"]; -"179 _frozen_param29" [id=179, type="get_attr"]; +"179 quantize_per_channel_default_29" [id=179, type="get_attr"]; "180 dequantize_per_channel_default_29" [id=180, type="dequantize_per_channel"]; "181 encoder_layers_encoder_layer_7_self_attention_in_proj_bias" [id=181, type="get_attr"]; "182 _scale_30" [id=182, type="get_attr"]; 
"183 _zero_point_30" [id=183, type="get_attr"]; -"184 _frozen_param30" [id=184, type="get_attr"]; +"184 quantize_per_channel_default_30" [id=184, type="get_attr"]; "185 dequantize_per_channel_default_30" [id=185, type="dequantize_per_channel"]; "186 encoder_layers_encoder_layer_7_self_attention_out_proj_bias" [id=186, type="get_attr"]; "187 encoder_layers_encoder_layer_7_ln_2_weight" [id=187, type="get_attr"]; "188 encoder_layers_encoder_layer_7_ln_2_bias" [id=188, type="get_attr"]; "189 _scale_31" [id=189, type="get_attr"]; "190 _zero_point_31" [id=190, type="get_attr"]; -"191 _frozen_param31" [id=191, type="get_attr"]; +"191 quantize_per_channel_default_31" [id=191, type="get_attr"]; "192 dequantize_per_channel_default_31" [id=192, type="dequantize_per_channel"]; "193 encoder_layers_encoder_layer_7_mlp_0_bias" [id=193, type="get_attr"]; "194 _scale_32" [id=194, type="get_attr"]; "195 _zero_point_32" [id=195, type="get_attr"]; -"196 _frozen_param32" [id=196, type="get_attr"]; +"196 quantize_per_channel_default_32" [id=196, type="get_attr"]; "197 dequantize_per_channel_default_32" [id=197, type="dequantize_per_channel"]; "198 encoder_layers_encoder_layer_7_mlp_3_bias" [id=198, type="get_attr"]; "199 encoder_layers_encoder_layer_8_ln_1_weight" [id=199, type="get_attr"]; "200 encoder_layers_encoder_layer_8_ln_1_bias" [id=200, type="get_attr"]; "201 _scale_33" [id=201, type="get_attr"]; "202 _zero_point_33" [id=202, type="get_attr"]; -"203 _frozen_param33" [id=203, type="get_attr"]; +"203 quantize_per_channel_default_33" [id=203, type="get_attr"]; "204 dequantize_per_channel_default_33" [id=204, type="dequantize_per_channel"]; "205 encoder_layers_encoder_layer_8_self_attention_in_proj_bias" [id=205, type="get_attr"]; "206 _scale_34" [id=206, type="get_attr"]; "207 _zero_point_34" [id=207, type="get_attr"]; -"208 _frozen_param34" [id=208, type="get_attr"]; +"208 quantize_per_channel_default_34" [id=208, type="get_attr"]; "209 dequantize_per_channel_default_34" [id=209, 
type="dequantize_per_channel"]; "210 encoder_layers_encoder_layer_8_self_attention_out_proj_bias" [id=210, type="get_attr"]; "211 encoder_layers_encoder_layer_8_ln_2_weight" [id=211, type="get_attr"]; "212 encoder_layers_encoder_layer_8_ln_2_bias" [id=212, type="get_attr"]; "213 _scale_35" [id=213, type="get_attr"]; "214 _zero_point_35" [id=214, type="get_attr"]; -"215 _frozen_param35" [id=215, type="get_attr"]; +"215 quantize_per_channel_default_35" [id=215, type="get_attr"]; "216 dequantize_per_channel_default_35" [id=216, type="dequantize_per_channel"]; "217 encoder_layers_encoder_layer_8_mlp_0_bias" [id=217, type="get_attr"]; "218 _scale_36" [id=218, type="get_attr"]; "219 _zero_point_36" [id=219, type="get_attr"]; -"220 _frozen_param36" [id=220, type="get_attr"]; +"220 quantize_per_channel_default_36" [id=220, type="get_attr"]; "221 dequantize_per_channel_default_36" [id=221, type="dequantize_per_channel"]; "222 encoder_layers_encoder_layer_8_mlp_3_bias" [id=222, type="get_attr"]; "223 encoder_layers_encoder_layer_9_ln_1_weight" [id=223, type="get_attr"]; "224 encoder_layers_encoder_layer_9_ln_1_bias" [id=224, type="get_attr"]; "225 _scale_37" [id=225, type="get_attr"]; "226 _zero_point_37" [id=226, type="get_attr"]; -"227 _frozen_param37" [id=227, type="get_attr"]; +"227 quantize_per_channel_default_37" [id=227, type="get_attr"]; "228 dequantize_per_channel_default_37" [id=228, type="dequantize_per_channel"]; "229 encoder_layers_encoder_layer_9_self_attention_in_proj_bias" [id=229, type="get_attr"]; "230 _scale_38" [id=230, type="get_attr"]; "231 _zero_point_38" [id=231, type="get_attr"]; -"232 _frozen_param38" [id=232, type="get_attr"]; +"232 quantize_per_channel_default_38" [id=232, type="get_attr"]; "233 dequantize_per_channel_default_38" [id=233, type="dequantize_per_channel"]; "234 encoder_layers_encoder_layer_9_self_attention_out_proj_bias" [id=234, type="get_attr"]; "235 encoder_layers_encoder_layer_9_ln_2_weight" [id=235, type="get_attr"]; "236 
encoder_layers_encoder_layer_9_ln_2_bias" [id=236, type="get_attr"]; "237 _scale_39" [id=237, type="get_attr"]; "238 _zero_point_39" [id=238, type="get_attr"]; -"239 _frozen_param39" [id=239, type="get_attr"]; +"239 quantize_per_channel_default_39" [id=239, type="get_attr"]; "240 dequantize_per_channel_default_39" [id=240, type="dequantize_per_channel"]; "241 encoder_layers_encoder_layer_9_mlp_0_bias" [id=241, type="get_attr"]; "242 _scale_40" [id=242, type="get_attr"]; "243 _zero_point_40" [id=243, type="get_attr"]; -"244 _frozen_param40" [id=244, type="get_attr"]; +"244 quantize_per_channel_default_40" [id=244, type="get_attr"]; "245 dequantize_per_channel_default_40" [id=245, type="dequantize_per_channel"]; "246 encoder_layers_encoder_layer_9_mlp_3_bias" [id=246, type="get_attr"]; "247 encoder_layers_encoder_layer_10_ln_1_weight" [id=247, type="get_attr"]; "248 encoder_layers_encoder_layer_10_ln_1_bias" [id=248, type="get_attr"]; "249 _scale_41" [id=249, type="get_attr"]; "250 _zero_point_41" [id=250, type="get_attr"]; -"251 _frozen_param41" [id=251, type="get_attr"]; +"251 quantize_per_channel_default_41" [id=251, type="get_attr"]; "252 dequantize_per_channel_default_41" [id=252, type="dequantize_per_channel"]; "253 encoder_layers_encoder_layer_10_self_attention_in_proj_bias" [id=253, type="get_attr"]; "254 _scale_42" [id=254, type="get_attr"]; "255 _zero_point_42" [id=255, type="get_attr"]; -"256 _frozen_param42" [id=256, type="get_attr"]; +"256 quantize_per_channel_default_42" [id=256, type="get_attr"]; "257 dequantize_per_channel_default_42" [id=257, type="dequantize_per_channel"]; "258 encoder_layers_encoder_layer_10_self_attention_out_proj_bias" [id=258, type="get_attr"]; "259 encoder_layers_encoder_layer_10_ln_2_weight" [id=259, type="get_attr"]; "260 encoder_layers_encoder_layer_10_ln_2_bias" [id=260, type="get_attr"]; "261 _scale_43" [id=261, type="get_attr"]; "262 _zero_point_43" [id=262, type="get_attr"]; -"263 _frozen_param43" [id=263, 
type="get_attr"]; +"263 quantize_per_channel_default_43" [id=263, type="get_attr"]; "264 dequantize_per_channel_default_43" [id=264, type="dequantize_per_channel"]; "265 encoder_layers_encoder_layer_10_mlp_0_bias" [id=265, type="get_attr"]; "266 _scale_44" [id=266, type="get_attr"]; "267 _zero_point_44" [id=267, type="get_attr"]; -"268 _frozen_param44" [id=268, type="get_attr"]; +"268 quantize_per_channel_default_44" [id=268, type="get_attr"]; "269 dequantize_per_channel_default_44" [id=269, type="dequantize_per_channel"]; "270 encoder_layers_encoder_layer_10_mlp_3_bias" [id=270, type="get_attr"]; "271 encoder_layers_encoder_layer_11_ln_1_weight" [id=271, type="get_attr"]; "272 encoder_layers_encoder_layer_11_ln_1_bias" [id=272, type="get_attr"]; "273 _scale_45" [id=273, type="get_attr"]; "274 _zero_point_45" [id=274, type="get_attr"]; -"275 _frozen_param45" [id=275, type="get_attr"]; +"275 quantize_per_channel_default_45" [id=275, type="get_attr"]; "276 dequantize_per_channel_default_45" [id=276, type="dequantize_per_channel"]; "277 encoder_layers_encoder_layer_11_self_attention_in_proj_bias" [id=277, type="get_attr"]; "278 _scale_46" [id=278, type="get_attr"]; "279 _zero_point_46" [id=279, type="get_attr"]; -"280 _frozen_param46" [id=280, type="get_attr"]; +"280 quantize_per_channel_default_46" [id=280, type="get_attr"]; "281 dequantize_per_channel_default_46" [id=281, type="dequantize_per_channel"]; "282 encoder_layers_encoder_layer_11_self_attention_out_proj_bias" [id=282, type="get_attr"]; "283 encoder_layers_encoder_layer_11_ln_2_weight" [id=283, type="get_attr"]; "284 encoder_layers_encoder_layer_11_ln_2_bias" [id=284, type="get_attr"]; "285 _scale_47" [id=285, type="get_attr"]; "286 _zero_point_47" [id=286, type="get_attr"]; -"287 _frozen_param47" [id=287, type="get_attr"]; +"287 quantize_per_channel_default_47" [id=287, type="get_attr"]; "288 dequantize_per_channel_default_47" [id=288, type="dequantize_per_channel"]; "289 
encoder_layers_encoder_layer_11_mlp_0_bias" [id=289, type="get_attr"]; "290 _scale_48" [id=290, type="get_attr"]; "291 _zero_point_48" [id=291, type="get_attr"]; -"292 _frozen_param48" [id=292, type="get_attr"]; +"292 quantize_per_channel_default_48" [id=292, type="get_attr"]; "293 dequantize_per_channel_default_48" [id=293, type="dequantize_per_channel"]; "294 encoder_layers_encoder_layer_11_mlp_3_bias" [id=294, type="get_attr"]; "295 encoder_ln_weight" [id=295, type="get_attr"]; "296 encoder_ln_bias" [id=296, type="get_attr"]; "297 _scale_49" [id=297, type="get_attr"]; "298 _zero_point_49" [id=298, type="get_attr"]; -"299 _frozen_param49" [id=299, type="get_attr"]; +"299 quantize_per_channel_default_49" [id=299, type="get_attr"]; "300 dequantize_per_channel_default_49" [id=300, type="dequantize_per_channel"]; "301 heads_head_bias" [id=301, type="get_attr"]; "302 x" [id=302, type=input]; @@ -874,302 +874,302 @@ strict digraph { "1 encoder_pos_embedding" -> "310 add" [style=solid, label="(1, 197, 768)"]; "2 _scale_0" -> "5 dequantize_per_channel_default" [style=solid, label="(768,)"]; "3 _zero_point_0" -> "5 dequantize_per_channel_default" [style=solid, label="(768,)"]; -"4 _frozen_param0" -> "5 dequantize_per_channel_default" [style=solid, label="(768, 3, 16, 16)"]; +"4 quantize_per_channel_default" -> "5 dequantize_per_channel_default" [style=solid, label="(768, 3, 16, 16)"]; "5 dequantize_per_channel_default" -> "305 conv2d" [style=solid, label=None]; "6 conv_proj_bias" -> "305 conv2d" [style=solid, label="(768,)"]; "7 encoder_layers_encoder_layer_0_ln_1_weight" -> "312 layer_norm" [style=solid, label="(768,)"]; "8 encoder_layers_encoder_layer_0_ln_1_bias" -> "312 layer_norm" [style=solid, label="(768,)"]; "9 _scale_1" -> "12 dequantize_per_channel_default_1" [style=solid, label="(2304,)"]; "10 _zero_point_1" -> "12 dequantize_per_channel_default_1" [style=solid, label="(2304,)"]; -"11 _frozen_param1" -> "12 dequantize_per_channel_default_1" [style=solid, 
label="(2304, 768)"]; +"11 quantize_per_channel_default_1" -> "12 dequantize_per_channel_default_1" [style=solid, label="(2304, 768)"]; "12 dequantize_per_channel_default_1" -> "316 linear" [style=solid, label=None]; "13 encoder_layers_encoder_layer_0_self_attention_in_proj_bias" -> "316 linear" [style=solid, label="(2304,)"]; "14 _scale_2" -> "17 dequantize_per_channel_default_2" [style=solid, label="(768,)"]; "15 _zero_point_2" -> "17 dequantize_per_channel_default_2" [style=solid, label="(768,)"]; -"16 _frozen_param2" -> "17 dequantize_per_channel_default_2" [style=solid, label="(768, 768)"]; +"16 quantize_per_channel_default_2" -> "17 dequantize_per_channel_default_2" [style=solid, label="(768, 768)"]; "17 dequantize_per_channel_default_2" -> "342 linear_1" [style=solid, label=None]; "18 encoder_layers_encoder_layer_0_self_attention_out_proj_bias" -> "342 linear_1" [style=solid, label="(768,)"]; "19 encoder_layers_encoder_layer_0_ln_2_weight" -> "347 layer_norm_1" [style=solid, label="(768,)"]; "20 encoder_layers_encoder_layer_0_ln_2_bias" -> "347 layer_norm_1" [style=solid, label="(768,)"]; "21 _scale_3" -> "24 dequantize_per_channel_default_3" [style=solid, label="(3072,)"]; "22 _zero_point_3" -> "24 dequantize_per_channel_default_3" [style=solid, label="(3072,)"]; -"23 _frozen_param3" -> "24 dequantize_per_channel_default_3" [style=solid, label="(3072, 768)"]; +"23 quantize_per_channel_default_3" -> "24 dequantize_per_channel_default_3" [style=solid, label="(3072, 768)"]; "24 dequantize_per_channel_default_3" -> "350 linear_2" [style=solid, label=None]; "25 encoder_layers_encoder_layer_0_mlp_0_bias" -> "350 linear_2" [style=solid, label="(3072,)"]; "26 _scale_4" -> "29 dequantize_per_channel_default_4" [style=solid, label="(768,)"]; "27 _zero_point_4" -> "29 dequantize_per_channel_default_4" [style=solid, label="(768,)"]; -"28 _frozen_param4" -> "29 dequantize_per_channel_default_4" [style=solid, label="(768, 3072)"]; +"28 quantize_per_channel_default_4" -> 
"29 dequantize_per_channel_default_4" [style=solid, label="(768, 3072)"]; "29 dequantize_per_channel_default_4" -> "355 linear_3" [style=solid, label=None]; "30 encoder_layers_encoder_layer_0_mlp_3_bias" -> "355 linear_3" [style=solid, label="(768,)"]; "31 encoder_layers_encoder_layer_1_ln_1_weight" -> "358 layer_norm_2" [style=solid, label="(768,)"]; "32 encoder_layers_encoder_layer_1_ln_1_bias" -> "358 layer_norm_2" [style=solid, label="(768,)"]; "33 _scale_5" -> "36 dequantize_per_channel_default_5" [style=solid, label="(2304,)"]; "34 _zero_point_5" -> "36 dequantize_per_channel_default_5" [style=solid, label="(2304,)"]; -"35 _frozen_param5" -> "36 dequantize_per_channel_default_5" [style=solid, label="(2304, 768)"]; +"35 quantize_per_channel_default_5" -> "36 dequantize_per_channel_default_5" [style=solid, label="(2304, 768)"]; "36 dequantize_per_channel_default_5" -> "362 linear_4" [style=solid, label=None]; "37 encoder_layers_encoder_layer_1_self_attention_in_proj_bias" -> "362 linear_4" [style=solid, label="(2304,)"]; "38 _scale_6" -> "41 dequantize_per_channel_default_6" [style=solid, label="(768,)"]; "39 _zero_point_6" -> "41 dequantize_per_channel_default_6" [style=solid, label="(768,)"]; -"40 _frozen_param6" -> "41 dequantize_per_channel_default_6" [style=solid, label="(768, 768)"]; +"40 quantize_per_channel_default_6" -> "41 dequantize_per_channel_default_6" [style=solid, label="(768, 768)"]; "41 dequantize_per_channel_default_6" -> "388 linear_5" [style=solid, label=None]; "42 encoder_layers_encoder_layer_1_self_attention_out_proj_bias" -> "388 linear_5" [style=solid, label="(768,)"]; "43 encoder_layers_encoder_layer_1_ln_2_weight" -> "393 layer_norm_3" [style=solid, label="(768,)"]; "44 encoder_layers_encoder_layer_1_ln_2_bias" -> "393 layer_norm_3" [style=solid, label="(768,)"]; "45 _scale_7" -> "48 dequantize_per_channel_default_7" [style=solid, label="(3072,)"]; "46 _zero_point_7" -> "48 dequantize_per_channel_default_7" [style=solid, 
label="(3072,)"]; -"47 _frozen_param7" -> "48 dequantize_per_channel_default_7" [style=solid, label="(3072, 768)"]; +"47 quantize_per_channel_default_7" -> "48 dequantize_per_channel_default_7" [style=solid, label="(3072, 768)"]; "48 dequantize_per_channel_default_7" -> "396 linear_6" [style=solid, label=None]; "49 encoder_layers_encoder_layer_1_mlp_0_bias" -> "396 linear_6" [style=solid, label="(3072,)"]; "50 _scale_8" -> "53 dequantize_per_channel_default_8" [style=solid, label="(768,)"]; "51 _zero_point_8" -> "53 dequantize_per_channel_default_8" [style=solid, label="(768,)"]; -"52 _frozen_param8" -> "53 dequantize_per_channel_default_8" [style=solid, label="(768, 3072)"]; +"52 quantize_per_channel_default_8" -> "53 dequantize_per_channel_default_8" [style=solid, label="(768, 3072)"]; "53 dequantize_per_channel_default_8" -> "401 linear_7" [style=solid, label=None]; "54 encoder_layers_encoder_layer_1_mlp_3_bias" -> "401 linear_7" [style=solid, label="(768,)"]; "55 encoder_layers_encoder_layer_2_ln_1_weight" -> "404 layer_norm_4" [style=solid, label="(768,)"]; "56 encoder_layers_encoder_layer_2_ln_1_bias" -> "404 layer_norm_4" [style=solid, label="(768,)"]; "57 _scale_9" -> "60 dequantize_per_channel_default_9" [style=solid, label="(2304,)"]; "58 _zero_point_9" -> "60 dequantize_per_channel_default_9" [style=solid, label="(2304,)"]; -"59 _frozen_param9" -> "60 dequantize_per_channel_default_9" [style=solid, label="(2304, 768)"]; +"59 quantize_per_channel_default_9" -> "60 dequantize_per_channel_default_9" [style=solid, label="(2304, 768)"]; "60 dequantize_per_channel_default_9" -> "408 linear_8" [style=solid, label=None]; "61 encoder_layers_encoder_layer_2_self_attention_in_proj_bias" -> "408 linear_8" [style=solid, label="(2304,)"]; "62 _scale_10" -> "65 dequantize_per_channel_default_10" [style=solid, label="(768,)"]; "63 _zero_point_10" -> "65 dequantize_per_channel_default_10" [style=solid, label="(768,)"]; -"64 _frozen_param10" -> "65 
dequantize_per_channel_default_10" [style=solid, label="(768, 768)"]; +"64 quantize_per_channel_default_10" -> "65 dequantize_per_channel_default_10" [style=solid, label="(768, 768)"]; "65 dequantize_per_channel_default_10" -> "434 linear_9" [style=solid, label=None]; "66 encoder_layers_encoder_layer_2_self_attention_out_proj_bias" -> "434 linear_9" [style=solid, label="(768,)"]; "67 encoder_layers_encoder_layer_2_ln_2_weight" -> "439 layer_norm_5" [style=solid, label="(768,)"]; "68 encoder_layers_encoder_layer_2_ln_2_bias" -> "439 layer_norm_5" [style=solid, label="(768,)"]; "69 _scale_11" -> "72 dequantize_per_channel_default_11" [style=solid, label="(3072,)"]; "70 _zero_point_11" -> "72 dequantize_per_channel_default_11" [style=solid, label="(3072,)"]; -"71 _frozen_param11" -> "72 dequantize_per_channel_default_11" [style=solid, label="(3072, 768)"]; +"71 quantize_per_channel_default_11" -> "72 dequantize_per_channel_default_11" [style=solid, label="(3072, 768)"]; "72 dequantize_per_channel_default_11" -> "442 linear_10" [style=solid, label=None]; "73 encoder_layers_encoder_layer_2_mlp_0_bias" -> "442 linear_10" [style=solid, label="(3072,)"]; "74 _scale_12" -> "77 dequantize_per_channel_default_12" [style=solid, label="(768,)"]; "75 _zero_point_12" -> "77 dequantize_per_channel_default_12" [style=solid, label="(768,)"]; -"76 _frozen_param12" -> "77 dequantize_per_channel_default_12" [style=solid, label="(768, 3072)"]; +"76 quantize_per_channel_default_12" -> "77 dequantize_per_channel_default_12" [style=solid, label="(768, 3072)"]; "77 dequantize_per_channel_default_12" -> "447 linear_11" [style=solid, label=None]; "78 encoder_layers_encoder_layer_2_mlp_3_bias" -> "447 linear_11" [style=solid, label="(768,)"]; "79 encoder_layers_encoder_layer_3_ln_1_weight" -> "450 layer_norm_6" [style=solid, label="(768,)"]; "80 encoder_layers_encoder_layer_3_ln_1_bias" -> "450 layer_norm_6" [style=solid, label="(768,)"]; "81 _scale_13" -> "84 
dequantize_per_channel_default_13" [style=solid, label="(2304,)"]; "82 _zero_point_13" -> "84 dequantize_per_channel_default_13" [style=solid, label="(2304,)"]; -"83 _frozen_param13" -> "84 dequantize_per_channel_default_13" [style=solid, label="(2304, 768)"]; +"83 quantize_per_channel_default_13" -> "84 dequantize_per_channel_default_13" [style=solid, label="(2304, 768)"]; "84 dequantize_per_channel_default_13" -> "454 linear_12" [style=solid, label=None]; "85 encoder_layers_encoder_layer_3_self_attention_in_proj_bias" -> "454 linear_12" [style=solid, label="(2304,)"]; "86 _scale_14" -> "89 dequantize_per_channel_default_14" [style=solid, label="(768,)"]; "87 _zero_point_14" -> "89 dequantize_per_channel_default_14" [style=solid, label="(768,)"]; -"88 _frozen_param14" -> "89 dequantize_per_channel_default_14" [style=solid, label="(768, 768)"]; +"88 quantize_per_channel_default_14" -> "89 dequantize_per_channel_default_14" [style=solid, label="(768, 768)"]; "89 dequantize_per_channel_default_14" -> "480 linear_13" [style=solid, label=None]; "90 encoder_layers_encoder_layer_3_self_attention_out_proj_bias" -> "480 linear_13" [style=solid, label="(768,)"]; "91 encoder_layers_encoder_layer_3_ln_2_weight" -> "485 layer_norm_7" [style=solid, label="(768,)"]; "92 encoder_layers_encoder_layer_3_ln_2_bias" -> "485 layer_norm_7" [style=solid, label="(768,)"]; "93 _scale_15" -> "96 dequantize_per_channel_default_15" [style=solid, label="(3072,)"]; "94 _zero_point_15" -> "96 dequantize_per_channel_default_15" [style=solid, label="(3072,)"]; -"95 _frozen_param15" -> "96 dequantize_per_channel_default_15" [style=solid, label="(3072, 768)"]; +"95 quantize_per_channel_default_15" -> "96 dequantize_per_channel_default_15" [style=solid, label="(3072, 768)"]; "96 dequantize_per_channel_default_15" -> "488 linear_14" [style=solid, label=None]; "97 encoder_layers_encoder_layer_3_mlp_0_bias" -> "488 linear_14" [style=solid, label="(3072,)"]; "98 _scale_16" -> "101 
dequantize_per_channel_default_16" [style=solid, label="(768,)"]; "99 _zero_point_16" -> "101 dequantize_per_channel_default_16" [style=solid, label="(768,)"]; -"100 _frozen_param16" -> "101 dequantize_per_channel_default_16" [style=solid, label="(768, 3072)"]; +"100 quantize_per_channel_default_16" -> "101 dequantize_per_channel_default_16" [style=solid, label="(768, 3072)"]; "101 dequantize_per_channel_default_16" -> "493 linear_15" [style=solid, label=None]; "102 encoder_layers_encoder_layer_3_mlp_3_bias" -> "493 linear_15" [style=solid, label="(768,)"]; "103 encoder_layers_encoder_layer_4_ln_1_weight" -> "496 layer_norm_8" [style=solid, label="(768,)"]; "104 encoder_layers_encoder_layer_4_ln_1_bias" -> "496 layer_norm_8" [style=solid, label="(768,)"]; "105 _scale_17" -> "108 dequantize_per_channel_default_17" [style=solid, label="(2304,)"]; "106 _zero_point_17" -> "108 dequantize_per_channel_default_17" [style=solid, label="(2304,)"]; -"107 _frozen_param17" -> "108 dequantize_per_channel_default_17" [style=solid, label="(2304, 768)"]; +"107 quantize_per_channel_default_17" -> "108 dequantize_per_channel_default_17" [style=solid, label="(2304, 768)"]; "108 dequantize_per_channel_default_17" -> "500 linear_16" [style=solid, label=None]; "109 encoder_layers_encoder_layer_4_self_attention_in_proj_bias" -> "500 linear_16" [style=solid, label="(2304,)"]; "110 _scale_18" -> "113 dequantize_per_channel_default_18" [style=solid, label="(768,)"]; "111 _zero_point_18" -> "113 dequantize_per_channel_default_18" [style=solid, label="(768,)"]; -"112 _frozen_param18" -> "113 dequantize_per_channel_default_18" [style=solid, label="(768, 768)"]; +"112 quantize_per_channel_default_18" -> "113 dequantize_per_channel_default_18" [style=solid, label="(768, 768)"]; "113 dequantize_per_channel_default_18" -> "526 linear_17" [style=solid, label=None]; "114 encoder_layers_encoder_layer_4_self_attention_out_proj_bias" -> "526 linear_17" [style=solid, label="(768,)"]; "115 
encoder_layers_encoder_layer_4_ln_2_weight" -> "531 layer_norm_9" [style=solid, label="(768,)"]; "116 encoder_layers_encoder_layer_4_ln_2_bias" -> "531 layer_norm_9" [style=solid, label="(768,)"]; "117 _scale_19" -> "120 dequantize_per_channel_default_19" [style=solid, label="(3072,)"]; "118 _zero_point_19" -> "120 dequantize_per_channel_default_19" [style=solid, label="(3072,)"]; -"119 _frozen_param19" -> "120 dequantize_per_channel_default_19" [style=solid, label="(3072, 768)"]; +"119 quantize_per_channel_default_19" -> "120 dequantize_per_channel_default_19" [style=solid, label="(3072, 768)"]; "120 dequantize_per_channel_default_19" -> "534 linear_18" [style=solid, label=None]; "121 encoder_layers_encoder_layer_4_mlp_0_bias" -> "534 linear_18" [style=solid, label="(3072,)"]; "122 _scale_20" -> "125 dequantize_per_channel_default_20" [style=solid, label="(768,)"]; "123 _zero_point_20" -> "125 dequantize_per_channel_default_20" [style=solid, label="(768,)"]; -"124 _frozen_param20" -> "125 dequantize_per_channel_default_20" [style=solid, label="(768, 3072)"]; +"124 quantize_per_channel_default_20" -> "125 dequantize_per_channel_default_20" [style=solid, label="(768, 3072)"]; "125 dequantize_per_channel_default_20" -> "539 linear_19" [style=solid, label=None]; "126 encoder_layers_encoder_layer_4_mlp_3_bias" -> "539 linear_19" [style=solid, label="(768,)"]; "127 encoder_layers_encoder_layer_5_ln_1_weight" -> "542 layer_norm_10" [style=solid, label="(768,)"]; "128 encoder_layers_encoder_layer_5_ln_1_bias" -> "542 layer_norm_10" [style=solid, label="(768,)"]; "129 _scale_21" -> "132 dequantize_per_channel_default_21" [style=solid, label="(2304,)"]; "130 _zero_point_21" -> "132 dequantize_per_channel_default_21" [style=solid, label="(2304,)"]; -"131 _frozen_param21" -> "132 dequantize_per_channel_default_21" [style=solid, label="(2304, 768)"]; +"131 quantize_per_channel_default_21" -> "132 dequantize_per_channel_default_21" [style=solid, label="(2304, 768)"]; "132 
dequantize_per_channel_default_21" -> "546 linear_20" [style=solid, label=None]; "133 encoder_layers_encoder_layer_5_self_attention_in_proj_bias" -> "546 linear_20" [style=solid, label="(2304,)"]; "134 _scale_22" -> "137 dequantize_per_channel_default_22" [style=solid, label="(768,)"]; "135 _zero_point_22" -> "137 dequantize_per_channel_default_22" [style=solid, label="(768,)"]; -"136 _frozen_param22" -> "137 dequantize_per_channel_default_22" [style=solid, label="(768, 768)"]; +"136 quantize_per_channel_default_22" -> "137 dequantize_per_channel_default_22" [style=solid, label="(768, 768)"]; "137 dequantize_per_channel_default_22" -> "572 linear_21" [style=solid, label=None]; "138 encoder_layers_encoder_layer_5_self_attention_out_proj_bias" -> "572 linear_21" [style=solid, label="(768,)"]; "139 encoder_layers_encoder_layer_5_ln_2_weight" -> "577 layer_norm_11" [style=solid, label="(768,)"]; "140 encoder_layers_encoder_layer_5_ln_2_bias" -> "577 layer_norm_11" [style=solid, label="(768,)"]; "141 _scale_23" -> "144 dequantize_per_channel_default_23" [style=solid, label="(3072,)"]; "142 _zero_point_23" -> "144 dequantize_per_channel_default_23" [style=solid, label="(3072,)"]; -"143 _frozen_param23" -> "144 dequantize_per_channel_default_23" [style=solid, label="(3072, 768)"]; +"143 quantize_per_channel_default_23" -> "144 dequantize_per_channel_default_23" [style=solid, label="(3072, 768)"]; "144 dequantize_per_channel_default_23" -> "580 linear_22" [style=solid, label=None]; "145 encoder_layers_encoder_layer_5_mlp_0_bias" -> "580 linear_22" [style=solid, label="(3072,)"]; "146 _scale_24" -> "149 dequantize_per_channel_default_24" [style=solid, label="(768,)"]; "147 _zero_point_24" -> "149 dequantize_per_channel_default_24" [style=solid, label="(768,)"]; -"148 _frozen_param24" -> "149 dequantize_per_channel_default_24" [style=solid, label="(768, 3072)"]; +"148 quantize_per_channel_default_24" -> "149 dequantize_per_channel_default_24" [style=solid, label="(768, 
3072)"]; "149 dequantize_per_channel_default_24" -> "585 linear_23" [style=solid, label=None]; "150 encoder_layers_encoder_layer_5_mlp_3_bias" -> "585 linear_23" [style=solid, label="(768,)"]; "151 encoder_layers_encoder_layer_6_ln_1_weight" -> "588 layer_norm_12" [style=solid, label="(768,)"]; "152 encoder_layers_encoder_layer_6_ln_1_bias" -> "588 layer_norm_12" [style=solid, label="(768,)"]; "153 _scale_25" -> "156 dequantize_per_channel_default_25" [style=solid, label="(2304,)"]; "154 _zero_point_25" -> "156 dequantize_per_channel_default_25" [style=solid, label="(2304,)"]; -"155 _frozen_param25" -> "156 dequantize_per_channel_default_25" [style=solid, label="(2304, 768)"]; +"155 quantize_per_channel_default_25" -> "156 dequantize_per_channel_default_25" [style=solid, label="(2304, 768)"]; "156 dequantize_per_channel_default_25" -> "592 linear_24" [style=solid, label=None]; "157 encoder_layers_encoder_layer_6_self_attention_in_proj_bias" -> "592 linear_24" [style=solid, label="(2304,)"]; "158 _scale_26" -> "161 dequantize_per_channel_default_26" [style=solid, label="(768,)"]; "159 _zero_point_26" -> "161 dequantize_per_channel_default_26" [style=solid, label="(768,)"]; -"160 _frozen_param26" -> "161 dequantize_per_channel_default_26" [style=solid, label="(768, 768)"]; +"160 quantize_per_channel_default_26" -> "161 dequantize_per_channel_default_26" [style=solid, label="(768, 768)"]; "161 dequantize_per_channel_default_26" -> "618 linear_25" [style=solid, label=None]; "162 encoder_layers_encoder_layer_6_self_attention_out_proj_bias" -> "618 linear_25" [style=solid, label="(768,)"]; "163 encoder_layers_encoder_layer_6_ln_2_weight" -> "623 layer_norm_13" [style=solid, label="(768,)"]; "164 encoder_layers_encoder_layer_6_ln_2_bias" -> "623 layer_norm_13" [style=solid, label="(768,)"]; "165 _scale_27" -> "168 dequantize_per_channel_default_27" [style=solid, label="(3072,)"]; "166 _zero_point_27" -> "168 dequantize_per_channel_default_27" [style=solid, 
label="(3072,)"]; -"167 _frozen_param27" -> "168 dequantize_per_channel_default_27" [style=solid, label="(3072, 768)"]; +"167 quantize_per_channel_default_27" -> "168 dequantize_per_channel_default_27" [style=solid, label="(3072, 768)"]; "168 dequantize_per_channel_default_27" -> "626 linear_26" [style=solid, label=None]; "169 encoder_layers_encoder_layer_6_mlp_0_bias" -> "626 linear_26" [style=solid, label="(3072,)"]; "170 _scale_28" -> "173 dequantize_per_channel_default_28" [style=solid, label="(768,)"]; "171 _zero_point_28" -> "173 dequantize_per_channel_default_28" [style=solid, label="(768,)"]; -"172 _frozen_param28" -> "173 dequantize_per_channel_default_28" [style=solid, label="(768, 3072)"]; +"172 quantize_per_channel_default_28" -> "173 dequantize_per_channel_default_28" [style=solid, label="(768, 3072)"]; "173 dequantize_per_channel_default_28" -> "631 linear_27" [style=solid, label=None]; "174 encoder_layers_encoder_layer_6_mlp_3_bias" -> "631 linear_27" [style=solid, label="(768,)"]; "175 encoder_layers_encoder_layer_7_ln_1_weight" -> "634 layer_norm_14" [style=solid, label="(768,)"]; "176 encoder_layers_encoder_layer_7_ln_1_bias" -> "634 layer_norm_14" [style=solid, label="(768,)"]; "177 _scale_29" -> "180 dequantize_per_channel_default_29" [style=solid, label="(2304,)"]; "178 _zero_point_29" -> "180 dequantize_per_channel_default_29" [style=solid, label="(2304,)"]; -"179 _frozen_param29" -> "180 dequantize_per_channel_default_29" [style=solid, label="(2304, 768)"]; +"179 quantize_per_channel_default_29" -> "180 dequantize_per_channel_default_29" [style=solid, label="(2304, 768)"]; "180 dequantize_per_channel_default_29" -> "638 linear_28" [style=solid, label=None]; "181 encoder_layers_encoder_layer_7_self_attention_in_proj_bias" -> "638 linear_28" [style=solid, label="(2304,)"]; "182 _scale_30" -> "185 dequantize_per_channel_default_30" [style=solid, label="(768,)"]; "183 _zero_point_30" -> "185 dequantize_per_channel_default_30" [style=solid, 
label="(768,)"]; -"184 _frozen_param30" -> "185 dequantize_per_channel_default_30" [style=solid, label="(768, 768)"]; +"184 quantize_per_channel_default_30" -> "185 dequantize_per_channel_default_30" [style=solid, label="(768, 768)"]; "185 dequantize_per_channel_default_30" -> "664 linear_29" [style=solid, label=None]; "186 encoder_layers_encoder_layer_7_self_attention_out_proj_bias" -> "664 linear_29" [style=solid, label="(768,)"]; "187 encoder_layers_encoder_layer_7_ln_2_weight" -> "669 layer_norm_15" [style=solid, label="(768,)"]; "188 encoder_layers_encoder_layer_7_ln_2_bias" -> "669 layer_norm_15" [style=solid, label="(768,)"]; "189 _scale_31" -> "192 dequantize_per_channel_default_31" [style=solid, label="(3072,)"]; "190 _zero_point_31" -> "192 dequantize_per_channel_default_31" [style=solid, label="(3072,)"]; -"191 _frozen_param31" -> "192 dequantize_per_channel_default_31" [style=solid, label="(3072, 768)"]; +"191 quantize_per_channel_default_31" -> "192 dequantize_per_channel_default_31" [style=solid, label="(3072, 768)"]; "192 dequantize_per_channel_default_31" -> "672 linear_30" [style=solid, label=None]; "193 encoder_layers_encoder_layer_7_mlp_0_bias" -> "672 linear_30" [style=solid, label="(3072,)"]; "194 _scale_32" -> "197 dequantize_per_channel_default_32" [style=solid, label="(768,)"]; "195 _zero_point_32" -> "197 dequantize_per_channel_default_32" [style=solid, label="(768,)"]; -"196 _frozen_param32" -> "197 dequantize_per_channel_default_32" [style=solid, label="(768, 3072)"]; +"196 quantize_per_channel_default_32" -> "197 dequantize_per_channel_default_32" [style=solid, label="(768, 3072)"]; "197 dequantize_per_channel_default_32" -> "677 linear_31" [style=solid, label=None]; "198 encoder_layers_encoder_layer_7_mlp_3_bias" -> "677 linear_31" [style=solid, label="(768,)"]; "199 encoder_layers_encoder_layer_8_ln_1_weight" -> "680 layer_norm_16" [style=solid, label="(768,)"]; "200 encoder_layers_encoder_layer_8_ln_1_bias" -> "680 layer_norm_16" 
[style=solid, label="(768,)"]; "201 _scale_33" -> "204 dequantize_per_channel_default_33" [style=solid, label="(2304,)"]; "202 _zero_point_33" -> "204 dequantize_per_channel_default_33" [style=solid, label="(2304,)"]; -"203 _frozen_param33" -> "204 dequantize_per_channel_default_33" [style=solid, label="(2304, 768)"]; +"203 quantize_per_channel_default_33" -> "204 dequantize_per_channel_default_33" [style=solid, label="(2304, 768)"]; "204 dequantize_per_channel_default_33" -> "684 linear_32" [style=solid, label=None]; "205 encoder_layers_encoder_layer_8_self_attention_in_proj_bias" -> "684 linear_32" [style=solid, label="(2304,)"]; "206 _scale_34" -> "209 dequantize_per_channel_default_34" [style=solid, label="(768,)"]; "207 _zero_point_34" -> "209 dequantize_per_channel_default_34" [style=solid, label="(768,)"]; -"208 _frozen_param34" -> "209 dequantize_per_channel_default_34" [style=solid, label="(768, 768)"]; +"208 quantize_per_channel_default_34" -> "209 dequantize_per_channel_default_34" [style=solid, label="(768, 768)"]; "209 dequantize_per_channel_default_34" -> "710 linear_33" [style=solid, label=None]; "210 encoder_layers_encoder_layer_8_self_attention_out_proj_bias" -> "710 linear_33" [style=solid, label="(768,)"]; "211 encoder_layers_encoder_layer_8_ln_2_weight" -> "715 layer_norm_17" [style=solid, label="(768,)"]; "212 encoder_layers_encoder_layer_8_ln_2_bias" -> "715 layer_norm_17" [style=solid, label="(768,)"]; "213 _scale_35" -> "216 dequantize_per_channel_default_35" [style=solid, label="(3072,)"]; "214 _zero_point_35" -> "216 dequantize_per_channel_default_35" [style=solid, label="(3072,)"]; -"215 _frozen_param35" -> "216 dequantize_per_channel_default_35" [style=solid, label="(3072, 768)"]; +"215 quantize_per_channel_default_35" -> "216 dequantize_per_channel_default_35" [style=solid, label="(3072, 768)"]; "216 dequantize_per_channel_default_35" -> "718 linear_34" [style=solid, label=None]; "217 encoder_layers_encoder_layer_8_mlp_0_bias" -> "718 
linear_34" [style=solid, label="(3072,)"]; "218 _scale_36" -> "221 dequantize_per_channel_default_36" [style=solid, label="(768,)"]; "219 _zero_point_36" -> "221 dequantize_per_channel_default_36" [style=solid, label="(768,)"]; -"220 _frozen_param36" -> "221 dequantize_per_channel_default_36" [style=solid, label="(768, 3072)"]; +"220 quantize_per_channel_default_36" -> "221 dequantize_per_channel_default_36" [style=solid, label="(768, 3072)"]; "221 dequantize_per_channel_default_36" -> "723 linear_35" [style=solid, label=None]; "222 encoder_layers_encoder_layer_8_mlp_3_bias" -> "723 linear_35" [style=solid, label="(768,)"]; "223 encoder_layers_encoder_layer_9_ln_1_weight" -> "726 layer_norm_18" [style=solid, label="(768,)"]; "224 encoder_layers_encoder_layer_9_ln_1_bias" -> "726 layer_norm_18" [style=solid, label="(768,)"]; "225 _scale_37" -> "228 dequantize_per_channel_default_37" [style=solid, label="(2304,)"]; "226 _zero_point_37" -> "228 dequantize_per_channel_default_37" [style=solid, label="(2304,)"]; -"227 _frozen_param37" -> "228 dequantize_per_channel_default_37" [style=solid, label="(2304, 768)"]; +"227 quantize_per_channel_default_37" -> "228 dequantize_per_channel_default_37" [style=solid, label="(2304, 768)"]; "228 dequantize_per_channel_default_37" -> "730 linear_36" [style=solid, label=None]; "229 encoder_layers_encoder_layer_9_self_attention_in_proj_bias" -> "730 linear_36" [style=solid, label="(2304,)"]; "230 _scale_38" -> "233 dequantize_per_channel_default_38" [style=solid, label="(768,)"]; "231 _zero_point_38" -> "233 dequantize_per_channel_default_38" [style=solid, label="(768,)"]; -"232 _frozen_param38" -> "233 dequantize_per_channel_default_38" [style=solid, label="(768, 768)"]; +"232 quantize_per_channel_default_38" -> "233 dequantize_per_channel_default_38" [style=solid, label="(768, 768)"]; "233 dequantize_per_channel_default_38" -> "756 linear_37" [style=solid, label=None]; "234 encoder_layers_encoder_layer_9_self_attention_out_proj_bias" 
-> "756 linear_37" [style=solid, label="(768,)"]; "235 encoder_layers_encoder_layer_9_ln_2_weight" -> "761 layer_norm_19" [style=solid, label="(768,)"]; "236 encoder_layers_encoder_layer_9_ln_2_bias" -> "761 layer_norm_19" [style=solid, label="(768,)"]; "237 _scale_39" -> "240 dequantize_per_channel_default_39" [style=solid, label="(3072,)"]; "238 _zero_point_39" -> "240 dequantize_per_channel_default_39" [style=solid, label="(3072,)"]; -"239 _frozen_param39" -> "240 dequantize_per_channel_default_39" [style=solid, label="(3072, 768)"]; +"239 quantize_per_channel_default_39" -> "240 dequantize_per_channel_default_39" [style=solid, label="(3072, 768)"]; "240 dequantize_per_channel_default_39" -> "764 linear_38" [style=solid, label=None]; "241 encoder_layers_encoder_layer_9_mlp_0_bias" -> "764 linear_38" [style=solid, label="(3072,)"]; "242 _scale_40" -> "245 dequantize_per_channel_default_40" [style=solid, label="(768,)"]; "243 _zero_point_40" -> "245 dequantize_per_channel_default_40" [style=solid, label="(768,)"]; -"244 _frozen_param40" -> "245 dequantize_per_channel_default_40" [style=solid, label="(768, 3072)"]; +"244 quantize_per_channel_default_40" -> "245 dequantize_per_channel_default_40" [style=solid, label="(768, 3072)"]; "245 dequantize_per_channel_default_40" -> "769 linear_39" [style=solid, label=None]; "246 encoder_layers_encoder_layer_9_mlp_3_bias" -> "769 linear_39" [style=solid, label="(768,)"]; "247 encoder_layers_encoder_layer_10_ln_1_weight" -> "772 layer_norm_20" [style=solid, label="(768,)"]; "248 encoder_layers_encoder_layer_10_ln_1_bias" -> "772 layer_norm_20" [style=solid, label="(768,)"]; "249 _scale_41" -> "252 dequantize_per_channel_default_41" [style=solid, label="(2304,)"]; "250 _zero_point_41" -> "252 dequantize_per_channel_default_41" [style=solid, label="(2304,)"]; -"251 _frozen_param41" -> "252 dequantize_per_channel_default_41" [style=solid, label="(2304, 768)"]; +"251 quantize_per_channel_default_41" -> "252 
dequantize_per_channel_default_41" [style=solid, label="(2304, 768)"]; "252 dequantize_per_channel_default_41" -> "776 linear_40" [style=solid, label=None]; "253 encoder_layers_encoder_layer_10_self_attention_in_proj_bias" -> "776 linear_40" [style=solid, label="(2304,)"]; "254 _scale_42" -> "257 dequantize_per_channel_default_42" [style=solid, label="(768,)"]; "255 _zero_point_42" -> "257 dequantize_per_channel_default_42" [style=solid, label="(768,)"]; -"256 _frozen_param42" -> "257 dequantize_per_channel_default_42" [style=solid, label="(768, 768)"]; +"256 quantize_per_channel_default_42" -> "257 dequantize_per_channel_default_42" [style=solid, label="(768, 768)"]; "257 dequantize_per_channel_default_42" -> "802 linear_41" [style=solid, label=None]; "258 encoder_layers_encoder_layer_10_self_attention_out_proj_bias" -> "802 linear_41" [style=solid, label="(768,)"]; "259 encoder_layers_encoder_layer_10_ln_2_weight" -> "807 layer_norm_21" [style=solid, label="(768,)"]; "260 encoder_layers_encoder_layer_10_ln_2_bias" -> "807 layer_norm_21" [style=solid, label="(768,)"]; "261 _scale_43" -> "264 dequantize_per_channel_default_43" [style=solid, label="(3072,)"]; "262 _zero_point_43" -> "264 dequantize_per_channel_default_43" [style=solid, label="(3072,)"]; -"263 _frozen_param43" -> "264 dequantize_per_channel_default_43" [style=solid, label="(3072, 768)"]; +"263 quantize_per_channel_default_43" -> "264 dequantize_per_channel_default_43" [style=solid, label="(3072, 768)"]; "264 dequantize_per_channel_default_43" -> "810 linear_42" [style=solid, label=None]; "265 encoder_layers_encoder_layer_10_mlp_0_bias" -> "810 linear_42" [style=solid, label="(3072,)"]; "266 _scale_44" -> "269 dequantize_per_channel_default_44" [style=solid, label="(768,)"]; "267 _zero_point_44" -> "269 dequantize_per_channel_default_44" [style=solid, label="(768,)"]; -"268 _frozen_param44" -> "269 dequantize_per_channel_default_44" [style=solid, label="(768, 3072)"]; +"268 
quantize_per_channel_default_44" -> "269 dequantize_per_channel_default_44" [style=solid, label="(768, 3072)"]; "269 dequantize_per_channel_default_44" -> "815 linear_43" [style=solid, label=None]; "270 encoder_layers_encoder_layer_10_mlp_3_bias" -> "815 linear_43" [style=solid, label="(768,)"]; "271 encoder_layers_encoder_layer_11_ln_1_weight" -> "818 layer_norm_22" [style=solid, label="(768,)"]; "272 encoder_layers_encoder_layer_11_ln_1_bias" -> "818 layer_norm_22" [style=solid, label="(768,)"]; "273 _scale_45" -> "276 dequantize_per_channel_default_45" [style=solid, label="(2304,)"]; "274 _zero_point_45" -> "276 dequantize_per_channel_default_45" [style=solid, label="(2304,)"]; -"275 _frozen_param45" -> "276 dequantize_per_channel_default_45" [style=solid, label="(2304, 768)"]; +"275 quantize_per_channel_default_45" -> "276 dequantize_per_channel_default_45" [style=solid, label="(2304, 768)"]; "276 dequantize_per_channel_default_45" -> "822 linear_44" [style=solid, label=None]; "277 encoder_layers_encoder_layer_11_self_attention_in_proj_bias" -> "822 linear_44" [style=solid, label="(2304,)"]; "278 _scale_46" -> "281 dequantize_per_channel_default_46" [style=solid, label="(768,)"]; "279 _zero_point_46" -> "281 dequantize_per_channel_default_46" [style=solid, label="(768,)"]; -"280 _frozen_param46" -> "281 dequantize_per_channel_default_46" [style=solid, label="(768, 768)"]; +"280 quantize_per_channel_default_46" -> "281 dequantize_per_channel_default_46" [style=solid, label="(768, 768)"]; "281 dequantize_per_channel_default_46" -> "848 linear_45" [style=solid, label=None]; "282 encoder_layers_encoder_layer_11_self_attention_out_proj_bias" -> "848 linear_45" [style=solid, label="(768,)"]; "283 encoder_layers_encoder_layer_11_ln_2_weight" -> "853 layer_norm_23" [style=solid, label="(768,)"]; "284 encoder_layers_encoder_layer_11_ln_2_bias" -> "853 layer_norm_23" [style=solid, label="(768,)"]; "285 _scale_47" -> "288 dequantize_per_channel_default_47" [style=solid, 
label="(3072,)"]; "286 _zero_point_47" -> "288 dequantize_per_channel_default_47" [style=solid, label="(3072,)"]; -"287 _frozen_param47" -> "288 dequantize_per_channel_default_47" [style=solid, label="(3072, 768)"]; +"287 quantize_per_channel_default_47" -> "288 dequantize_per_channel_default_47" [style=solid, label="(3072, 768)"]; "288 dequantize_per_channel_default_47" -> "856 linear_46" [style=solid, label=None]; "289 encoder_layers_encoder_layer_11_mlp_0_bias" -> "856 linear_46" [style=solid, label="(3072,)"]; "290 _scale_48" -> "293 dequantize_per_channel_default_48" [style=solid, label="(768,)"]; "291 _zero_point_48" -> "293 dequantize_per_channel_default_48" [style=solid, label="(768,)"]; -"292 _frozen_param48" -> "293 dequantize_per_channel_default_48" [style=solid, label="(768, 3072)"]; +"292 quantize_per_channel_default_48" -> "293 dequantize_per_channel_default_48" [style=solid, label="(768, 3072)"]; "293 dequantize_per_channel_default_48" -> "861 linear_47" [style=solid, label=None]; "294 encoder_layers_encoder_layer_11_mlp_3_bias" -> "861 linear_47" [style=solid, label="(768,)"]; "295 encoder_ln_weight" -> "864 layer_norm_24" [style=solid, label="(768,)"]; "296 encoder_ln_bias" -> "864 layer_norm_24" [style=solid, label="(768,)"]; "297 _scale_49" -> "300 dequantize_per_channel_default_49" [style=solid, label="(1000,)"]; "298 _zero_point_49" -> "300 dequantize_per_channel_default_49" [style=solid, label="(1000,)"]; -"299 _frozen_param49" -> "300 dequantize_per_channel_default_49" [style=solid, label="(1000, 768)"]; +"299 quantize_per_channel_default_49" -> "300 dequantize_per_channel_default_49" [style=solid, label="(1000, 768)"]; "300 dequantize_per_channel_default_49" -> "869 linear_48" [style=solid, label=None]; "301 heads_head_bias" -> "869 linear_48" [style=solid, label="(1000,)"]; "302 x" -> "303 quantize_per_tensor_default" [style=solid, label="(1, 3, 224, 224)"]; diff --git 
a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/yolo11n_sdpa_block.dot b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/yolo11n_sdpa_block.dot index 92c69db331d..71a115356ba 100644 --- a/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/yolo11n_sdpa_block.dot +++ b/tests/torch2/data/fx/ao_export_quantization_OpenVINOQuantizer/yolo11n_sdpa_block.dot @@ -1,7 +1,7 @@ strict digraph { "0 _scale_0" [id=0, type="get_attr"]; "1 _zero_point_0" [id=1, type="get_attr"]; -"2 _frozen_param0" [id=2, type="get_attr"]; +"2 quantize_per_channel_default" [id=2, type="get_attr"]; "3 dequantize_per_channel_default" [id=3, type="dequantize_per_channel"]; "4 x" [id=4, type=input]; "5 quantize_per_tensor_default" [id=5, type="quantize_per_tensor"]; @@ -28,7 +28,7 @@ strict digraph { "26 output" [id=26, type=output]; "0 _scale_0" -> "3 dequantize_per_channel_default" [style=solid, label="(12,)"]; "1 _zero_point_0" -> "3 dequantize_per_channel_default" [style=solid, label="(12,)"]; -"2 _frozen_param0" -> "3 dequantize_per_channel_default" [style=solid, label="(12, 4)"]; +"2 quantize_per_channel_default" -> "3 dequantize_per_channel_default" [style=solid, label="(12, 4)"]; "3 dequantize_per_channel_default" -> "7 linear" [style=solid, label=None]; "4 x" -> "5 quantize_per_tensor_default" [style=solid, label="(1, 2, 4)"]; "5 quantize_per_tensor_default" -> "6 dequantize_per_tensor_default" [style=solid, label=None]; diff --git a/tests/torch2/fx/helpers.py b/tests/torch2/fx/helpers.py index 1ece19d59be..bd38930771d 100644 --- a/tests/torch2/fx/helpers.py +++ b/tests/torch2/fx/helpers.py @@ -20,9 +20,9 @@ import torchvision.datasets as datasets import torchvision.transforms as transforms from fastdownload import FastDownload +from torch.ao.quantization.pt2e.utils import _fuse_conv_bn_ from torch.fx.passes.graph_drawer import FxGraphDrawer -from nncf.experimental.torch.fx.transformations import apply_quantization_transformations from 
nncf.torch.graph.graph import PTNNCFGraph from nncf.torch.graph.operator_metatypes import PTConstNoopMetatype from nncf.torch.graph.operator_metatypes import PTModuleConv2dMetatype @@ -160,7 +160,7 @@ def get_torch_fx_model_q_transformed(model: torch.nn.Module, ex_input: torch.Ten :return: Exported GraphModule. """ fx_model = get_torch_fx_model(model, ex_input) - apply_quantization_transformations(fx_model) + _fuse_conv_bn_(fx_model) return fx_model diff --git a/tests/torch2/fx/test_calculation_quantizer_params.py b/tests/torch2/fx/test_calculation_quantizer_params.py index 384c9e0e75e..b499da46968 100644 --- a/tests/torch2/fx/test_calculation_quantizer_params.py +++ b/tests/torch2/fx/test_calculation_quantizer_params.py @@ -96,18 +96,17 @@ def test_quantizer_params_sym(case_to_test: CaseQuantParams, dtype: Optional[Int dest_dtype=dtype, ) - quantizer = _get_quantizer(case_to_test, qconfig) - assert quantizer.qscheme is torch.per_channel_symmetric if case_to_test.per_channel else torch.per_tensor_symmetric + params = _get_qdq_params(case_to_test, qconfig) signed = signedness_to_force or dtype is TensorDataType.int8 if signed: - assert torch.allclose(quantizer.zero_point, torch.tensor(0, dtype=torch.int8)) + assert torch.allclose(params.zero_point, torch.tensor(0, dtype=torch.int8)) else: - assert torch.allclose(quantizer.zero_point, torch.tensor(127 if narrow_range else 128, dtype=torch.uint8)) + assert torch.allclose(params.zero_point, torch.tensor(127 if narrow_range else 128, dtype=torch.uint8)) - scale = quantizer.scale.detach().numpy() + scale = params.scale.detach().numpy() assert np.allclose(scale, case_to_test.ref_scale) - _check_q_min_q_max(quantizer, signed, narrow_range) + _check_q_min_q_max(params, signed, narrow_range) SYM_CASES_SIGNEDNESS_TO_FORSE = ( @@ -314,17 +313,16 @@ def test_quantizer_params_sym_nr(case_to_test: CaseQuantParams, ref_signed: bool signedness_to_force=signedness_to_force, ) - quantizer = _get_quantizer(case_to_test, qconfig) - 
assert quantizer.qscheme is torch.per_channel_symmetric if case_to_test.per_channel else torch.per_tensor_symmetric + params = _get_qdq_params(case_to_test, qconfig) signed = signedness_to_force or ref_signed - assert torch.allclose(quantizer.zero_point, torch.tensor(0, dtype=torch.int8 if signed else torch.uint8)) + assert torch.allclose(params.zero_point, torch.tensor(0, dtype=torch.int8 if signed else torch.uint8)) - scale = quantizer.scale.detach().numpy() + scale = params.scale.detach().numpy() assert np.allclose(scale, case_to_test.ref_scale) - _check_q_min_q_max(quantizer, signed, narrow_range) + _check_q_min_q_max(params, signed, narrow_range) ASYM_CASES = ( @@ -396,8 +394,7 @@ def test_quantizer_params_asym(case_to_test: CaseQuantParams, ref_zp: Union[int, dest_dtype=dtype, ) - quantizer = _get_quantizer(case_to_test, qconfig) - assert quantizer.qscheme is torch.per_channel_affine if case_to_test.per_channel else torch.per_tensor_affine + quantizer = _get_qdq_params(case_to_test, qconfig) signed = dtype is TensorDataType.int8 ref_zp = torch.tensor(ref_zp) @@ -411,22 +408,23 @@ def test_quantizer_params_asym(case_to_test: CaseQuantParams, ref_zp: Union[int, _check_q_min_q_max(quantizer, signed, narrow_range) -def _get_quantizer(case_to_test: CaseQuantParams, qconfig: QuantizerConfig): +def _get_qdq_params(case_to_test: CaseQuantParams, qconfig: QuantizerConfig): fq_params = calculate_quantizer_parameters(case_to_test.stat, qconfig, case_to_test.quant_group, half_range=False) - quantizer = FXMinMaxAlgoBackend._create_quantizer( + qdq_params = FXMinMaxAlgoBackend._get_torch_qdq_params( qconfig, fq_params, is_weight_quantizer=case_to_test.quant_group == QuantizerGroup.WEIGHTS ) ch_axis = -1 if case_to_test.per_channel: ch_axis = 0 if case_to_test.quant_group == QuantizerGroup.WEIGHTS else 1 - assert quantizer.ch_axis == ch_axis + assert qdq_params.ch_axis == ch_axis + assert qdq_params.is_per_channel == qconfig.per_channel - return quantizer + return 
qdq_params -def _check_q_min_q_max(quantizer, signed, narrow_range): +def _check_q_min_q_max(params, signed, narrow_range): if signed: ref_quant_min = -127 if narrow_range else -128 ref_quant_max = 127 @@ -434,8 +432,8 @@ def _check_q_min_q_max(quantizer, signed, narrow_range): ref_quant_min = 0 ref_quant_max = 254 if narrow_range else 255 - assert quantizer.quant_min == ref_quant_min - assert quantizer.quant_max == ref_quant_max + assert params.quant_min == ref_quant_min + assert params.quant_max == ref_quant_max @pytest.mark.parametrize( @@ -459,4 +457,6 @@ def test_extended_q_config_non_supported_dest_dtype(dest_dtype): qconfig = TypedQuantizerConfig(dest_dtype=dest_dtype) params = FakeQuantizeParameters(-1.0, 1.0, -1.0, 1.0, 255) with pytest.raises(nncf.ParameterNotSupportedError): - FXMinMaxAlgoBackend._create_quantizer(quantizer_config=qconfig, parameters=params, is_weight_quantizer=False) + FXMinMaxAlgoBackend._get_torch_qdq_params( + quantizer_config=qconfig, parameters=params, is_weight_quantizer=False + ) diff --git a/tests/torch2/fx/test_model_transformer.py b/tests/torch2/fx/test_model_transformer.py index 669edb34d58..244c7bf8846 100644 --- a/tests/torch2/fx/test_model_transformer.py +++ b/tests/torch2/fx/test_model_transformer.py @@ -15,12 +15,7 @@ import pytest import torch -import torch.ao.quantization import torch.fx -from torch.ao.quantization.fx.utils import create_getattr_from_value -from torch.ao.quantization.observer import MinMaxObserver -from torch.ao.quantization.observer import PerChannelMinMaxObserver -from torch.quantization.fake_quantize import FakeQuantize import nncf import nncf.common @@ -28,16 +23,17 @@ from nncf.common.factory import NNCFGraphFactory from nncf.common.graph.transformations.commands import TargetType from nncf.common.graph.transformations.layout import TransformationLayout -from nncf.common.quantization.structs import QuantizationScheme as QuantizationMode from nncf.experimental.torch.fx.constant_folding import 
constant_fold from nncf.experimental.torch.fx.model_transformer import FXModelTransformer from nncf.experimental.torch.fx.nncf_graph_builder import GraphConverter from nncf.experimental.torch.fx.node_utils import get_graph_node_by_name from nncf.experimental.torch.fx.node_utils import get_tensor_constant_from_node +from nncf.experimental.torch.fx.quantization.qdq_parameters import TorchQDQParameters from nncf.experimental.torch.fx.transformations import _get_node_by_input_port_id from nncf.experimental.torch.fx.transformations import _set_new_node_meta from nncf.experimental.torch.fx.transformations import compress_post_quantize_transformation from nncf.experimental.torch.fx.transformations import constant_update_transformation_builder +from nncf.experimental.torch.fx.transformations import create_getattr_from_value from nncf.experimental.torch.fx.transformations import fold_constant_except_qdq from nncf.experimental.torch.fx.transformations import leaf_module_insertion_transformation_builder from nncf.experimental.torch.fx.transformations import module_insertion_transformation_builder @@ -278,27 +274,15 @@ class TestQDQInsertion: REF_SCALE = torch.tensor([1.0]) REF_ZERO_POINT = torch.tensor([0.0]) - def _get_quantizer( - self, per_channel: bool, symmetric: bool, q_min: torch.Tensor, q_max: torch.Tensor, dtype: torch.dtype - ) -> FakeQuantize: - if symmetric: - qscheme = torch.per_channel_symmetric if per_channel else torch.per_tensor_symmetric - else: - qscheme = torch.per_channel_affine if per_channel else torch.per_tensor_affine - observer = PerChannelMinMaxObserver if per_channel else MinMaxObserver - - quantizer = FakeQuantize( - observer=observer, + def _get_torch_qdq_params(self, per_channel: bool, q_min: torch.Tensor, q_max: torch.Tensor) -> TorchQDQParameters: + return TorchQDQParameters( quant_min=q_min, quant_max=q_max, - dtype=dtype, - qscheme=qscheme, - eps=1e-5, + scale=self.REF_SCALE, + zero_point=self.REF_ZERO_POINT, + is_per_channel=per_channel, + 
ch_axis=-1, ) - quantizer.scale = self.REF_SCALE - quantizer.zero_point = self.REF_ZERO_POINT - - return quantizer def _check_qdq_params( self, captured_model: torch.fx.GraphModule, target_point: PTTargetPoint, dtype: torch.dtype, per_channel: bool @@ -333,15 +317,13 @@ def get_value(node: torch.fx.Node): def test_one_target_point( self, is_per_channel: bool, - quantization_mode: QuantizationMode, q_min: int, q_max: int, dtype: torch.dtype, target_point: PTTargetPoint, ): - symmetric = quantization_mode == QuantizationMode.SYMMETRIC - quantizer = self._get_quantizer(is_per_channel, symmetric, q_min, q_max, dtype) - transformation = qdq_insertion_transformation_builder(quantizer, [target_point]) + torch_qdq_params = self._get_torch_qdq_params(is_per_channel, q_min, q_max) + transformation = qdq_insertion_transformation_builder(torch_qdq_params, [target_point]) model = MultiBranchesConnectedModelWithConcat() captured_model = get_torch_fx_model(model, torch.ones(MultiBranchesConnectedModelWithConcat.INPUT_SIZE)) @@ -381,16 +363,14 @@ def test_one_target_point( def test_shared_target_point( self, is_per_channel: bool, - quantization_mode: QuantizationMode, q_min: int, q_max: int, dtype: torch.dtype, target_points: PTTargetPoint, weights: bool, ): - symmetric = quantization_mode == QuantizationMode.SYMMETRIC - quantizer = self._get_quantizer(is_per_channel, symmetric, q_min, q_max, dtype) - transformation = qdq_insertion_transformation_builder(quantizer, target_points) + torch_qdq_params = self._get_torch_qdq_params(is_per_channel, q_min, q_max) + transformation = qdq_insertion_transformation_builder(torch_qdq_params, target_points) model = MultiBranchesConnectedModelWithConcat() captured_model = get_torch_fx_model(model, torch.ones(MultiBranchesConnectedModelWithConcat.INPUT_SIZE)) diff --git a/tests/torch2/fx/test_quantizer.py b/tests/torch2/fx/test_quantizer.py index bd20343f6e4..4e0ca518188 100644 --- a/tests/torch2/fx/test_quantizer.py +++ 
b/tests/torch2/fx/test_quantizer.py @@ -22,15 +22,6 @@ import torch.utils.data import torch.utils.data.distributed import torchvision.models as models -from torch.ao.quantization.pt2e.utils import _fuse_conv_bn_ -from torch.ao.quantization.quantize_pt2e import convert_pt2e -from torch.ao.quantization.quantize_pt2e import prepare_pt2e -from torch.ao.quantization.quantizer import xnnpack_quantizer -from torch.ao.quantization.quantizer.quantizer import QuantizationSpec as TorchAOQuantizationSpec -from torch.ao.quantization.quantizer.quantizer import Quantizer -from torch.ao.quantization.quantizer.quantizer import SharedQuantizationSpec as TorchAOSharedQuantizationSpec -from torch.ao.quantization.quantizer.x86_inductor_quantizer import X86InductorQuantizer -from torch.ao.quantization.quantizer.x86_inductor_quantizer import get_default_x86_inductor_quantization_config import nncf from nncf.common.graph import NNCFGraph @@ -51,6 +42,29 @@ from tests.torch.test_models.synthetic import YOLO11N_SDPABlock from tests.torch2.fx.helpers import get_torch_fx_model +TORCHAO_IS_AVAILABLE = False +try: + from torchao.quantization.pt2e.quantize_pt2e import convert_pt2e + from torchao.quantization.pt2e.quantize_pt2e import prepare_pt2e + from torchao.quantization.pt2e.quantizer.quantizer import QuantizationSpec as TorchAOQuantizationSpec + from torchao.quantization.pt2e.quantizer.quantizer import Quantizer + from torchao.quantization.pt2e.quantizer.quantizer import SharedQuantizationSpec as TorchAOSharedQuantizationSpec + from torchao.quantization.pt2e.quantizer.x86_inductor_quantizer import X86InductorQuantizer + from torchao.quantization.pt2e.quantizer.x86_inductor_quantizer import get_default_x86_inductor_quantization_config + from torchao.quantization.pt2e.utils import _fuse_conv_bn_ + + TORCHAO_IS_AVAILABLE = True +except ImportError: + from torch.ao.quantization.pt2e.utils import _fuse_conv_bn_ + from torch.ao.quantization.quantize_pt2e import convert_pt2e + from 
torch.ao.quantization.quantize_pt2e import prepare_pt2e + from torch.ao.quantization.quantizer.quantizer import QuantizationSpec as TorchAOQuantizationSpec + from torch.ao.quantization.quantizer.quantizer import Quantizer + from torch.ao.quantization.quantizer.quantizer import SharedQuantizationSpec as TorchAOSharedQuantizationSpec + from torch.ao.quantization.quantizer.x86_inductor_quantizer import X86InductorQuantizer + from torch.ao.quantization.quantizer.x86_inductor_quantizer import get_default_x86_inductor_quantization_config + + FX_QUANTIZED_DIR_NAME = TEST_ROOT / "torch2" / "data" / "fx" @@ -80,12 +94,6 @@ def get_x86_quantizer(*args, **kwarsg) -> X86InductorQuantizer: return quantizer -def get_xnnpack_quantizer(*args, **kwargs) -> xnnpack_quantizer.XNNPACKQuantizer: - quantizer = xnnpack_quantizer.XNNPACKQuantizer() - quantizer.set_global(xnnpack_quantizer.get_symmetric_quantization_config()) - return quantizer - - def get_openvino_quantizer(*args, **kwargs) -> OpenVINOQuantizer: return OpenVINOQuantizer(*args, **kwargs) @@ -140,11 +148,10 @@ def transform_fn(data_item): @pytest.mark.parametrize( "quantizer_builder", [ - get_xnnpack_quantizer, get_x86_quantizer, get_openvino_quantizer, ], - ids=["XNNPACKQuantizer", "X86InductorQuantizer", "OpenVINOQuantizer"], + ids=["X86InductorQuantizer", "OpenVINOQuantizer"], ) def test_quantized_model( quantizer_builder: Callable[[tuple[Any, ...]], Quantizer], @@ -196,11 +203,10 @@ def test_quantized_model( @pytest.mark.parametrize( "quantizer_builder", [ - get_xnnpack_quantizer, get_x86_quantizer, get_openvino_quantizer, ], - ids=["XNNPACKQuantizer", "X86InductorQuantizer", "OpenVINOQuantizer"], + ids=["X86InductorQuantizer", "OpenVINOQuantizer"], ) def test_quantizer_setup( quantizer_builder: Callable[[tuple[Any, ...]], Quantizer], @@ -265,7 +271,7 @@ def _normalize_qsetup_state(setup: dict[str, Any]) -> None: def _normalize_nncf_graph(nncf_graph: NNCFGraph, fx_graph: torch.fx.Graph): """ Normalizes the given 
NNCFGraph by renaming quantize/dequantize nodes to ensure consistent naming across runs. - XNNPACKQuantizer and X86InductorQuantizer quantizers insert quantize and dequantize nodes + X86InductorQuantizer quantizer inserts quantize and dequantize nodes with inconsistent names across runs. This function assigns standardized names to such nodes to maintain consistency. @@ -320,6 +326,8 @@ def _normalize_nncf_graph(nncf_graph: NNCFGraph, fx_graph: torch.fx.Graph): ids=[m[0].model_id for m in TEST_MODELS_QUANIZED], ) def test_openvino_quantizer_with_torch_ao_convert_pt2e(model_case: ModelCase, quantizer_params): + if not TORCHAO_IS_AVAILABLE: + pytest.skip("Test requires torchao to be installed.") quantizer = get_openvino_quantizer(**quantizer_params) fx_model, example_input = _build_torch_fx_model(model_case) prepared_model = prepare_pt2e(fx_model, quantizer)