diff --git a/docs/.buildinfo b/docs/.buildinfo index a1a912d62..cae0c3496 100644 --- a/docs/.buildinfo +++ b/docs/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build info version 1 # This file records the configuration used when building these files. When it is not found, a full rebuild will be done. -config: b35b7de06e13d9a56a35dbd44d23b55a +config: cf075e835198a4e6788d0d1e99f1ccaa tags: 645f666f9bcd5a90fca523b33c5a78b7 diff --git a/docs/_sources/api/api_docs/index.rst.txt b/docs/_sources/api/api_docs/index.rst.txt index 53a0ef9b1..9299c1f9f 100644 --- a/docs/_sources/api/api_docs/index.rst.txt +++ b/docs/_sources/api/api_docs/index.rst.txt @@ -109,7 +109,8 @@ keras_load_quantized_model target_platform_capabilities ============================== - :ref:`target_platform_capabilities`: Module to create and model hardware-related settings to optimize the model according to, by the hardware the optimized model will use during inference. -- :ref:`get_target_platform_capabilities`: A function to get a target platform model for Tensorflow and Pytorch. +- :ref:`get_target_platform_capabilities`: A function to get a TargetPlatformCapabilities for tpc version and device type. +- :ref:`get_target_platform_capabilities_sdsp`: A function to get a TargetPlatformCapabilities for sdsp converter version. - :ref:`DefaultDict`: Util class for creating a TargetPlatformCapabilities. wrapper diff --git a/docs/_sources/api/api_docs/methods/get_target_platform_capabilities.rst.txt b/docs/_sources/api/api_docs/methods/get_target_platform_capabilities.rst.txt index e8346a359..0fbb7ff66 100644 --- a/docs/_sources/api/api_docs/methods/get_target_platform_capabilities.rst.txt +++ b/docs/_sources/api/api_docs/methods/get_target_platform_capabilities.rst.txt @@ -3,9 +3,9 @@ .. _ug-get_target_platform_capabilities: -======================================= -Get FrameworkQuantizationCapabilities -======================================= +===================================================== +Get TargetPlatformCapabilities for tpc version +===================================================== .. autofunction:: model_compression_toolkit.get_target_platform_capabilities diff --git a/docs/_sources/api/api_docs/methods/get_target_platform_capabilities_sdsp.rst.txt b/docs/_sources/api/api_docs/methods/get_target_platform_capabilities_sdsp.rst.txt new file mode 100644 index 000000000..d5b0f0f24 --- /dev/null +++ b/docs/_sources/api/api_docs/methods/get_target_platform_capabilities_sdsp.rst.txt @@ -0,0 +1,13 @@ +:orphan: + +.. _ug-get_target_platform_capabilities_sdsp: + + +============================================================= +Get TargetPlatformCapabilities for sdsp converter version +============================================================= + +.. autofunction:: model_compression_toolkit.get_target_platform_capabilities_sdsp + + +.. include:: ../notes/tpc_note.rst \ No newline at end of file diff --git a/docs/_sources/api/api_docs/modules/target_platform_capabilities.rst.txt b/docs/_sources/api/api_docs/modules/target_platform_capabilities.rst.txt index f0d1eb94a..c6b0504e6 100644 --- a/docs/_sources/api/api_docs/modules/target_platform_capabilities.rst.txt +++ b/docs/_sources/api/api_docs/modules/target_platform_capabilities.rst.txt @@ -16,7 +16,8 @@ Conv2D `_, and can be used using :ref:`get_target_platform_capabilities function`. +Models for IMX500, TFLite and qnnpack can be observed `here `_, and can be retrieved using :ref:`get_target_platform_capabilities function`. +You can also get the model for IMX500 using :ref:`get_target_platform_capabilities_sdsp function` that specifies the sdsp converter version. | diff --git a/docs/api/api_docs/classes/BitWidthConfig.html b/docs/api/api_docs/classes/BitWidthConfig.html index 01973971f..b0b40de8d 100644 --- a/docs/api/api_docs/classes/BitWidthConfig.html +++ b/docs/api/api_docs/classes/BitWidthConfig.html @@ -6,12 +6,12 @@ - BitWidthConfig — MCT Documentation: ver 2.5.0 + BitWidthConfig — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

Navigation

  • index
  • - + @@ -150,7 +150,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/classes/DataGenerationConfig.html b/docs/api/api_docs/classes/DataGenerationConfig.html index b55e54623..961d25c3c 100644 --- a/docs/api/api_docs/classes/DataGenerationConfig.html +++ b/docs/api/api_docs/classes/DataGenerationConfig.html @@ -6,12 +6,12 @@ - Data Generation Configuration — MCT Documentation: ver 2.5.0 + Data Generation Configuration — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -233,7 +233,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/classes/DefaultDict.html b/docs/api/api_docs/classes/DefaultDict.html index 1747d9f0b..da301735f 100644 --- a/docs/api/api_docs/classes/DefaultDict.html +++ b/docs/api/api_docs/classes/DefaultDict.html @@ -6,12 +6,12 @@ - DefaultDict Class — MCT Documentation: ver 2.5.0 + DefaultDict Class — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -125,7 +125,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/classes/FrameworkInfo.html b/docs/api/api_docs/classes/FrameworkInfo.html index 5b7e9e32c..ea1edcf39 100644 --- a/docs/api/api_docs/classes/FrameworkInfo.html +++ b/docs/api/api_docs/classes/FrameworkInfo.html @@ -6,12 +6,12 @@ - FrameworkInfo Class — MCT Documentation: ver 2.5.0 + FrameworkInfo Class — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -145,7 +145,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/classes/GradientPTQConfig.html b/docs/api/api_docs/classes/GradientPTQConfig.html index 488417e24..6eef769e0 100644 --- a/docs/api/api_docs/classes/GradientPTQConfig.html +++ b/docs/api/api_docs/classes/GradientPTQConfig.html @@ -6,12 +6,12 @@ - GradientPTQConfig Class — MCT Documentation: ver 2.5.0 + GradientPTQConfig Class — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -192,7 +192,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/classes/MixedPrecisionQuantizationConfig.html b/docs/api/api_docs/classes/MixedPrecisionQuantizationConfig.html index 99cbed160..66958461e 100644 --- a/docs/api/api_docs/classes/MixedPrecisionQuantizationConfig.html +++ b/docs/api/api_docs/classes/MixedPrecisionQuantizationConfig.html @@ -6,12 +6,12 @@ - MixedPrecisionQuantizationConfig — MCT Documentation: ver 2.5.0 + MixedPrecisionQuantizationConfig — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -143,7 +143,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/classes/PruningConfig.html b/docs/api/api_docs/classes/PruningConfig.html index e5de72d38..3b26964b7 100644 --- a/docs/api/api_docs/classes/PruningConfig.html +++ b/docs/api/api_docs/classes/PruningConfig.html @@ -6,12 +6,12 @@ - Pruning Configuration — MCT Documentation: ver 2.5.0 + Pruning Configuration — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -168,7 +168,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/classes/PruningInfo.html b/docs/api/api_docs/classes/PruningInfo.html index 42813088f..d5902a26d 100644 --- a/docs/api/api_docs/classes/PruningInfo.html +++ b/docs/api/api_docs/classes/PruningInfo.html @@ -6,12 +6,12 @@ - Pruning Information — MCT Documentation: ver 2.5.0 + Pruning Information — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -127,7 +127,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/classes/QuantizationConfig.html b/docs/api/api_docs/classes/QuantizationConfig.html index 3ab58a91a..0684381e1 100644 --- a/docs/api/api_docs/classes/QuantizationConfig.html +++ b/docs/api/api_docs/classes/QuantizationConfig.html @@ -6,12 +6,12 @@ - QuantizationConfig — MCT Documentation: ver 2.5.0 + QuantizationConfig — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -95,7 +95,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/classes/QuantizationErrorMethod.html b/docs/api/api_docs/classes/QuantizationErrorMethod.html index ab0d196a2..ddbfcdd9d 100644 --- a/docs/api/api_docs/classes/QuantizationErrorMethod.html +++ b/docs/api/api_docs/classes/QuantizationErrorMethod.html @@ -6,12 +6,12 @@ - QuantizationErrorMethod — MCT Documentation: ver 2.5.0 + QuantizationErrorMethod — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -92,7 +92,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/classes/ResourceUtilization.html b/docs/api/api_docs/classes/ResourceUtilization.html index 9a9de2dc4..53472a0fe 100644 --- a/docs/api/api_docs/classes/ResourceUtilization.html +++ b/docs/api/api_docs/classes/ResourceUtilization.html @@ -6,12 +6,12 @@ - ResourceUtilization — MCT Documentation: ver 2.5.0 + ResourceUtilization — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -90,7 +90,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/classes/Wrapper.html b/docs/api/api_docs/classes/Wrapper.html index 4631983cb..26d92e92e 100644 --- a/docs/api/api_docs/classes/Wrapper.html +++ b/docs/api/api_docs/classes/Wrapper.html @@ -6,12 +6,12 @@ - wrapper — MCT Documentation: ver 2.5.0 + wrapper — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -337,7 +337,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/classes/XQuantConfig.html b/docs/api/api_docs/classes/XQuantConfig.html index 4b82d83b2..c5f9b7f53 100644 --- a/docs/api/api_docs/classes/XQuantConfig.html +++ b/docs/api/api_docs/classes/XQuantConfig.html @@ -6,12 +6,12 @@ - XQuant Configuration — MCT Documentation: ver 2.5.0 + XQuant Configuration — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -116,7 +116,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/index.html b/docs/api/api_docs/index.html index e7526110b..b61a8764c 100644 --- a/docs/api/api_docs/index.html +++ b/docs/api/api_docs/index.html @@ -6,12 +6,12 @@ - API Docs — MCT Documentation: ver 2.5.0 + API Docs — MCT Documentation: ver 2.5.1 - + @@ -32,7 +32,7 @@

    Navigation

  • previous |
  • - + @@ -148,7 +148,8 @@

    keras_load_quantized_model

    @@ -230,7 +231,7 @@

    Navigation

  • previous |
  • - + diff --git a/docs/api/api_docs/methods/get_keras_data_generation_config.html b/docs/api/api_docs/methods/get_keras_data_generation_config.html index 9339752ee..38e52c474 100644 --- a/docs/api/api_docs/methods/get_keras_data_generation_config.html +++ b/docs/api/api_docs/methods/get_keras_data_generation_config.html @@ -6,12 +6,12 @@ - Get DataGenerationConfig for Keras Models — MCT Documentation: ver 2.5.0 + Get DataGenerationConfig for Keras Models — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -116,7 +116,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/get_keras_gptq_config.html b/docs/api/api_docs/methods/get_keras_gptq_config.html index 1b7cbf373..aea93ccbc 100644 --- a/docs/api/api_docs/methods/get_keras_gptq_config.html +++ b/docs/api/api_docs/methods/get_keras_gptq_config.html @@ -6,12 +6,12 @@ - Get GradientPTQConfig for Keras Models — MCT Documentation: ver 2.5.0 + Get GradientPTQConfig for Keras Models — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -122,7 +122,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/get_pytorch_data_generation_config.html b/docs/api/api_docs/methods/get_pytorch_data_generation_config.html index 0898e812e..59376ebbd 100644 --- a/docs/api/api_docs/methods/get_pytorch_data_generation_config.html +++ b/docs/api/api_docs/methods/get_pytorch_data_generation_config.html @@ -6,12 +6,12 @@ - Get DataGenerationConfig for Pytorch Models — MCT Documentation: ver 2.5.0 + Get DataGenerationConfig for Pytorch Models — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -117,7 +117,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/get_pytroch_gptq_config.html b/docs/api/api_docs/methods/get_pytroch_gptq_config.html index 651c7a1ed..93fa4ed47 100644 --- a/docs/api/api_docs/methods/get_pytroch_gptq_config.html +++ b/docs/api/api_docs/methods/get_pytroch_gptq_config.html @@ -6,12 +6,12 @@ - Get GradientPTQConfig for Pytorch Models — MCT Documentation: ver 2.5.0 + Get GradientPTQConfig for Pytorch Models — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -119,7 +119,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/get_target_platform_capabilities.html b/docs/api/api_docs/methods/get_target_platform_capabilities.html index 4db07bf46..2597880e4 100644 --- a/docs/api/api_docs/methods/get_target_platform_capabilities.html +++ b/docs/api/api_docs/methods/get_target_platform_capabilities.html @@ -6,12 +6,12 @@ - Get FrameworkQuantizationCapabilities — MCT Documentation: ver 2.5.0 + Get TargetPlatformCapabilities for tpc version — MCT Documentation: ver 2.5.1 - + @@ -28,8 +28,8 @@

    Navigation

  • index
  • - - + + @@ -38,26 +38,24 @@

    Navigation

    -
    -

    Get FrameworkQuantizationCapabilities

    +
    +

    Get TargetPlatformCapabilities for tpc version

    -model_compression_toolkit.get_target_platform_capabilities(fw_name, target_platform_name, target_platform_version=None)
    -

    This is a degenerated function that only returns the MCT default TargetPlatformCapabilities object, to comply with the -existing TPC API.

    +model_compression_toolkit.get_target_platform_capabilities(tpc_version=TPC_V1_0, device_type=IMX500_TP_MODEL) +

    Retrieves target platform capabilities model based on tpc version and the specified device type.

    Return type:

    TargetPlatformCapabilities

    Parameters:
      -
    • fw_name – Framework name of the FrameworkQuantizationCapabilities.

    • -
    • target_platform_name – Target platform model name the model will use for inference.

    • -
    • target_platform_version – Target platform capabilities version.

    • +
    • tpc_version (str) – Target platform capabilities version.

    • +
    • device_type (str) – The type of device for the target platform.

    Returns:
    -

    A default TargetPlatformCapabilities object.

    +

    The TargetPlatformCapabilities object matching the tpc version.

    @@ -82,7 +80,7 @@

    Navigation

    @@ -127,7 +127,7 @@

    Navigation

  • index
  • - +
    diff --git a/docs/api/api_docs/methods/keras_gradient_post_training_quantization.html b/docs/api/api_docs/methods/keras_gradient_post_training_quantization.html index d894d22e6..925edb175 100644 --- a/docs/api/api_docs/methods/keras_gradient_post_training_quantization.html +++ b/docs/api/api_docs/methods/keras_gradient_post_training_quantization.html @@ -6,12 +6,12 @@ - Keras Gradient Based Post Training Quantization — MCT Documentation: ver 2.5.0 + Keras Gradient Based Post Training Quantization — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - +
    @@ -157,7 +157,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/keras_kpi_data.html b/docs/api/api_docs/methods/keras_kpi_data.html index 92338849d..c3420da49 100644 --- a/docs/api/api_docs/methods/keras_kpi_data.html +++ b/docs/api/api_docs/methods/keras_kpi_data.html @@ -6,12 +6,12 @@ - Get Resource Utilization information for Keras Models — MCT Documentation: ver 2.5.0 + Get Resource Utilization information for Keras Models — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -120,7 +120,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/keras_load_quantizad_model.html b/docs/api/api_docs/methods/keras_load_quantizad_model.html index f687ef409..34e1ea8ee 100644 --- a/docs/api/api_docs/methods/keras_load_quantizad_model.html +++ b/docs/api/api_docs/methods/keras_load_quantizad_model.html @@ -6,12 +6,12 @@ - Load Quantized Keras Model — MCT Documentation: ver 2.5.0 + Load Quantized Keras Model — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -96,7 +96,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/keras_post_training_quantization.html b/docs/api/api_docs/methods/keras_post_training_quantization.html index 55ffd62fc..87f877437 100644 --- a/docs/api/api_docs/methods/keras_post_training_quantization.html +++ b/docs/api/api_docs/methods/keras_post_training_quantization.html @@ -6,12 +6,12 @@ - Keras Post Training Quantization — MCT Documentation: ver 2.5.0 + Keras Post Training Quantization — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -154,7 +154,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/keras_pruning_experimental.html b/docs/api/api_docs/methods/keras_pruning_experimental.html index ea330ad34..64247dc9b 100644 --- a/docs/api/api_docs/methods/keras_pruning_experimental.html +++ b/docs/api/api_docs/methods/keras_pruning_experimental.html @@ -6,12 +6,12 @@ - Keras Structured Pruning — MCT Documentation: ver 2.5.0 + Keras Structured Pruning — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -150,7 +150,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/keras_quantization_aware_training_finalize_experimental.html b/docs/api/api_docs/methods/keras_quantization_aware_training_finalize_experimental.html index 792056b85..548a71316 100644 --- a/docs/api/api_docs/methods/keras_quantization_aware_training_finalize_experimental.html +++ b/docs/api/api_docs/methods/keras_quantization_aware_training_finalize_experimental.html @@ -6,12 +6,12 @@ - Keras Quantization Aware Training Model Finalize — MCT Documentation: ver 2.5.0 + Keras Quantization Aware Training Model Finalize — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -137,7 +137,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/keras_quantization_aware_training_init_experimental.html b/docs/api/api_docs/methods/keras_quantization_aware_training_init_experimental.html index c4be46c17..307b1d8ca 100644 --- a/docs/api/api_docs/methods/keras_quantization_aware_training_init_experimental.html +++ b/docs/api/api_docs/methods/keras_quantization_aware_training_init_experimental.html @@ -6,12 +6,12 @@ - Keras Quantization Aware Training Model Init — MCT Documentation: ver 2.5.0 + Keras Quantization Aware Training Model Init — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -159,7 +159,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/pytorch_data_generation_experimental.html b/docs/api/api_docs/methods/pytorch_data_generation_experimental.html index 9a2a79150..6b4889bbb 100644 --- a/docs/api/api_docs/methods/pytorch_data_generation_experimental.html +++ b/docs/api/api_docs/methods/pytorch_data_generation_experimental.html @@ -6,12 +6,12 @@ - Pytorch Data Generation — MCT Documentation: ver 2.5.0 + Pytorch Data Generation — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -127,7 +127,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/pytorch_gradient_post_training_quantization.html b/docs/api/api_docs/methods/pytorch_gradient_post_training_quantization.html index 860fc19e2..bdc476902 100644 --- a/docs/api/api_docs/methods/pytorch_gradient_post_training_quantization.html +++ b/docs/api/api_docs/methods/pytorch_gradient_post_training_quantization.html @@ -6,12 +6,12 @@ - Pytorch Gradient Based Post Training Quantization — MCT Documentation: ver 2.5.0 + Pytorch Gradient Based Post Training Quantization — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -144,7 +144,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/pytorch_kpi_data.html b/docs/api/api_docs/methods/pytorch_kpi_data.html index 99809066d..11a514419 100644 --- a/docs/api/api_docs/methods/pytorch_kpi_data.html +++ b/docs/api/api_docs/methods/pytorch_kpi_data.html @@ -6,12 +6,12 @@ - Get Resource Utilization information for PyTorch Models — MCT Documentation: ver 2.5.0 + Get Resource Utilization information for PyTorch Models — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -118,7 +118,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/pytorch_post_training_quantization.html b/docs/api/api_docs/methods/pytorch_post_training_quantization.html index 16a5ef7b5..ca448eb46 100644 --- a/docs/api/api_docs/methods/pytorch_post_training_quantization.html +++ b/docs/api/api_docs/methods/pytorch_post_training_quantization.html @@ -6,12 +6,12 @@ - Pytorch Post Training Quantization — MCT Documentation: ver 2.5.0 + Pytorch Post Training Quantization — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -133,7 +133,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/pytorch_pruning_experimental.html b/docs/api/api_docs/methods/pytorch_pruning_experimental.html index 96b625122..2edccaff9 100644 --- a/docs/api/api_docs/methods/pytorch_pruning_experimental.html +++ b/docs/api/api_docs/methods/pytorch_pruning_experimental.html @@ -6,12 +6,12 @@ - Pytorch Structured Pruning — MCT Documentation: ver 2.5.0 + Pytorch Structured Pruning — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -42,7 +42,7 @@

    Navigation

    Pytorch Structured Pruning

    -model_compression_toolkit.pruning.pytorch_pruning_experimental(model, target_resource_utilization, representative_data_gen, pruning_config=PruningConfig(), target_platform_capabilities=DEFAULT_PYOTRCH_TPC)
    +model_compression_toolkit.pruning.pytorch_pruning_experimental(model, target_resource_utilization, representative_data_gen, pruning_config=PruningConfig(), target_platform_capabilities=DEFAULT_PYTORCH_TPC)

    Perform structured pruning on a Pytorch model to meet a specified target resource utilization. This function prunes the provided model according to the target resource utilization by grouping and pruning channels based on each layer’s SIMD configuration in the Target Platform Capabilities (TPC). @@ -151,7 +151,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/pytorch_quantization_aware_training_finalize_experimental.html b/docs/api/api_docs/methods/pytorch_quantization_aware_training_finalize_experimental.html index f11946e4b..7e27a9285 100644 --- a/docs/api/api_docs/methods/pytorch_quantization_aware_training_finalize_experimental.html +++ b/docs/api/api_docs/methods/pytorch_quantization_aware_training_finalize_experimental.html @@ -6,12 +6,12 @@ - PyTorch Quantization Aware Training Model Finalize — MCT Documentation: ver 2.5.0 + PyTorch Quantization Aware Training Model Finalize — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -122,7 +122,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/pytorch_quantization_aware_training_init_experimental.html b/docs/api/api_docs/methods/pytorch_quantization_aware_training_init_experimental.html index c8ac6a00e..3e5e1e85d 100644 --- a/docs/api/api_docs/methods/pytorch_quantization_aware_training_init_experimental.html +++ b/docs/api/api_docs/methods/pytorch_quantization_aware_training_init_experimental.html @@ -6,12 +6,12 @@ - PyTorch Quantization Aware Training Model Init — MCT Documentation: ver 2.5.0 + PyTorch Quantization Aware Training Model Init — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -140,7 +140,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/set_logger_path.html b/docs/api/api_docs/methods/set_logger_path.html index 3a0463d08..6736cfb16 100644 --- a/docs/api/api_docs/methods/set_logger_path.html +++ b/docs/api/api_docs/methods/set_logger_path.html @@ -6,12 +6,12 @@ - Enable a Logger — MCT Documentation: ver 2.5.0 + Enable a Logger — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -45,10 +45,13 @@

    Navigation

    model_compression_toolkit.set_log_folder(folder, level=logging.INFO)

    Set a directory path for saving a log file.

    -
    Parameters:
    -
      -
    • folder – Folder path to save the log file.

    • -
    • level – Level of verbosity to set to the logger and handlers.

    • +
      Return type:
      +

      None

      +
      +
      Parameters:
      +
        +
      • folder (str) – Folder path to save the log file.

      • +
      • level (int) – Level of verbosity to set to the logger and handlers.

    @@ -99,7 +102,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/xquant_report_keras_experimental.html b/docs/api/api_docs/methods/xquant_report_keras_experimental.html index 3b060d3c6..0f4a964a4 100644 --- a/docs/api/api_docs/methods/xquant_report_keras_experimental.html +++ b/docs/api/api_docs/methods/xquant_report_keras_experimental.html @@ -6,12 +6,12 @@ - XQuant Report Keras — MCT Documentation: ver 2.5.0 + XQuant Report Keras — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -105,7 +105,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/xquant_report_pytorch_experimental.html b/docs/api/api_docs/methods/xquant_report_pytorch_experimental.html index fbb364969..351e51b7a 100644 --- a/docs/api/api_docs/methods/xquant_report_pytorch_experimental.html +++ b/docs/api/api_docs/methods/xquant_report_pytorch_experimental.html @@ -6,12 +6,12 @@ - XQuant Report Pytorch — MCT Documentation: ver 2.5.0 + XQuant Report Pytorch — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -102,7 +102,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/methods/xquant_report_troubleshoot_pytorch_experimental.html b/docs/api/api_docs/methods/xquant_report_troubleshoot_pytorch_experimental.html index ec2c91497..71415e4b8 100644 --- a/docs/api/api_docs/methods/xquant_report_troubleshoot_pytorch_experimental.html +++ b/docs/api/api_docs/methods/xquant_report_troubleshoot_pytorch_experimental.html @@ -6,12 +6,12 @@ - XQuant Report Troubleshoot Pytorch — MCT Documentation: ver 2.5.0 + XQuant Report Troubleshoot Pytorch — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -103,7 +103,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/modules/core_config.html b/docs/api/api_docs/modules/core_config.html index b234f0bb4..27f0b2553 100644 --- a/docs/api/api_docs/modules/core_config.html +++ b/docs/api/api_docs/modules/core_config.html @@ -6,12 +6,12 @@ - CoreConfig — MCT Documentation: ver 2.5.0 + CoreConfig — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -97,7 +97,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/modules/debug_config.html b/docs/api/api_docs/modules/debug_config.html index 5d51bac9d..f1557e002 100644 --- a/docs/api/api_docs/modules/debug_config.html +++ b/docs/api/api_docs/modules/debug_config.html @@ -6,12 +6,12 @@ - debug_config Module — MCT Documentation: ver 2.5.0 + debug_config Module — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -103,7 +103,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/modules/exporter.html b/docs/api/api_docs/modules/exporter.html index ab335a595..a4c2410f2 100644 --- a/docs/api/api_docs/modules/exporter.html +++ b/docs/api/api_docs/modules/exporter.html @@ -6,12 +6,12 @@ - exporter Module — MCT Documentation: ver 2.5.0 + exporter Module — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -345,7 +345,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/modules/layer_filters.html b/docs/api/api_docs/modules/layer_filters.html index cfaba6dbc..f69824f78 100644 --- a/docs/api/api_docs/modules/layer_filters.html +++ b/docs/api/api_docs/modules/layer_filters.html @@ -6,12 +6,12 @@ - Layer Attributes Filters — MCT Documentation: ver 2.5.0 + Layer Attributes Filters — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -220,7 +220,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/modules/network_editor.html b/docs/api/api_docs/modules/network_editor.html index 15c5543dc..2509246ba 100644 --- a/docs/api/api_docs/modules/network_editor.html +++ b/docs/api/api_docs/modules/network_editor.html @@ -6,12 +6,12 @@ - network_editor Module — MCT Documentation: ver 2.5.0 + network_editor Module — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -298,7 +298,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/modules/qat_config.html b/docs/api/api_docs/modules/qat_config.html index c264cd215..e7dea053f 100644 --- a/docs/api/api_docs/modules/qat_config.html +++ b/docs/api/api_docs/modules/qat_config.html @@ -6,12 +6,12 @@ - qat_config Module — MCT Documentation: ver 2.5.0 + qat_config Module — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -110,7 +110,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/modules/target_platform_capabilities.html b/docs/api/api_docs/modules/target_platform_capabilities.html index 9796231c6..3a93a679c 100644 --- a/docs/api/api_docs/modules/target_platform_capabilities.html +++ b/docs/api/api_docs/modules/target_platform_capabilities.html @@ -6,12 +6,12 @@ - target_platform_capabilities Module — MCT Documentation: ver 2.5.0 + target_platform_capabilities Module — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -48,7 +48,8 @@

    Navigation

    Conv2D.

    This can be addressed in MCT by using the target_platform_capabilities module, that can configure different parameters that are hardware-related, and the optimization process will use this to optimize the model accordingly. -Models for IMX500, TFLite and qnnpack can be observed here, and can be used using get_target_platform_capabilities function.

    +Models for IMX500, TFLite and qnnpack can be observed here, and can be retrieved using get_target_platform_capabilities function. +You can also get the model for IMX500 using get_target_platform_capabilities_sdsp function that specifies the sdsp converter version.


    @@ -588,7 +589,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/modules/trainable_infrastructure.html b/docs/api/api_docs/modules/trainable_infrastructure.html index 7488cd9ef..6b5c3c3d5 100644 --- a/docs/api/api_docs/modules/trainable_infrastructure.html +++ b/docs/api/api_docs/modules/trainable_infrastructure.html @@ -6,12 +6,12 @@ - trainable_infrastructure Module — MCT Documentation: ver 2.5.0 + trainable_infrastructure Module — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -237,7 +237,7 @@

    Navigation

  • index
  • - + diff --git a/docs/api/api_docs/notes/tpc_note.html b/docs/api/api_docs/notes/tpc_note.html index ce7a17951..cdff15b96 100644 --- a/docs/api/api_docs/notes/tpc_note.html +++ b/docs/api/api_docs/notes/tpc_note.html @@ -6,12 +6,12 @@ - <no title> — MCT Documentation: ver 2.5.0 + <no title> — MCT Documentation: ver 2.5.1 - + @@ -28,7 +28,7 @@

    Navigation

  • index
  • - + @@ -74,7 +74,7 @@

    Navigation

  • index
  • - + diff --git a/docs/genindex.html b/docs/genindex.html index f9199ee96..7d2f0a39f 100644 --- a/docs/genindex.html +++ b/docs/genindex.html @@ -5,12 +5,12 @@ - Index — MCT Documentation: ver 2.5.0 + Index — MCT Documentation: ver 2.5.1 - + @@ -27,7 +27,7 @@

    Navigation

  • index
  • - + @@ -193,10 +193,12 @@

    G

  • get_pytorch_data_generation_config() (in module model_compression_toolkit.data_generation)
  • get_pytorch_gptq_config() (in module model_compression_toolkit.gptq) +
  • +
  • get_target_platform_capabilities() (in module model_compression_toolkit)
  • diff --git a/docs/guidelines/XQuant_Extension_Tool.html b/docs/guidelines/XQuant_Extension_Tool.html index 6afabb59d..008830b18 100644 --- a/docs/guidelines/XQuant_Extension_Tool.html +++ b/docs/guidelines/XQuant_Extension_Tool.html @@ -6,12 +6,12 @@ - XQuant Extension Tool — MCT Documentation: ver 2.5.0 + XQuant Extension Tool — MCT Documentation: ver 2.5.1 - + @@ -36,7 +36,7 @@

    Navigation

  • previous |
  • - + @@ -414,7 +414,7 @@

    Navigation

  • previous |
  • - + diff --git a/docs/guidelines/visualization.html b/docs/guidelines/visualization.html index a8549fc1f..eee7da8fb 100644 --- a/docs/guidelines/visualization.html +++ b/docs/guidelines/visualization.html @@ -6,12 +6,12 @@ - Visualization within TensorBoard — MCT Documentation: ver 2.5.0 + Visualization within TensorBoard — MCT Documentation: ver 2.5.1 - + @@ -36,7 +36,7 @@

    Navigation

  • previous |
  • - + @@ -192,7 +192,7 @@

    Navigation

  • previous |
  • - + diff --git a/docs/index.html b/docs/index.html index 35ab340de..a70c72f06 100644 --- a/docs/index.html +++ b/docs/index.html @@ -6,12 +6,12 @@ - Model Compression Toolkit User Guide — MCT Documentation: ver 2.5.0 + Model Compression Toolkit User Guide — MCT Documentation: ver 2.5.1 - + @@ -32,7 +32,7 @@

    Navigation

  • next |
  • - + @@ -175,7 +175,7 @@

    Navigation

  • next |
  • - + diff --git a/docs/objects.inv b/docs/objects.inv index d109c3ef3..38bb93be1 100644 Binary files a/docs/objects.inv and b/docs/objects.inv differ diff --git a/docs/search.html b/docs/search.html index 7848a4b79..f8166344b 100644 --- a/docs/search.html +++ b/docs/search.html @@ -5,13 +5,13 @@ - Search — MCT Documentation: ver 2.5.0 + Search — MCT Documentation: ver 2.5.1 - + @@ -34,7 +34,7 @@

    Navigation

  • index
  • - + @@ -88,7 +88,7 @@

    Navigation

  • index
  • - + diff --git a/docs/searchindex.js b/docs/searchindex.js index 6d3c96471..2439e291a 100644 --- a/docs/searchindex.js +++ b/docs/searchindex.js @@ -1 +1 @@ -Search.setIndex({"alltitles": {"API Docs": [[13, null]], "API Documentation": [[49, "api-documentation"]], "About XQuant Extension Tool": [[47, "about-xquant-extension-tool"]], "Actions": [[42, "actions"]], "Attribute Filters": [[41, "attribute-filters"]], "AttributeQuantizationConfig": [[44, "attributequantizationconfig"]], "BNLayerWeightingType": [[1, "bnlayerweightingtype"]], "BaseKerasTrainableQuantizer": [[45, "basekerastrainablequantizer"]], "BasePytorchTrainableQuantizer": [[45, "basepytorchtrainablequantizer"]], "BatchNormAlignemntLossType": [[1, "batchnormalignemntlosstype"]], "BitWidthConfig": [[0, null]], "ChannelAxis": [[3, "channelaxis"]], "ChannelsFilteringStrategy": [[6, "channelsfilteringstrategy"]], "CoreConfig": [[38, null]], "Cosine Similarity Comparison": [[48, "cosine-similarity-comparison"]], "Data Generation Configuration": [[1, null]], "DataInitType": [[1, "datainittype"]], "DebugConfig": [[39, "debugconfig"]], "DefaultDict Class": [[2, null]], "EditRule": [[42, "editrule"]], "Enable a Logger": [[34, null]], "Filters": [[42, "filters"]], "FrameworkInfo Class": [[3, null]], "Fusing": [[44, "fusing"]], "GPTQHessianScoresConfig Class": [[4, "gptqhessianscoresconfig-class"]], "Get DataGenerationConfig for Keras Models": [[14, null]], "Get DataGenerationConfig for Pytorch Models": [[16, null]], "Get FrameworkQuantizationCapabilities": [[18, null]], "Get GradientPTQConfig for Keras Models": [[15, null]], "Get GradientPTQConfig for Pytorch Models": [[17, null]], "Get Resource Utilization information for Keras Models": [[21, null]], "Get Resource Utilization information for PyTorch Models": [[29, null]], "GradientPTQConfig Class": [[4, null]], "GradualActivationQuantizationConfig": [[4, "gradualactivationquantizationconfig"]], "How to Run": [[47, "how-to-run"]], "ImageGranularity": [[1, "imagegranularity"]], "ImageNormalizationType": [[1, "imagenormalizationtype"]], "ImagePipelineType": [[1, "imagepipelinetype"]], "ImportanceMetric": [[6, "importancemetric"]], "Indices and tables": [[13, "indices-and-tables"]], "Install": [[49, "install"]], "Keras Data Generation": [[19, null]], "Keras Gradient Based Post Training Quantization": [[20, null]], "Keras Post Training Quantization": [[23, null]], "Keras Quantization Aware Training Model Finalize": [[25, null]], "Keras Quantization Aware Training Model Init": [[26, null]], "Keras Structured Pruning": [[24, null]], "Keras Tutorial": [[40, "keras-tutorial"]], "KerasExportSerializationFormat": [[40, "kerasexportserializationformat"]], "Layer Attributes Filters": [[41, null]], "Load Quantized Keras Model": [[22, null]], "MCTQ": [[40, "mctq"]], "MCTQ Quantization Format": [[40, "mctq-quantization-format"]], "ManualBitWidthSelection": [[0, "manualbitwidthselection"]], "Mixed Precision with model output loss objective": [[47, "mixed-precision-with-model-output-loss-objective"]], "Mixed-precision Configuration Bit-width": [[48, "mixed-precision-configuration-bit-width"]], "MixedPrecisionQuantizationConfig": [[5, null]], "Model Compression Toolkit User Guide": [[49, null]], "MpDistanceWeighting": [[5, "mpdistanceweighting"]], "MpMetricNormalization": [[5, "mpmetricnormalization"]], "ONNX": [[40, "onnx"]], "ONNX model output names": [[40, "onnx-model-output-names"]], "ONNX opset version": [[40, "onnx-opset-version"]], "OpQuantizationConfig": [[44, "opquantizationconfig"]], "OperatorSetGroup": [[44, "operatorsetgroup"]], "OperatorsSet": [[44, "operatorsset"]], "Outlier Removal": [[47, "outlier-removal"]], "OutputLossType": [[1, "outputlosstype"]], "Overall Process Flow": [[47, "overall-process-flow"]], "Overview": [[49, "overview"]], "Pruning Configuration": [[6, null]], "Pruning Information": [[7, null]], "PyTorch Quantization Aware Training Model Finalize": [[32, null]], "PyTorch Quantization Aware Training Model Init": [[33, null]], "Pytorch Data Generation": [[27, null]], "Pytorch Gradient Based Post Training Quantization": [[28, null]], "Pytorch Post Training Quantization": [[30, null]], "Pytorch Structured Pruning": [[31, null]], "Pytorch Tutorial": [[40, "pytorch-tutorial"]], "PytorchExportSerializationFormat": [[40, "pytorchexportserializationformat"]], "QATConfig": [[43, "qatconfig"]], "QFractionLinearAnnealingConfig": [[4, "qfractionlinearannealingconfig"]], "QuantizationConfig": [[8, null]], "QuantizationConfigOptions": [[44, "quantizationconfigoptions"]], "QuantizationErrorMethod": [[9, null]], "QuantizationFormat": [[40, "quantizationformat"]], "QuantizationMethod": [[44, "quantizationmethod"]], "Quickstart": [[49, "quickstart"]], "References": [[49, "references"]], "ResourceUtilization": [[10, null]], "RoundingType": [[4, "roundingtype"]], "SchedulerType": [[1, "schedulertype"]], "Shift Negative Activation": [[47, "shift-negative-activation"]], "Supported Features": [[49, "supported-features"]], "TargetPlatformCapabilities": [[44, "targetplatformcapabilities"]], "Technical Constraints": [[49, "technical-constraints"]], "TrainableQuantizerActivationConfig": [[45, "trainablequantizeractivationconfig"]], "TrainableQuantizerWeightsConfig": [[45, "trainablequantizerweightsconfig"]], "TrainingMethod": [[43, "trainingmethod"], [45, "trainingmethod"]], "Unbalanced Concatnation": [[47, "unbalanced-concatnation"]], "Understanding the Quantization Error Graph": [[47, "understanding-the-quantization-error-graph"]], "Understanding the judgment result": [[47, "understanding-the-judgment-result"]], "Use exported model for inference": [[40, "use-exported-model-for-inference"]], "Visualization within TensorBoard": [[48, null]], "XQuant Configuration": [[12, null]], "XQuant Extension Tool": [[47, null]], "XQuant Report Keras": [[35, null]], "XQuant Report Pytorch": [[36, null]], "XQuant Report Troubleshoot Pytorch": [[37, null]], "XQuantConfig Format and Examples": [[47, "xquantconfig-format-and-examples"]], "XQuantConfig parameter": [[47, "id1"]], "core": [[13, "core"]], "data_generation": [[13, "data-generation"]], "debug_config Module": [[39, null]], "exporter": [[13, "exporter"]], "exporter Module": [[40, null]], "gptq": [[13, "gptq"]], "keras serialization format": [[40, "keras-serialization-format"]], "keras_export_model": [[40, "keras-export-model"]], "keras_load_quantized_model": [[13, "keras-load-quantized-model"]], "network_editor Module": [[42, null]], "pruning": [[13, "pruning"]], "ptq": [[13, "ptq"]], "pytorch_export_model": [[40, "pytorch-export-model"]], "qat": [[13, "qat"]], "qat_config Module": [[43, null]], "set_log_folder": [[13, "set-log-folder"]], "target_platform_capabilities": [[13, "target-platform-capabilities"]], "target_platform_capabilities Module": [[44, null]], "trainable_infrastructure": [[13, "trainable-infrastructure"]], "trainable_infrastructure Module": [[45, null]], "wrapper": [[11, null], [13, "wrapper"]], "xquant": [[13, "xquant"]]}, "docnames": ["api/api_docs/classes/BitWidthConfig", "api/api_docs/classes/DataGenerationConfig", "api/api_docs/classes/DefaultDict", "api/api_docs/classes/FrameworkInfo", "api/api_docs/classes/GradientPTQConfig", "api/api_docs/classes/MixedPrecisionQuantizationConfig", "api/api_docs/classes/PruningConfig", "api/api_docs/classes/PruningInfo", "api/api_docs/classes/QuantizationConfig", "api/api_docs/classes/QuantizationErrorMethod", "api/api_docs/classes/ResourceUtilization", "api/api_docs/classes/Wrapper", "api/api_docs/classes/XQuantConfig", "api/api_docs/index", "api/api_docs/methods/get_keras_data_generation_config", "api/api_docs/methods/get_keras_gptq_config", "api/api_docs/methods/get_pytorch_data_generation_config", "api/api_docs/methods/get_pytroch_gptq_config", "api/api_docs/methods/get_target_platform_capabilities", "api/api_docs/methods/keras_data_generation_experimental", "api/api_docs/methods/keras_gradient_post_training_quantization", "api/api_docs/methods/keras_kpi_data", "api/api_docs/methods/keras_load_quantizad_model", "api/api_docs/methods/keras_post_training_quantization", "api/api_docs/methods/keras_pruning_experimental", "api/api_docs/methods/keras_quantization_aware_training_finalize_experimental", "api/api_docs/methods/keras_quantization_aware_training_init_experimental", "api/api_docs/methods/pytorch_data_generation_experimental", "api/api_docs/methods/pytorch_gradient_post_training_quantization", "api/api_docs/methods/pytorch_kpi_data", "api/api_docs/methods/pytorch_post_training_quantization", "api/api_docs/methods/pytorch_pruning_experimental", "api/api_docs/methods/pytorch_quantization_aware_training_finalize_experimental", "api/api_docs/methods/pytorch_quantization_aware_training_init_experimental", "api/api_docs/methods/set_logger_path", "api/api_docs/methods/xquant_report_keras_experimental", "api/api_docs/methods/xquant_report_pytorch_experimental", "api/api_docs/methods/xquant_report_troubleshoot_pytorch_experimental", "api/api_docs/modules/core_config", "api/api_docs/modules/debug_config", "api/api_docs/modules/exporter", "api/api_docs/modules/layer_filters", "api/api_docs/modules/network_editor", "api/api_docs/modules/qat_config", "api/api_docs/modules/target_platform_capabilities", "api/api_docs/modules/trainable_infrastructure", "api/api_docs/notes/tpc_note", "guidelines/XQuant_Extension_Tool", "guidelines/visualization", "index"], "envversion": {"sphinx": 64, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2}, "filenames": ["api/api_docs/classes/BitWidthConfig.rst", "api/api_docs/classes/DataGenerationConfig.rst", "api/api_docs/classes/DefaultDict.rst", "api/api_docs/classes/FrameworkInfo.rst", "api/api_docs/classes/GradientPTQConfig.rst", "api/api_docs/classes/MixedPrecisionQuantizationConfig.rst", "api/api_docs/classes/PruningConfig.rst", "api/api_docs/classes/PruningInfo.rst", "api/api_docs/classes/QuantizationConfig.rst", "api/api_docs/classes/QuantizationErrorMethod.rst", "api/api_docs/classes/ResourceUtilization.rst", "api/api_docs/classes/Wrapper.rst", "api/api_docs/classes/XQuantConfig.rst", "api/api_docs/index.rst", "api/api_docs/methods/get_keras_data_generation_config.rst", "api/api_docs/methods/get_keras_gptq_config.rst", "api/api_docs/methods/get_pytorch_data_generation_config.rst", "api/api_docs/methods/get_pytroch_gptq_config.rst", "api/api_docs/methods/get_target_platform_capabilities.rst", "api/api_docs/methods/keras_data_generation_experimental.rst", "api/api_docs/methods/keras_gradient_post_training_quantization.rst", "api/api_docs/methods/keras_kpi_data.rst", "api/api_docs/methods/keras_load_quantizad_model.rst", "api/api_docs/methods/keras_post_training_quantization.rst", "api/api_docs/methods/keras_pruning_experimental.rst", "api/api_docs/methods/keras_quantization_aware_training_finalize_experimental.rst", "api/api_docs/methods/keras_quantization_aware_training_init_experimental.rst", "api/api_docs/methods/pytorch_data_generation_experimental.rst", "api/api_docs/methods/pytorch_gradient_post_training_quantization.rst", "api/api_docs/methods/pytorch_kpi_data.rst", "api/api_docs/methods/pytorch_post_training_quantization.rst", "api/api_docs/methods/pytorch_pruning_experimental.rst", "api/api_docs/methods/pytorch_quantization_aware_training_finalize_experimental.rst", "api/api_docs/methods/pytorch_quantization_aware_training_init_experimental.rst", "api/api_docs/methods/set_logger_path.rst", "api/api_docs/methods/xquant_report_keras_experimental.rst", "api/api_docs/methods/xquant_report_pytorch_experimental.rst", "api/api_docs/methods/xquant_report_troubleshoot_pytorch_experimental.rst", "api/api_docs/modules/core_config.rst", "api/api_docs/modules/debug_config.rst", "api/api_docs/modules/exporter.rst", "api/api_docs/modules/layer_filters.rst", "api/api_docs/modules/network_editor.rst", "api/api_docs/modules/qat_config.rst", "api/api_docs/modules/target_platform_capabilities.rst", "api/api_docs/modules/trainable_infrastructure.rst", "api/api_docs/notes/tpc_note.rst", "guidelines/XQuant_Extension_Tool.rst", "guidelines/visualization.rst", "index.rst"], "indexentries": {"add_metadata (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.add_metadata", false]], "attributefilter (class in model_compression_toolkit.target_platform_capabilities)": [[41, "model_compression_toolkit.target_platform_capabilities.AttributeFilter", false]], "attributequantizationconfig (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig", false]], "base_config (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.quantizationconfigoptions attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.QuantizationConfigOptions.base_config", false]], "basekerastrainablequantizer (class in model_compression_toolkit.trainable_infrastructure)": [[45, "model_compression_toolkit.trainable_infrastructure.BaseKerasTrainableQuantizer", false]], "basepytorchtrainablequantizer (class in model_compression_toolkit.trainable_infrastructure)": [[45, "model_compression_toolkit.trainable_infrastructure.BasePytorchTrainableQuantizer", false]], "batchnormalignemntlosstype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.BatchNormAlignemntLossType", false]], "bit_width (model_compression_toolkit.core.common.quantization.bit_width_config.manualbitwidthselection attribute)": [[0, "model_compression_toolkit.core.common.quantization.bit_width_config.ManualBitWidthSelection.bit_width", false]], "bitwidthconfig (class in model_compression_toolkit.core)": [[0, "model_compression_toolkit.core.BitWidthConfig", false]], "bnlayerweightingtype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.BNLayerWeightingType", false]], "changecandidatesactivationquantconfigattr (class in model_compression_toolkit.core.network_editor)": [[42, "model_compression_toolkit.core.network_editor.ChangeCandidatesActivationQuantConfigAttr", false]], "changecandidatesactivationquantizationmethod (class in model_compression_toolkit.core.network_editor)": [[42, "model_compression_toolkit.core.network_editor.ChangeCandidatesActivationQuantizationMethod", false]], "changecandidatesweightsquantconfigattr (class in model_compression_toolkit.core.network_editor)": [[42, "model_compression_toolkit.core.network_editor.ChangeCandidatesWeightsQuantConfigAttr", false]], "changecandidatesweightsquantizationmethod (class in model_compression_toolkit.core.network_editor)": [[42, "model_compression_toolkit.core.network_editor.ChangeCandidatesWeightsQuantizationMethod", false]], "changefinalactivationquantconfigattr (class in model_compression_toolkit.core.network_editor)": [[42, "model_compression_toolkit.core.network_editor.ChangeFinalActivationQuantConfigAttr", false]], "changefinalweightsquantconfigattr (class in model_compression_toolkit.core.network_editor)": [[42, "model_compression_toolkit.core.network_editor.ChangeFinalWeightsQuantConfigAttr", false]], "changefinalweightsquantizationmethod (class in model_compression_toolkit.core.network_editor)": [[42, "model_compression_toolkit.core.network_editor.ChangeFinalWeightsQuantizationMethod", false]], "changequantizationparamfunction (class in model_compression_toolkit.core.network_editor)": [[42, "model_compression_toolkit.core.network_editor.ChangeQuantizationParamFunction", false]], "channelaxis (class in model_compression_toolkit.core)": [[3, "model_compression_toolkit.core.ChannelAxis", false]], "channels_filtering_strategy (model_compression_toolkit.pruning.pruningconfig attribute)": [[6, "model_compression_toolkit.pruning.PruningConfig.channels_filtering_strategy", false]], "channelsfilteringstrategy (class in model_compression_toolkit.pruning)": [[6, "model_compression_toolkit.pruning.ChannelsFilteringStrategy", false]], "coreconfig (class in model_compression_toolkit.core)": [[38, "model_compression_toolkit.core.CoreConfig", false]], "datagenerationconfig (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.DataGenerationConfig", false]], "datainittype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.DataInitType", false]], "debugconfig (class in model_compression_toolkit.core)": [[39, "model_compression_toolkit.core.DebugConfig", false]], "default_qco (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.default_qco", false]], "defaultdict (class in model_compression_toolkit)": [[2, "model_compression_toolkit.DefaultDict", false]], "editrule (class in model_compression_toolkit.core.network_editor)": [[42, "model_compression_toolkit.core.network_editor.EditRule", false]], "enable_weights_quantization (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.attributequantizationconfig attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig.enable_weights_quantization", false]], "eq (class in model_compression_toolkit.target_platform_capabilities)": [[41, "model_compression_toolkit.target_platform_capabilities.Eq", false]], "filter (model_compression_toolkit.core.common.quantization.bit_width_config.manualbitwidthselection attribute)": [[0, "model_compression_toolkit.core.common.quantization.bit_width_config.ManualBitWidthSelection.filter", false]], "frameworkinfo (class in model_compression_toolkit.core)": [[3, "model_compression_toolkit.core.FrameworkInfo", false]], "fuse_op_quantization_config (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.fusing attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.Fusing.fuse_op_quantization_config", false]], "fusing (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.Fusing", false]], "fusing_patterns (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.fusing_patterns", false]], "get() (model_compression_toolkit.defaultdict method)": [[2, "model_compression_toolkit.DefaultDict.get", false]], "get_keras_data_generation_config() (in module model_compression_toolkit.data_generation)": [[14, "model_compression_toolkit.data_generation.get_keras_data_generation_config", false]], "get_keras_gptq_config() (in module model_compression_toolkit.gptq)": [[15, "model_compression_toolkit.gptq.get_keras_gptq_config", false]], "get_pytorch_data_generation_config() (in module model_compression_toolkit.data_generation)": [[16, "model_compression_toolkit.data_generation.get_pytorch_data_generation_config", false]], "get_pytorch_gptq_config() (in module model_compression_toolkit.gptq)": [[17, "model_compression_toolkit.gptq.get_pytorch_gptq_config", false]], "get_target_platform_capabilities() (in module model_compression_toolkit)": [[18, "model_compression_toolkit.get_target_platform_capabilities", false]], "gptqhessianscoresconfig (class in model_compression_toolkit.gptq)": [[4, "model_compression_toolkit.gptq.GPTQHessianScoresConfig", false]], "gradientptqconfig (class in model_compression_toolkit.gptq)": [[4, "model_compression_toolkit.gptq.GradientPTQConfig", false]], "gradualactivationquantizationconfig (class in model_compression_toolkit.gptq)": [[4, "model_compression_toolkit.gptq.GradualActivationQuantizationConfig", false]], "greater (class in model_compression_toolkit.target_platform_capabilities)": [[41, "model_compression_toolkit.target_platform_capabilities.Greater", false]], "greatereq (class in model_compression_toolkit.target_platform_capabilities)": [[41, "model_compression_toolkit.target_platform_capabilities.GreaterEq", false]], "imagegranularity (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.ImageGranularity", false]], "imagenormalizationtype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.ImageNormalizationType", false]], "imagepipelinetype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.ImagePipelineType", false]], "importance_metric (model_compression_toolkit.pruning.pruningconfig attribute)": [[6, "model_compression_toolkit.pruning.PruningConfig.importance_metric", false]], "importance_scores (model_compression_toolkit.pruning.pruninginfo property)": [[7, "model_compression_toolkit.pruning.PruningInfo.importance_scores", false]], "importancemetric (class in model_compression_toolkit.pruning)": [[6, "model_compression_toolkit.pruning.ImportanceMetric", false]], "insert_preserving_quantizers (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.insert_preserving_quantizers", false]], "is_simd_padding (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.is_simd_padding", false]], "keras_data_generation_experimental() (in module model_compression_toolkit.data_generation)": [[19, "model_compression_toolkit.data_generation.keras_data_generation_experimental", false]], "keras_export_model (class in model_compression_toolkit.exporter)": [[40, "model_compression_toolkit.exporter.keras_export_model", false]], "keras_gradient_post_training_quantization() (in module model_compression_toolkit.gptq)": [[20, "model_compression_toolkit.gptq.keras_gradient_post_training_quantization", false]], "keras_load_quantized_model() (in module model_compression_toolkit)": [[22, "model_compression_toolkit.keras_load_quantized_model", false]], "keras_post_training_quantization() (in module model_compression_toolkit.ptq)": [[23, "model_compression_toolkit.ptq.keras_post_training_quantization", false]], "keras_pruning_experimental() (in module model_compression_toolkit.pruning)": [[24, "model_compression_toolkit.pruning.keras_pruning_experimental", false]], "keras_quantization_aware_training_finalize_experimental() (in module model_compression_toolkit.qat)": [[25, "model_compression_toolkit.qat.keras_quantization_aware_training_finalize_experimental", false]], "keras_quantization_aware_training_init_experimental() (in module model_compression_toolkit.qat)": [[26, "model_compression_toolkit.qat.keras_quantization_aware_training_init_experimental", false]], "keras_resource_utilization_data() (in module model_compression_toolkit.core)": [[21, "model_compression_toolkit.core.keras_resource_utilization_data", false]], "kerasexportserializationformat (class in model_compression_toolkit.exporter)": [[40, "model_compression_toolkit.exporter.KerasExportSerializationFormat", false]], "keys() (model_compression_toolkit.defaultdict method)": [[2, "model_compression_toolkit.DefaultDict.keys", false]], "lut_values_bitwidth (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.attributequantizationconfig attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig.lut_values_bitwidth", false]], "manual_activation_bit_width_selection_list (model_compression_toolkit.core.bitwidthconfig attribute)": [[0, "model_compression_toolkit.core.BitWidthConfig.manual_activation_bit_width_selection_list", false]], "manual_weights_bit_width_selection_list (model_compression_toolkit.core.bitwidthconfig attribute)": [[0, "model_compression_toolkit.core.BitWidthConfig.manual_weights_bit_width_selection_list", false]], "manualbitwidthselection (class in model_compression_toolkit.core.common.quantization.bit_width_config)": [[0, "model_compression_toolkit.core.common.quantization.bit_width_config.ManualBitWidthSelection", false]], "mctwrapper (class in model_compression_toolkit.wrapper.mct_wrapper)": [[11, "model_compression_toolkit.wrapper.mct_wrapper.MCTWrapper", false]], "mixedprecisionquantizationconfig (class in model_compression_toolkit.core)": [[5, "model_compression_toolkit.core.MixedPrecisionQuantizationConfig", false]], "mpdistanceweighting (class in model_compression_toolkit.core)": [[5, "model_compression_toolkit.core.MpDistanceWeighting", false]], "mpmetricnormalization (class in model_compression_toolkit.core)": [[5, "model_compression_toolkit.core.MpMetricNormalization", false]], "name (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.fusing attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.Fusing.name", false]], "name (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.operatorsetgroup attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorSetGroup.name", false]], "name (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.operatorsset attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorsSet.name", false]], "name (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.name", false]], "nodenamefilter (class in model_compression_toolkit.core.network_editor)": [[42, "model_compression_toolkit.core.network_editor.NodeNameFilter", false]], "nodenamescopefilter (class in model_compression_toolkit.core.network_editor)": [[42, "model_compression_toolkit.core.network_editor.NodeNameScopeFilter", false]], "nodetypefilter (class in model_compression_toolkit.core.network_editor)": [[42, "model_compression_toolkit.core.network_editor.NodeTypeFilter", false]], "noteq (class in model_compression_toolkit.target_platform_capabilities)": [[41, "model_compression_toolkit.target_platform_capabilities.NotEq", false]], "num_score_approximations (model_compression_toolkit.pruning.pruningconfig attribute)": [[6, "model_compression_toolkit.pruning.PruningConfig.num_score_approximations", false]], "operator_groups (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.fusing attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.Fusing.operator_groups", false]], "operator_set (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.operator_set", false]], "operators_set (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.operatorsetgroup attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorSetGroup.operators_set", false]], "operatorsetgroup (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorSetGroup", false]], "operatorsset (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorsSet", false]], "opquantizationconfig (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OpQuantizationConfig", false]], "outputlosstype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.OutputLossType", false]], "pruning_masks (model_compression_toolkit.pruning.pruninginfo property)": [[7, "model_compression_toolkit.pruning.PruningInfo.pruning_masks", false]], "pruningconfig (class in model_compression_toolkit.pruning)": [[6, "model_compression_toolkit.pruning.PruningConfig", false]], "pruninginfo (class in model_compression_toolkit.pruning)": [[7, "model_compression_toolkit.pruning.PruningInfo", false]], "pytorch_data_generation_experimental() (in module model_compression_toolkit.data_generation)": [[27, "model_compression_toolkit.data_generation.pytorch_data_generation_experimental", false]], "pytorch_export_model (class in model_compression_toolkit.exporter)": [[40, "model_compression_toolkit.exporter.pytorch_export_model", false]], "pytorch_gradient_post_training_quantization() (in module model_compression_toolkit.gptq)": [[28, "model_compression_toolkit.gptq.pytorch_gradient_post_training_quantization", false]], "pytorch_post_training_quantization() (in module model_compression_toolkit.ptq)": [[30, "model_compression_toolkit.ptq.pytorch_post_training_quantization", false]], "pytorch_pruning_experimental() (in module model_compression_toolkit.pruning)": [[31, "model_compression_toolkit.pruning.pytorch_pruning_experimental", false]], "pytorch_quantization_aware_training_finalize_experimental() (in module model_compression_toolkit.qat)": [[32, "model_compression_toolkit.qat.pytorch_quantization_aware_training_finalize_experimental", false]], "pytorch_quantization_aware_training_init_experimental() (in module model_compression_toolkit.qat)": [[33, "model_compression_toolkit.qat.pytorch_quantization_aware_training_init_experimental", false]], "pytorch_resource_utilization_data() (in module model_compression_toolkit.core)": [[29, "model_compression_toolkit.core.pytorch_resource_utilization_data", false]], "pytorchexportserializationformat (class in model_compression_toolkit.exporter)": [[40, "model_compression_toolkit.exporter.PytorchExportSerializationFormat", false]], "qatconfig (class in model_compression_toolkit.qat)": [[43, "model_compression_toolkit.qat.QATConfig", false]], "qc_options (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.operatorsset attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorsSet.qc_options", false]], "qfractionlinearannealingconfig (class in model_compression_toolkit.gptq)": [[4, "model_compression_toolkit.gptq.QFractionLinearAnnealingConfig", false]], "quantization_configurations (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.quantizationconfigoptions attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.QuantizationConfigOptions.quantization_configurations", false]], "quantizationconfig (class in model_compression_toolkit.core)": [[8, "model_compression_toolkit.core.QuantizationConfig", false]], "quantizationconfigoptions (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.QuantizationConfigOptions", false]], "quantizationerrormethod (class in model_compression_toolkit.core)": [[9, "model_compression_toolkit.core.QuantizationErrorMethod", false]], "quantizationformat (class in model_compression_toolkit.exporter)": [[40, "model_compression_toolkit.exporter.QuantizationFormat", false]], "quantizationmethod (class in model_compression_toolkit.target_platform_capabilities)": [[44, "model_compression_toolkit.target_platform_capabilities.QuantizationMethod", false]], "quantize_and_export() (model_compression_toolkit.wrapper.mct_wrapper.mctwrapper method)": [[11, "model_compression_toolkit.wrapper.mct_wrapper.MCTWrapper.quantize_and_export", false]], "resourceutilization (class in model_compression_toolkit.core)": [[10, "model_compression_toolkit.core.ResourceUtilization", false]], "roundingtype (class in model_compression_toolkit.gptq)": [[4, "model_compression_toolkit.gptq.RoundingType", false]], "schedulertype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.SchedulerType", false]], "schema_version (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.SCHEMA_VERSION", false]], "set_log_folder() (in module model_compression_toolkit)": [[34, "model_compression_toolkit.set_log_folder", false]], "smaller (class in model_compression_toolkit.target_platform_capabilities)": [[41, "model_compression_toolkit.target_platform_capabilities.Smaller", false]], "smallereq (class in model_compression_toolkit.target_platform_capabilities)": [[41, "model_compression_toolkit.target_platform_capabilities.SmallerEq", false]], "targetplatformcapabilities (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities", false]], "tpc_minor_version (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.tpc_minor_version", false]], "tpc_patch_version (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.tpc_patch_version", false]], "tpc_platform_type (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.tpc_platform_type", false]], "trainablequantizeractivationconfig (class in model_compression_toolkit.trainable_infrastructure)": [[45, "model_compression_toolkit.trainable_infrastructure.TrainableQuantizerActivationConfig", false]], "trainablequantizerweightsconfig (class in model_compression_toolkit.trainable_infrastructure)": [[45, "model_compression_toolkit.trainable_infrastructure.TrainableQuantizerWeightsConfig", false]], "trainingmethod (class in model_compression_toolkit.trainable_infrastructure)": [[45, "model_compression_toolkit.trainable_infrastructure.TrainingMethod", false]], "type (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.operatorsset attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorsSet.type", false]], "weights_n_bits (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.attributequantizationconfig attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig.weights_n_bits", false]], "weights_per_channel_threshold (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.attributequantizationconfig attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig.weights_per_channel_threshold", false]], "weights_quantization_method (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.attributequantizationconfig attribute)": [[44, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig.weights_quantization_method", false]], "xquant_report_keras_experimental() (in module model_compression_toolkit.xquant.keras.facade_xquant_report)": [[35, "model_compression_toolkit.xquant.keras.facade_xquant_report.xquant_report_keras_experimental", false]], "xquant_report_pytorch_experimental() (in module model_compression_toolkit.xquant.pytorch.facade_xquant_report)": [[36, "model_compression_toolkit.xquant.pytorch.facade_xquant_report.xquant_report_pytorch_experimental", false]], "xquant_report_troubleshoot_pytorch_experimental() (in module model_compression_toolkit.xquant.pytorch.facade_xquant_report)": [[37, "model_compression_toolkit.xquant.pytorch.facade_xquant_report.xquant_report_troubleshoot_pytorch_experimental", false]], "xquantconfig (class in model_compression_toolkit.xquant.common.xquant_config)": [[12, "model_compression_toolkit.xquant.common.xquant_config.XQuantConfig", false]]}, "objects": {"model_compression_toolkit": [[2, 0, 1, "", "DefaultDict"], [18, 3, 1, "", "get_target_platform_capabilities"], [22, 3, 1, "", "keras_load_quantized_model"], [34, 3, 1, "", "set_log_folder"]], "model_compression_toolkit.DefaultDict": [[2, 1, 1, "", "get"], [2, 1, 1, "", "keys"]], "model_compression_toolkit.core": [[0, 0, 1, "", "BitWidthConfig"], [3, 0, 1, "", "ChannelAxis"], [38, 0, 1, "", "CoreConfig"], [39, 0, 1, "", "DebugConfig"], [3, 0, 1, "", "FrameworkInfo"], [5, 0, 1, "", "MixedPrecisionQuantizationConfig"], [5, 0, 1, "", "MpDistanceWeighting"], [5, 0, 1, "", "MpMetricNormalization"], [8, 0, 1, "", "QuantizationConfig"], [9, 0, 1, "", "QuantizationErrorMethod"], [10, 0, 1, "", "ResourceUtilization"], [21, 3, 1, "", "keras_resource_utilization_data"], [29, 3, 1, "", "pytorch_resource_utilization_data"]], "model_compression_toolkit.core.BitWidthConfig": [[0, 2, 1, "", "manual_activation_bit_width_selection_list"], [0, 2, 1, "", "manual_weights_bit_width_selection_list"]], "model_compression_toolkit.core.common.quantization.bit_width_config": [[0, 0, 1, "", "ManualBitWidthSelection"]], "model_compression_toolkit.core.common.quantization.bit_width_config.ManualBitWidthSelection": [[0, 2, 1, "", "bit_width"], [0, 2, 1, "", "filter"]], "model_compression_toolkit.core.network_editor": [[42, 0, 1, "", "ChangeCandidatesActivationQuantConfigAttr"], [42, 0, 1, "", "ChangeCandidatesActivationQuantizationMethod"], [42, 0, 1, "", "ChangeCandidatesWeightsQuantConfigAttr"], [42, 0, 1, "", "ChangeCandidatesWeightsQuantizationMethod"], [42, 0, 1, "", "ChangeFinalActivationQuantConfigAttr"], [42, 0, 1, "", "ChangeFinalWeightsQuantConfigAttr"], [42, 0, 1, "", "ChangeFinalWeightsQuantizationMethod"], [42, 0, 1, "", "ChangeQuantizationParamFunction"], [42, 0, 1, "", "EditRule"], [42, 0, 1, "", "NodeNameFilter"], [42, 0, 1, "", "NodeNameScopeFilter"], [42, 0, 1, "", "NodeTypeFilter"]], "model_compression_toolkit.data_generation": [[1, 0, 1, "", "BNLayerWeightingType"], [1, 0, 1, "", "BatchNormAlignemntLossType"], [1, 0, 1, "", "DataGenerationConfig"], [1, 0, 1, "", "DataInitType"], [1, 0, 1, "", "ImageGranularity"], [1, 0, 1, "", "ImageNormalizationType"], [1, 0, 1, "", "ImagePipelineType"], [1, 0, 1, "", "OutputLossType"], [1, 0, 1, "", "SchedulerType"], [14, 3, 1, "", "get_keras_data_generation_config"], [16, 3, 1, "", "get_pytorch_data_generation_config"], [19, 3, 1, "", "keras_data_generation_experimental"], [27, 3, 1, "", "pytorch_data_generation_experimental"]], "model_compression_toolkit.exporter": [[40, 0, 1, "", "KerasExportSerializationFormat"], [40, 0, 1, "", "PytorchExportSerializationFormat"], [40, 0, 1, "", "QuantizationFormat"], [40, 0, 1, "", "keras_export_model"], [40, 0, 1, "", "pytorch_export_model"]], "model_compression_toolkit.gptq": [[4, 0, 1, "", "GPTQHessianScoresConfig"], [4, 0, 1, "", "GradientPTQConfig"], [4, 0, 1, "", "GradualActivationQuantizationConfig"], [4, 0, 1, "", "QFractionLinearAnnealingConfig"], [4, 0, 1, "", "RoundingType"], [15, 3, 1, "", "get_keras_gptq_config"], [17, 3, 1, "", "get_pytorch_gptq_config"], [20, 3, 1, "", "keras_gradient_post_training_quantization"], [28, 3, 1, "", "pytorch_gradient_post_training_quantization"]], "model_compression_toolkit.pruning": [[6, 0, 1, "", "ChannelsFilteringStrategy"], [6, 0, 1, "", "ImportanceMetric"], [6, 0, 1, "", "PruningConfig"], [7, 0, 1, "", "PruningInfo"], [24, 3, 1, "", "keras_pruning_experimental"], [31, 3, 1, "", "pytorch_pruning_experimental"]], "model_compression_toolkit.pruning.PruningConfig": [[6, 2, 1, "", "channels_filtering_strategy"], [6, 2, 1, "", "importance_metric"], [6, 2, 1, "", "num_score_approximations"]], "model_compression_toolkit.pruning.PruningInfo": [[7, 4, 1, "", "importance_scores"], [7, 4, 1, "", "pruning_masks"]], "model_compression_toolkit.ptq": [[23, 3, 1, "", "keras_post_training_quantization"], [30, 3, 1, "", "pytorch_post_training_quantization"]], "model_compression_toolkit.qat": [[43, 0, 1, "", "QATConfig"], [25, 3, 1, "", "keras_quantization_aware_training_finalize_experimental"], [26, 3, 1, "", "keras_quantization_aware_training_init_experimental"], [32, 3, 1, "", "pytorch_quantization_aware_training_finalize_experimental"], [33, 3, 1, "", "pytorch_quantization_aware_training_init_experimental"]], "model_compression_toolkit.target_platform_capabilities": [[41, 0, 1, "", "AttributeFilter"], [41, 0, 1, "", "Eq"], [41, 0, 1, "", "Greater"], [41, 0, 1, "", "GreaterEq"], [41, 0, 1, "", "NotEq"], [44, 0, 1, "", "QuantizationMethod"], [41, 0, 1, "", "Smaller"], [41, 0, 1, "", "SmallerEq"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema": [[44, 0, 1, "", "AttributeQuantizationConfig"], [44, 0, 1, "", "Fusing"], [44, 0, 1, "", "OpQuantizationConfig"], [44, 0, 1, "", "OperatorSetGroup"], [44, 0, 1, "", "OperatorsSet"], [44, 0, 1, "", "QuantizationConfigOptions"], [44, 0, 1, "", "TargetPlatformCapabilities"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig": [[44, 2, 1, "", "enable_weights_quantization"], [44, 2, 1, "", "lut_values_bitwidth"], [44, 2, 1, "", "weights_n_bits"], [44, 2, 1, "", "weights_per_channel_threshold"], [44, 2, 1, "", "weights_quantization_method"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.Fusing": [[44, 2, 1, "", "fuse_op_quantization_config"], [44, 2, 1, "", "name"], [44, 2, 1, "", "operator_groups"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorSetGroup": [[44, 2, 1, "", "name"], [44, 2, 1, "", "operators_set"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorsSet": [[44, 2, 1, "", "name"], [44, 2, 1, "", "qc_options"], [44, 2, 1, "", "type"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.QuantizationConfigOptions": [[44, 2, 1, "", "base_config"], [44, 2, 1, "", "quantization_configurations"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities": [[44, 2, 1, "", "SCHEMA_VERSION"], [44, 2, 1, "", "add_metadata"], [44, 2, 1, "", "default_qco"], [44, 2, 1, "", "fusing_patterns"], [44, 2, 1, "", "insert_preserving_quantizers"], [44, 2, 1, "", "is_simd_padding"], [44, 2, 1, "", "name"], [44, 2, 1, "", "operator_set"], [44, 2, 1, "", "tpc_minor_version"], [44, 2, 1, "", "tpc_patch_version"], [44, 2, 1, "", "tpc_platform_type"]], "model_compression_toolkit.trainable_infrastructure": [[45, 0, 1, "", "BaseKerasTrainableQuantizer"], [45, 0, 1, "", "BasePytorchTrainableQuantizer"], [45, 0, 1, "", "TrainableQuantizerActivationConfig"], [45, 0, 1, "", "TrainableQuantizerWeightsConfig"], [45, 0, 1, "", "TrainingMethod"]], "model_compression_toolkit.wrapper.mct_wrapper": [[11, 0, 1, "", "MCTWrapper"]], "model_compression_toolkit.wrapper.mct_wrapper.MCTWrapper": [[11, 1, 1, "", "quantize_and_export"]], "model_compression_toolkit.xquant.common.xquant_config": [[12, 0, 1, "", "XQuantConfig"]], "model_compression_toolkit.xquant.keras.facade_xquant_report": [[35, 3, 1, "", "xquant_report_keras_experimental"]], "model_compression_toolkit.xquant.pytorch.facade_xquant_report": [[36, 3, 1, "", "xquant_report_pytorch_experimental"], [37, 3, 1, "", "xquant_report_troubleshoot_pytorch_experimental"]]}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "method", "Python method"], "2": ["py", "attribute", "Python attribute"], "3": ["py", "function", "Python function"], "4": ["py", "property", "Python property"]}, "objtypes": {"0": "py:class", "1": "py:method", "2": "py:attribute", "3": "py:function", "4": "py:property"}, "terms": {"": [3, 6, 8, 10, 20, 23, 24, 25, 26, 28, 30, 31, 33, 34, 40, 41, 42, 44, 45, 47, 49], "0": [1, 3, 4, 5, 7, 8, 11, 12, 14, 15, 16, 20, 23, 24, 25, 26, 31, 40, 45, 47], "05": 8, "06": 5, "08153": 45, "1": [1, 3, 4, 5, 7, 8, 12, 17, 19, 20, 21, 23, 24, 25, 27, 28, 29, 30, 31, 32, 40, 47, 49], "10": [19, 20, 23, 26, 27, 28, 30, 33], "10000000000": 5, "15": [40, 47], "16": [12, 40, 47], "1902": 45, "1e": 5, "1st": 15, "2": [3, 8, 12, 15, 19, 27, 44, 45, 47, 49], "20": 48, "2021": 49, "2023": 49, "224": [20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 40], "228137651975462": 47, "2nd": 15, "3": [3, 15, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 40, 45, 47], "32": [4, 5], "3rd": 15, "4": [15, 19, 20, 23, 24, 26, 27, 28, 30, 31, 33], "4th": 15, "5": [11, 12, 15, 17, 24, 31, 47], "50": [24, 31], "52587890625e": 8, "6": [27, 47], "75": [20, 23, 25, 26], "758747418625537": 47, "8": [19, 20, 23, 25, 26, 27, 40, 44, 45], "9": [42, 47], "A": [0, 3, 4, 5, 7, 8, 13, 15, 17, 18, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 39, 42, 43, 44, 47, 49], "As": [5, 47, 48], "By": [4, 5, 24, 28, 30, 31, 40, 47, 48], "For": [3, 8, 12, 18, 19, 20, 23, 25, 26, 27, 33, 40, 44, 45, 46, 47, 48, 49], "If": [2, 3, 4, 5, 12, 15, 17, 20, 23, 25, 26, 28, 30, 38, 40, 41, 44, 47], "In": [5, 19, 20, 23, 26, 27, 28, 30, 33, 40, 41, 43, 47], "It": [2, 11, 12, 44, 45, 47], "No": 1, "Not": 47, "One": 48, "The": [0, 1, 3, 4, 5, 6, 7, 10, 11, 12, 14, 15, 16, 17, 19, 20, 23, 24, 25, 26, 27, 28, 30, 31, 33, 35, 36, 37, 40, 42, 44, 45, 47, 48], "Then": [3, 20, 23, 26, 28, 30, 33, 42, 48], "There": [40, 47, 48], "These": [47, 48], "To": [40, 47, 48], "With": 47, "_": [20, 23, 26, 28, 30, 33, 40, 47], "_input_data": 40, "_model_input_nam": 40, "_model_output_nam": 40, "_with_model_output_loss_object": 47, "about": [3, 4, 7, 13, 15, 17, 20, 23, 25, 26, 40, 44, 45], "abov": [12, 47], "absolut": 9, "abstract": [13, 45], "accept": [15, 44], "access": 7, "accord": [13, 20, 21, 23, 24, 26, 28, 29, 30, 31, 33, 40, 41], "accordingli": 44, "accuraci": [12, 47], "achiev": 24, "act": 7, "act_hessian_default_batch_s": [15, 17], "action": 39, "activ": [0, 3, 4, 5, 8, 10, 11, 20, 21, 23, 26, 28, 29, 30, 33, 40, 42, 43, 44, 45, 48], "activation_bias_correct": 8, "activation_bias_correction_threshold": 8, "activation_channel_equ": 8, "activation_error_method": [8, 11], "activation_memori": 10, "activation_min_max_map": 3, "activation_n_bit": [44, 45], "activation_op": 3, "activation_quantization_candid": 45, "activation_quantization_method": [42, 44, 45], "activation_quantization_param": 45, "activation_quantization_params_fn": 42, "activation_quantizer_map": 3, "activation_quantizer_params_overrid": 43, "activation_training_method": 43, "ad": 44, "adam": [14, 17], "add": [1, 3, 12, 14, 16, 22, 45, 47], "add_metadata": 44, "addit": [22, 40, 47], "addition": 47, "address": 44, "advanc": 3, "affect": [20, 23, 25, 26], "after": [13, 20, 22, 23, 26, 33, 47, 49], "aim": [24, 31], "algorithm": 5, "align": [1, 14, 16], "all": [1, 3, 4, 5, 8, 42, 45, 48], "allimag": [1, 16], "allow": [6, 12, 19, 27, 40, 44, 47], "along": [47, 48], "also": [24, 31, 47], "an": [1, 2, 3, 4, 7, 11, 13, 20, 23, 26, 33, 35, 36, 37, 40, 41, 42, 44, 45, 47, 49], "analysi": [24, 31], "analyz": [24, 31, 37], "analyze_similar": 39, "ani": [1, 2, 3, 5, 11, 35, 36, 37, 40, 41, 45], "anneal": 4, "api": [3, 4, 18, 23, 26, 33, 43], "appear": 47, "appli": [0, 1, 5, 8, 13, 40, 41, 42, 44, 47], "applic": [20, 21, 23, 24, 25, 26, 40], "approach": 6, "appropri": 47, "approxim": [6, 24, 31], "ar": [3, 5, 12, 18, 20, 23, 24, 26, 28, 30, 31, 33, 40, 44, 45, 46, 47, 48], "architectur": [24, 31], "argument": [4, 40, 44, 47], "arrai": [7, 11], "art": 49, "arxiv": [45, 49], "assess": [24, 31], "associ": [24, 31], "assum": [24, 31], "astyp": 40, "attach": 47, "attent": [4, 15, 17, 45], "attirbut": 3, "attr": 41, "attr_nam": 42, "attr_valu": 42, "attr_weights_configs_map": 44, "attribut": [42, 44, 45], "attributefilt": 41, "auto": 13, "auxiliri": [15, 17], "avail": 40, "averag": [1, 5, 14, 15, 16, 17, 47], "avg": 5, "awar": [13, 43, 45, 49], "axi": [3, 45, 47], "backend": 44, "base": [1, 4, 5, 8, 9, 11, 13, 15, 17, 19, 24, 27, 30, 31, 45, 47, 49], "base_config": 44, "basenod": 7, "basenodematch": 0, "basic": 45, "batch": [1, 4, 5, 14, 15, 16, 17, 19, 20, 23, 26, 27, 28, 30, 33], "batchnorm": [1, 14, 16, 19, 20, 23, 26, 28, 30, 33], "batchnorm2d": 27, "batchnormalignemntlosstyp": [14, 16], "batchwis": [1, 14], "been": [7, 47], "befor": 47, "begin": 4, "behavior": 39, "being": [20, 23, 26, 28, 30, 33, 44, 45], "below": [12, 47], "between": [4, 5, 12, 20, 28, 30, 44, 47, 48], "bia": [4, 11, 15, 17, 20, 23, 25, 26], "bidwidth": 5, "bin": 47, "bit": [0, 5, 10, 13, 20, 23, 25, 26, 33, 38, 40, 42, 44, 45, 47, 49], "bit_width": 0, "bit_width_config": [0, 38], "bitwidth": [5, 12, 20, 23, 25, 26, 47], "bitwidthconfig": [13, 38], "black": 47, "block": [45, 48], "bn_alignment_loss_typ": [1, 14, 16], "bn_layer_typ": [1, 14, 16], "bnlayerweightingtyp": [14, 16], "bool": [1, 4, 5, 11, 12, 14, 15, 16, 17, 39, 44, 45, 47], "boolean": 22, "bop": 10, "both": [11, 20, 23, 28, 30, 32, 45, 47, 48], "build": [21, 29, 45, 49], "built": [26, 33, 45], "bypass": 39, "byte": [10, 20, 23, 24, 26, 31, 33, 48], "c": [12, 47], "calcul": [5, 6, 13, 20, 21, 23, 24, 26, 28, 29, 30, 31, 33, 47], "calibr": [11, 20, 21, 23, 26, 28, 29, 30, 33], "call": [21, 29, 34, 44, 47, 48], "callabl": [3, 5, 11, 12, 15, 17, 20, 21, 23, 24, 26, 28, 29, 30, 31, 33, 35, 36, 37, 40, 41, 47], "can": [3, 4, 8, 11, 13, 15, 17, 19, 21, 24, 27, 29, 31, 39, 40, 42, 44, 45, 47, 48, 49], "candid": [5, 20, 23, 25, 26, 42], "cannot": 44, "capabl": [11, 18, 24, 29, 31], "case": [5, 47], "caus": [12, 13, 37, 47], "chang": [19, 27, 40, 42, 48], "changecandidatesactivationquantconfigattr": 42, "changecandidatesactivationquantizationmethod": 42, "changecandidatesweightsquantconfigattr": 42, "changecandidatesweightsquantizationmethod": 42, "changefinalactivationquantconfigattr": 42, "changefinalweightsquantconfigattr": 42, "changefinalweightsquantizationmethod": 42, "changequantizationmethod": 42, "changequantizationparamfunct": 42, "channel": [3, 6, 7, 13, 24, 31, 44, 45, 48], "channels_filtering_strategi": 6, "check": [5, 40, 41, 42], "choos": [1, 4, 40], "chosen": 48, "circl": 47, "class": [0, 1, 5, 6, 7, 8, 9, 10, 11, 12, 13, 22, 38, 39, 40, 41, 42, 43, 44, 45, 47], "clibrat": 30, "click": 48, "clip": [1, 14, 16], "clone": 49, "code": 47, "coeffici": [3, 20, 23, 25, 26, 28, 30, 44, 45], "cohen": 49, "collaps": 11, "collect": [3, 20, 23, 26, 28, 30, 33, 35, 36, 37, 48], "com": 49, "combin": 44, "common": [0, 12], "compar": [5, 20, 28, 30, 47, 48], "comparison": 49, "compat": 40, "compil": 22, "complet": [4, 11], "compli": 18, "compon": [44, 45, 47], "compress": [11, 13, 19, 24, 27, 28, 31, 47], "comput": [3, 4, 5, 9, 12, 13, 15, 17, 21, 29, 35, 39, 48], "compute_distance_fn": 5, "concat_threshold_upd": 8, "concaten": [12, 44, 47], "concatn": 12, "config": [4, 19, 20, 23, 24, 25, 26, 27, 28, 31, 32, 33, 38, 42, 45], "configur": [0, 4, 5, 8, 10, 11, 13, 14, 15, 16, 17, 19, 20, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 47, 49], "configuration_overwrit": 5, "confirm": 47, "connect": [11, 47], "consid": [6, 14, 16, 24, 31, 44, 47], "consol": 47, "constant": [6, 42, 45], "constraint": [20, 23, 24, 28, 30, 31], "consult": 47, "contain": [7, 13, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 45, 47], "conv": 47, "conv2d": [3, 19, 20, 23, 25, 26, 27, 42, 44], "conveni": 34, "convent": 47, "convert": [25, 32], "core": [0, 3, 5, 8, 9, 10, 11, 20, 21, 23, 24, 25, 26, 28, 29, 31, 32, 33, 38, 39, 42, 47], "core_config": [20, 21, 23, 25, 26, 28, 29, 30, 32, 33, 47], "coreconfig": [13, 20, 21, 23, 25, 26, 28, 29, 30, 32, 33, 47], "correct": 11, "correspond": [7, 47], "cosin": 49, "count_param": [20, 23, 24, 25, 26], "countermeasur": 47, "cpuexecutionprovid": 40, "creat": [3, 4, 8, 11, 13, 14, 15, 16, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 40, 41, 42, 44, 47], "creation": 40, "crop": 1, "cudaexecutionprovid": 40, "current": [4, 40], "custom": [5, 12, 19, 22, 26, 27, 40, 47], "custom_metric_fn": 5, "custom_object": [22, 25, 26], "custom_similarity_metr": [12, 47], "custom_tpc_opset_to_lay": 8, "cut": 39, "dash": 47, "data": [13, 14, 16, 21, 24, 29, 31, 35, 36, 37, 40, 44, 47, 48, 49], "data_gen_batch_s": [1, 14, 16, 19, 27], "data_gener": [1, 14, 16, 19, 27], "data_generation_config": [19, 27], "data_init_typ": [1, 14, 16], "dataclass": [38, 39], "datagenerationconfig": [1, 13, 19, 27], "datainittyp": [14, 16], "dataset": [4, 11, 15, 17, 20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 35, 36, 37, 40, 47, 48], "debug": [38, 39], "debug_config": 38, "debugconfig": 38, "deeper": 48, "def": [20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 40], "default": [1, 2, 4, 5, 6, 11, 14, 15, 16, 17, 18, 20, 23, 24, 28, 30, 31, 38, 40, 43, 44, 47, 48], "default_data_gen_b": [14, 16], "default_factori": 2, "default_keras_extra_pixel": 14, "default_keras_initial_lr": 14, "default_keras_output_loss_multipli": 14, "default_keras_tpc": [20, 23, 24, 26], "default_n_it": [14, 16], "default_onnx_opset_vers": 40, "default_pyotrch_tpc": 31, "default_pytorch_bn_layer_typ": 16, "default_pytorch_extra_pixel": 16, "default_pytorch_initial_lr": 16, "default_pytorch_last_layer_typ": 16, "default_pytorch_output_loss_multipli": 16, "default_pytorch_tpc": [28, 30, 31, 33], "default_qco": 44, "default_valu": 2, "default_weight_attr_config": 44, "defaultdict": [3, 13], "defin": [0, 4, 5, 15, 17, 19, 20, 23, 24, 25, 26, 27, 28, 30, 31, 44, 45], "degener": 18, "degrad": [12, 13, 37, 47], "degrat": 47, "demonstr": [40, 44], "dens": [3, 19], "dense_nparam": [24, 31], "depend": [1, 20, 23, 26, 28, 30, 33], "describ": 47, "descript": 11, "desir": [13, 20, 21, 23, 25, 26, 28, 29, 30, 33], "detail": [40, 44, 47], "detect": [12, 13, 37, 47], "determin": [6, 24, 31, 44], "develop": 49, "deviat": 47, "diagram": 44, "diamant": 49, "dict": [3, 7, 12, 35, 36, 37, 40, 44, 45, 47], "dictionari": [2, 3, 4, 12, 25, 26, 35, 36, 37, 40, 42, 43, 45], "differ": [1, 8, 13, 20, 23, 25, 26, 40, 44, 47, 48], "dikstein": 49, "dir": [12, 47, 48], "directori": [12, 13, 34, 47], "disabl": [15, 17, 47], "displai": [47, 48], "distanc": 5, "distance_weighting_method": 5, "distil": [4, 49], "distribut": 9, "diverg": [9, 48], "divers": 1, "divid": [3, 47], "divis": 48, "dnn": 45, "do": [1, 48], "document": [13, 23, 26, 33, 47], "doe": 47, "doesn": 49, "don": 34, "done": 48, "dot": 48, "dqa": 45, "dror": 49, "dtype": 40, "due": 47, "dummi": 17, "durat": [24, 31], "dure": [4, 13, 14, 15, 16, 17, 18, 35, 36, 37, 40, 42, 44, 45, 46, 48], "e": [3, 5, 11, 20, 23, 26, 28, 30, 33, 49], "each": [5, 6, 7, 12, 20, 23, 24, 26, 28, 30, 31, 33, 42, 44, 45, 47, 48], "easi": 47, "easili": [13, 49], "edit": [38, 39, 42], "editrul": 39, "either": 44, "element": [7, 44], "empti": 2, "emul": 45, "enabl": [1, 5, 8, 11, 13, 15, 17, 39, 45, 49], "enable_activation_quant": [44, 45], "enable_weights_quant": [44, 45], "encapsul": [0, 8], "end": 47, "end_step": 4, "engin": 49, "enhanc": 49, "ensur": 5, "entir": 13, "enum": [1, 3, 4, 6, 9, 45], "epoch": [4, 11, 15, 17], "epsilon": 5, "eptq": 49, "eq": 41, "equal": [41, 47], "er_list": 42, "error": [9, 11, 12], "estim": [4, 45], "etc": [3, 10, 13, 20, 23, 26, 28, 30, 33, 48], "euclidean": 48, "evalu": [5, 35, 36, 37], "even": 47, "exact": 17, "exampl": [3, 8, 11, 15, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 42, 44, 45, 49], "exce": 47, "exceed": 47, "execut": 47, "exist": [2, 18, 42, 47], "exp": 5, "exp_distance_weighting_sigma": 5, "expect": [4, 48], "experiment": [13, 19, 27, 49], "explain": [12, 13, 35, 36, 37, 45, 47], "explicitli": 44, "expon": 5, "exponenti": 5, "export": 11, "extend": [24, 31], "extens": [40, 49], "extra": [1, 14, 16], "extra_pixel": [1, 14, 16], "extrem": 47, "facade_xquant_report": [35, 36, 37], "factor": [4, 5, 9, 15, 17, 47], "factori": [0, 4, 38, 39], "fake": 40, "fake_qu": [26, 33], "fakely_qu": 40, "fallback": 44, "fals": [4, 5, 8, 11, 12, 14, 15, 17, 39, 45, 47], "familiar": 47, "featur": 47, "fetch": 44, "few": [48, 49], "field": [18, 41, 44, 46], "figur": [39, 48], "file": [22, 25, 26, 34, 40], "filepath": 22, "filter": [0, 1, 6], "final": [4, 5, 12, 13, 19, 27, 42, 47, 48, 49], "find": [20, 23, 26, 33], "fine": [15, 17, 24, 25, 26, 31, 32, 33, 47], "first": [1, 20, 23, 26, 28, 30, 33, 40, 47, 48], "first_layer_multipli": 1, "fix": 44, "fixed_scal": [18, 44, 46], "fixed_zero_point": [18, 44, 46], "flag": [1, 11, 39, 44], "flatten": [19, 27], "flip": 1, "float": [1, 4, 5, 11, 12, 14, 15, 16, 17, 20, 26, 28, 30, 33, 35, 36, 37, 40, 44, 45, 47, 48], "float32": [24, 31, 40], "float_model": [11, 35, 36, 37, 40, 47], "fold": [20, 23, 26, 28, 30, 33], "folder": [34, 47], "follow": [3, 4, 11, 12, 45, 47, 48], "footprint": [24, 31], "form": 44, "format": [3, 13], "found": 47, "fraction": 4, "framework": [3, 11, 18, 45], "frameworkquantizationcap": [21, 28, 29, 30], "free": [6, 19, 24, 27, 31, 49], "freez": 45, "freeze_quant_param": 45, "friendli": [24, 31, 49], "from": [3, 4, 11, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 40, 42, 44, 45, 46, 47, 48, 49], "from_config": 45, "function": [3, 4, 5, 11, 12, 13, 14, 15, 16, 17, 18, 19, 22, 24, 27, 31, 34, 42, 44, 45, 47], "further": 47, "fuse_op_quantization_config": 44, "fusing_pattern": 44, "futur": [18, 19, 27, 44, 46], "fw_name": 18, "g": [3, 11, 20, 23, 26, 28, 30, 33], "gather": [44, 48], "gaussian": [1, 14, 16], "gelu": 47, "gener": [2, 12, 13, 14, 16, 20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 35, 36, 37, 44, 47, 48, 49], "generated_imag": [19, 27], "get": [2, 3, 4, 5, 13, 20, 23, 25, 26, 28, 30, 32, 33, 44, 48], "get_config": 45, "get_input": 40, "get_keras_data_generation_config": [13, 14, 19], "get_keras_gptq_config": [13, 15, 20], "get_ort_session_opt": 40, "get_output": 40, "get_pytorch_data_generation_config": [13, 16, 27], "get_pytorch_gptq_config": [13, 17], "get_target_platform_cap": [13, 18, 44], "git": 49, "github": [40, 49], "given": [2, 20, 21, 23, 26, 28, 29, 30, 33], "gordon": 49, "gptq": [4, 11, 15, 17, 20, 28], "gptq_conf": [15, 17, 28], "gptq_config": [20, 28, 30], "gptq_quantizer_params_overrid": 4, "gptq_representative_data_gen": [20, 28], "grad": 1, "gradient": [1, 4, 11, 13, 30, 49], "gradientptq": [4, 13], "gradientptqconfig": [13, 20, 28], "gradual": 4, "gradual_activation_quant": [15, 17], "gradual_activation_quantization_config": 4, "gradualactivationquant": [15, 17], "gradualactivationquantizationconfig": [15, 17], "granular": [1, 14, 16], "graph": [21, 29, 42, 48], "greater": 41, "greatereq": 41, "greedi": [5, 6], "group": [3, 6, 24, 31, 44], "h": 49, "ha": [7, 40, 41, 42, 47], "habi": 49, "handl": [11, 20, 23, 26, 28, 30, 33], "handler": 34, "hardwar": [13, 24, 31, 44, 45, 49], "have": [3, 40, 41, 47, 48], "henc": 44, "here": [12, 24, 31, 40, 44, 47, 49], "hessian": [4, 5, 6, 9, 11, 15, 17, 24, 31, 49], "hessian_batch_s": [4, 5, 15, 17], "hessian_weights_config": 4, "hessians_num_sampl": 4, "higher": [24, 31], "highlight": 47, "hight": 27, "histogram": [20, 23, 26, 28, 30, 33, 47, 48], "hmse": 9, "hold": [3, 38, 41, 44], "holder": 45, "how": [3, 6, 20, 21, 23, 26, 28, 30, 33, 40, 45, 49], "howev": 40, "hptq": [44, 49], "http": [45, 49], "hw": 21, "i": [1, 2, 3, 4, 5, 6, 7, 9, 12, 13, 15, 17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 30, 31, 33, 34, 38, 39, 40, 41, 42, 44, 45, 47, 48, 49], "ident": [1, 5], "identifi": [24, 31, 44, 47], "ignor": [18, 44, 46], "ilp": [20, 23, 26, 33], "imag": [1, 4, 5, 11, 14, 16, 19, 20, 23, 26, 27, 28, 30, 33, 47, 48], "image_clip": [1, 14, 16], "image_granular": [1, 14, 16], "image_normalization_typ": [1, 14, 16], "image_pipeline_typ": [1, 14, 16], "imagegranular": [14, 16], "imagenet": 1, "imagenet1k_v1": 31, "imagenormalizationtyp": [14, 16], "imagepipelinetyp": [14, 16], "imagewis": 1, "impact": [24, 31], "implement": [12, 45], "implment": 45, "import": [3, 6, 7, 8, 11, 13, 15, 17, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 40, 42, 45, 47, 48], "importance_metr": 6, "importance_scor": 7, "improv": [5, 24, 31, 47], "imx500": [40, 44], "in_model": [20, 21, 23, 25, 26, 29, 32, 33], "in_modul": [30, 47], "includ": [4, 7, 11, 20, 23, 26, 28, 30, 33, 44, 45], "increas": [4, 5], "index": [3, 13], "indic": [3, 7, 24, 31, 44, 47], "individu": 47, "induc": 9, "inf": [8, 10, 11], "infer": [13, 18, 25, 32, 44, 45], "inferablequant": [25, 32], "inferencesess": 40, "info": [6, 34], "inform": [3, 4, 13, 15, 17, 18, 20, 23, 24, 26, 28, 30, 31, 33, 39, 44, 45, 46], "infrastructur": 45, "init": [13, 42, 49], "initi": [1, 2, 4, 6, 11, 12, 14, 16, 26, 33, 45, 47], "initial_lr": [1, 14, 16], "initial_q_fract": 4, "inner": 2, "input": [1, 5, 11, 14, 16, 20, 23, 26, 28, 30, 33, 39, 44, 47], "input_sc": 8, "input_shap": 19, "insert": 48, "insert_preserving_quant": 44, "instal": 40, "instanc": [4, 11, 13, 15, 17, 42, 44, 48], "instanti": [4, 8, 43], "instead": 47, "instruct": [44, 47], "insuffici": [12, 47], "int": [0, 1, 4, 5, 6, 12, 14, 15, 16, 17, 19, 27, 40, 44, 45, 47], "int8": 40, "integ": [5, 40, 44], "interest": 5, "interfac": [4, 11, 17], "internal_tpc": 11, "introduc": 45, "inverse_min_max_diff": 1, "involv": [19, 24, 27, 31], "is_detect_under_threshold_quantize_error": [12, 47], "is_keras_layer_export": 40, "is_layer_exportable_fn": 40, "is_pytorch_layer_export": 40, "is_simd_pad": 44, "issu": [5, 40, 47], "item": 47, "iter": [1, 14, 16, 19, 20, 23, 26, 27, 28, 30, 33], "its": [2, 3, 13, 22, 24, 31, 41, 44, 48], "jen": 49, "judg": [12, 13, 37, 47], "just": 49, "keep": [32, 49], "kei": [2, 11, 12, 24, 31, 41], "kept": [7, 26, 33], "ker": 26, "kera": [3, 11, 13, 42, 45, 49], "keras_appl": [1, 14], "keras_data_generation_experiment": [13, 19], "keras_default_tpc": 21, "keras_file_path": 40, "keras_gradient_post_training_quant": [13, 15, 20], "keras_load_quantized_model": 22, "keras_post_training_quant": [13, 23, 40, 42, 48], "keras_pruning_experiment": [13, 24], "keras_quantization_aware_training_finalize_experiment": [13, 25], "keras_quantization_aware_training_init_experiment": [13, 25, 26], "keras_resource_utilization_data": [13, 21], "kernel": [3, 20, 23, 25, 26, 42, 45], "kernel_channels_map": 3, "kernel_op": 3, "kernel_ops_attributes_map": 3, "keyword": 44, "kl": [9, 48], "know": [3, 13], "knowledg": [4, 49], "known_dict": 2, "kwarg": 42, "l": [24, 49], "l2": 1, "l2_squar": [1, 14, 16], "l_p_valu": 8, "label": [6, 24, 31, 44, 49], "lambda": 40, "larg": [12, 47], "larger": 5, "last": [3, 4, 5, 47], "last_lay": 5, "last_layer_typ": [1, 16], "latenc": 40, "latest": 49, "launch": 48, "layaer": [13, 37], "layer": [1, 3, 5, 7, 11, 12, 14, 15, 16, 17, 19, 20, 23, 24, 25, 26, 28, 30, 31, 32, 33, 39, 40, 42, 44, 45, 47, 48], "layer_min_max_map": 3, "layer_weighting_typ": [1, 14, 16], "layerfilterparam": 41, "learn": [1, 14, 15, 16, 45], "learnabl": 45, "least": 6, "less": 47, "let": 40, "level": 34, "lfh": [6, 24, 31], "librari": [3, 8], "like": [8, 44], "limit": [6, 20, 23, 25, 26, 28, 30, 33], "line": 47, "linear": [4, 11, 27], "linear_collaps": [8, 11, 47], "linearli": 4, "link": 47, "list": [0, 1, 3, 5, 11, 14, 15, 16, 19, 27, 39, 40, 42, 47, 49], "liter": 44, "ll": [19, 27], "load": [13, 25, 26, 40, 45], "load_model": [25, 26], "loadopt": 22, "log": [4, 12, 13, 15, 17, 34, 47, 48], "log_funct": [4, 15, 17], "log_norm": 4, "log_tensorboard_xqu": 47, "logdir": 48, "logger": [13, 39, 48], "longer": 40, "look": [23, 26, 33, 44, 49], "lookup": 44, "loss": [1, 4, 12, 14, 15, 16, 17, 20, 24, 28, 30, 31], "lower": 47, "lp": 9, "lsq": 45, "lut_pot_quant": 44, "lut_sym_quant": 44, "lut_values_bitwidth": 44, "mae": [9, 48], "mai": [19, 20, 23, 26, 27, 28, 30, 33, 41, 48], "main": [11, 44, 47, 48], "major": 47, "make": 9, "manag": [0, 11], "mandatori": 40, "mani": 48, "manipul": [0, 1], "manner": 44, "manual": [0, 13, 38, 47], "manual_activation_bit_width_selection_list": 0, "manual_weights_bit_width_selection_list": 0, "manualweightsbitwidthselect": 0, "map": [3, 44], "mask": 7, "match": [41, 42], "mathemat": 48, "max": [1, 3, 5, 8, 9, 20, 21, 23, 26, 28, 29, 30, 33, 48], "maxbit": 5, "maxim": [20, 23, 26, 33], "maximum": 47, "mct": [3, 8, 11, 13, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 38, 39, 40, 42, 44, 45, 46, 47, 48, 49], "mct_current_schema": 44, "mct_quantiz": 40, "mct_wrapper": 11, "mctwrapper": 11, "mean": [1, 4, 9, 48], "measur": [6, 10, 12, 47, 48], "meet": [24, 31], "memori": [10, 24, 31, 48], "messag": 47, "metadata": [7, 44], "method": [4, 5, 6, 9, 11, 13, 24, 31, 34, 40, 42, 43, 44, 45, 47], "metric": [4, 5, 6, 12, 35, 36, 37, 47], "metric_epsilon": 5, "metric_norm": 5, "metric_normalization_threshold": 5, "min": [1, 3, 5, 8, 9, 20, 23, 26, 28, 30, 33, 48], "min_threshold": [8, 45], "minbit": 5, "minim": [5, 9, 20, 24, 28, 30, 31], "minimum": 45, "minor": 44, "minut": 49, "mix": [5, 10, 11, 12, 13, 20, 21, 23, 25, 26, 28, 29, 30, 33, 38, 44, 49], "mixed_precis": 11, "mixed_precision_config": [20, 21, 23, 25, 26, 38], "mixedprecisionquantizationconfig": [13, 20, 21, 23, 25, 26, 38], "mkstemp": 40, "mobilenet": [20, 21], "mobilenet_v2": [23, 25, 26, 28, 29, 30, 32, 33, 40], "mobilenetv2": [23, 25, 26, 40, 48], "model": [3, 4, 5, 7, 8, 10, 11, 12, 13, 18, 19, 20, 23, 24, 27, 28, 30, 31, 35, 36, 37, 38, 39, 42, 43, 44, 45, 48], "model_compression_toolkit": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47, 48], "model_fil": [25, 26], "model_format_onnx_mctq": 40, "model_mp": 5, "model_output": 40, "modifi": [13, 42], "modul": [13, 27, 28, 29, 30, 31, 36, 37], "more": [9, 18, 23, 24, 26, 31, 33, 40, 44, 46, 47, 48], "most": 47, "move": 47, "mse": [8, 9, 11, 12, 47, 48], "multipl": [3, 5, 34, 44], "multiple_tensors_mse_loss": 4, "multipli": [1, 12, 14, 16, 47], "must": [24, 31, 44], "n_epoch": [4, 11, 15, 17, 20], "n_imag": [19, 27], "n_iter": [1, 14, 16, 19, 27], "nadam": 15, "name": [12, 18, 42, 44, 47, 48], "nchw": 3, "ndarrai": 7, "necessari": [4, 40, 45, 47], "need": [3, 11, 13, 20, 23, 26, 28, 30, 33, 40, 41, 45], "neg": [1, 5], "negative_min_max_diff": [1, 16], "network": [3, 6, 11, 32, 38, 39, 42, 48, 49], "network_editor": [13, 39], "netzer": 49, "neural": [6, 11, 49], "neuron": 7, "new": [42, 44], "next": [19, 27, 40, 41, 47], "nhwc": 3, "nn": [27, 36, 37], "no_norm": 1, "no_quantization_op": 3, "noclip": [8, 9], "node": [0, 26, 33, 40, 42, 45, 48], "node_nam": 42, "node_name_scop": 42, "node_typ": 42, "nodenamefilt": 42, "nodenamescopefilt": 42, "nodetypefilt": 42, "nois": 9, "non": [5, 15, 17, 44], "none": [1, 2, 4, 5, 8, 11, 12, 15, 17, 18, 20, 22, 23, 26, 28, 30, 33, 38, 40, 42, 43, 44, 45, 47], "norm": [9, 48], "norm_scor": [4, 5], "normal": [1, 4, 5, 14, 16], "note": [20, 23, 25, 26], "notebook": 49, "noteq": 41, "notic": [19, 24, 27, 31, 40], "now": [6, 18, 33, 40, 44, 45, 46, 48], "np": [7, 11, 20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 40], "num_calibration_batch": [20, 23, 26, 28, 30, 33], "num_interest_points_factor": 5, "num_of_imag": [5, 11, 20, 23], "num_score_approxim": [6, 24, 31], "number": [1, 4, 5, 6, 11, 12, 14, 15, 16, 17, 19, 20, 23, 24, 26, 27, 28, 30, 31, 33, 44, 45, 47], "numel": 31, "numer": 5, "numpi": [20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 40], "o": 49, "object": [0, 3, 4, 5, 6, 10, 12, 14, 15, 16, 17, 18, 20, 21, 22, 23, 25, 26, 28, 29, 30, 33, 40, 42, 44, 45], "observ": [20, 28, 30, 44, 48], "one": [5, 41, 48], "onli": [3, 4, 5, 6, 12, 18, 20, 23, 25, 26, 40, 44], "onlin": [26, 33], "onnx": 11, "onnx_file_path": 40, "onnx_opset_vers": 40, "onnxruntim": 40, "op": [41, 44], "open": [40, 48, 49], "oper": [3, 10, 39, 41, 44, 47], "operator_group": 44, "operator_set": 44, "operators_set": 44, "operatorsetnam": 44, "opquantizationconfig": [18, 46], "optim": [1, 3, 4, 10, 11, 13, 14, 15, 16, 17, 18, 20, 21, 23, 26, 28, 29, 30, 33, 38, 44, 45, 46, 47, 49], "optimizer_bia": 4, "optimizer_quantization_paramet": 4, "optimizer_rest": [4, 15, 17], "optimizerv2": 15, "option": [11, 13, 20, 22, 23, 24, 26, 28, 30, 31, 33, 40, 44], "order": [15, 17, 20, 23, 26, 33, 39, 40, 41, 43, 47], "org": 45, "orient": [13, 45], "origin": [24, 34, 35, 36, 37, 48], "ort": 40, "other": [1, 11, 15, 17], "otherwis": 44, "our": [20, 23, 25, 26, 33, 49], "out": [3, 6], "out1": 49, "out2": 49, "out3": 49, "out_channel_axis_map": 3, "outlier": 12, "outlier_histgram": 47, "outlin": 47, "output": [1, 3, 12, 14, 16, 19, 20, 23, 26, 27, 28, 30, 32, 33, 44, 48, 49], "output_image_s": [19, 27], "output_loss_multipli": [1, 14, 16], "output_loss_typ": [1, 14, 16], "output_nam": 40, "outputlosstyp": [14, 16], "over": 5, "overrid": [4, 43], "overwrit": 5, "p": 31, "packag": [40, 45, 49], "pad": 44, "page": 13, "pair": 48, "param": [17, 39, 42, 45], "param_item": 11, "paramet": [1, 2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45], "pars": 44, "part": [40, 47], "pass": [2, 3, 5, 15, 17, 20, 23, 24, 25, 26, 28, 30, 31, 32, 33, 42], "patch": 44, "path": [11, 13, 22, 34, 40, 47, 48], "pattern": 44, "pdf": 45, "per": [1, 3, 4, 20, 23, 26, 33, 44, 45, 48], "per_sampl": 4, "percentag": 5, "peretz": 49, "perform": [6, 10, 11, 19, 24, 27, 31], "phase": 48, "pinpoint": 39, "pip": [40, 49], "pipelin": [1, 11, 14, 16], "pixel": [1, 14, 16], "place": 44, "plan": 40, "platform": [11, 13, 18, 20, 23, 24, 25, 26, 29, 31, 44], "pleas": [23, 26, 33, 40, 43, 47, 49], "plot": [39, 48], "png": 47, "point": [4, 5, 15, 17, 20, 28, 30, 35, 36, 37, 44, 48], "posit": 44, "possibl": [9, 20, 23, 26, 33, 44, 47, 48], "post": [4, 11, 13, 24, 26, 31, 33, 49], "power": [20, 23, 26, 28, 30, 33, 44], "power_of_two": 44, "poweroftwo": 45, "pre": 5, "preced": [20, 23, 26, 28, 30, 33], "precis": [5, 10, 11, 12, 13, 20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 33, 38, 44, 49], "predefin": [5, 6], "predict": 40, "prepar": [11, 13, 26, 33], "preprint": 49, "present": [2, 47, 48], "preserv": 44, "pretrain": [32, 33], "prevent": 5, "primari": 47, "prior": 5, "problemat": 39, "procedur": 47, "process": [4, 5, 8, 13, 14, 15, 16, 17, 18, 19, 24, 27, 31, 38, 39, 42, 43, 44, 46, 48], "product": 48, "project": [40, 49], "properti": 7, "propos": [45, 47], "provid": [2, 11, 19, 24, 27, 31, 40, 44, 45, 47, 48], "prune": [10, 49], "pruned_model": [24, 31], "pruning_config": [24, 31], "pruning_info": [24, 31], "pruning_mask": 7, "pruning_num_score_approxim": 6, "pruningconfig": [6, 13, 24, 31], "pruninginfo": [7, 13, 24, 31], "ptq": [11, 23, 30, 40, 47], "purpos": [19, 27, 39], "py": 49, "pydantic_cor": 44, "pypi": 49, "python": [34, 49], "pytorch": [11, 13, 44, 45, 49], "pytorch_data_generation_experiment": [13, 27], "pytorch_default_tpc": 29, "pytorch_gradient_post_training_quant": [13, 17, 28], "pytorch_post_training_quant": [13, 30, 40, 47], "pytorch_pruning_experiment": [13, 31], "pytorch_quantization_aware_training_finalize_experiment": [13, 32], "pytorch_quantization_aware_training_init_experiment": [13, 32, 33], "pytorch_resource_utilization_data": [13, 29], "q": 40, "q_fraction_scheduler_polici": 4, "qat": [25, 26, 32, 33, 43], "qat_config": [13, 26, 33], "qatconfig": [26, 33], "qc": 8, "qc_option": 44, "qmodel": 11, "qnnpack": 44, "quant": 40, "quantifi": [7, 48], "quantiz": [0, 3, 4, 5, 8, 9, 11, 12, 13, 15, 17, 19, 21, 27, 29, 35, 36, 37, 38, 39, 42, 43, 44, 45, 48, 49], "quantization_config": [38, 45], "quantization_configur": 44, "quantization_format": 40, "quantization_info": [20, 23, 25, 26, 28, 30, 32, 33], "quantization_preserv": [18, 44, 46], "quantizationconfig": [13, 38, 47], "quantizationerrormethod": [8, 11, 13], "quantizationmethod": [3, 45], "quantize_and_export": 11, "quantize_reported_dir": [12, 47], "quantized_exportable_model": 40, "quantized_info": 47, "quantized_model": [11, 20, 23, 25, 26, 32, 33, 35, 36, 37, 47], "quantized_modul": [28, 30], "quantizewrapp": [13, 26, 32, 33], "question": 40, "r": 49, "radam": 16, "rais": 44, "random": [20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 40], "random_data_gen": 47, "rang": [3, 12, 20, 23, 26, 28, 30, 33, 47], "rate": [1, 14, 15, 16], "ratio": [11, 12, 47], "readi": 32, "readm": 40, "recent": 47, "recommend": 47, "recov": [24, 31], "red": 47, "reduc": [5, 24, 31], "reduce_on_plateau": [1, 14], "reduce_on_plateau_with_reset": 16, "reduceonplateau": 1, "refer": [40, 47], "refine_mp_solut": 5, "regard": 41, "regular": [1, 4, 15, 17], "regularization_factor": [4, 15, 17], "regularized_min_max_diff": [1, 14], "relat": [3, 7, 13, 44], "releas": 49, "relev": [40, 47], "relu": 3, "relu_bound_to_power_of_2": 8, "remov": [12, 24, 31, 32], "replac": [25, 47], "report": [12, 13, 47], "report_dir": [12, 47], "repositori": 40, "repr_datagen": [20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33], "repr_dataset": [35, 36, 37, 40], "repres": [4, 5, 10, 11, 15, 17, 20, 23, 24, 25, 26, 28, 30, 31, 32, 33, 35, 36, 37, 40, 42, 44, 47, 48], "representative_data_gen": [20, 21, 23, 24, 26, 28, 29, 30, 31, 33, 40, 47], "representative_dataset": 11, "request": 2, "requir": [20, 23, 26, 28, 30, 33, 45, 47, 48], "research": 49, "reshap": [3, 19], "residu": 11, "residual_collaps": [8, 11, 47], "resnet50": [24, 31, 40], "resnet50_weight": 31, "resolv": 47, "resourc": [6, 10, 11, 13, 20, 23, 24, 25, 26, 31, 32, 33, 48], "resourceutil": [13, 20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 33], "respectivli": 3, "rest": 4, "retrain": [24, 31], "return": [2, 4, 5, 7, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 39, 40], "round": 4, "rounding_typ": 4, "ru": [20, 23, 25, 26], "ru_data": [21, 29], "rule": [39, 42], "run": [4, 15, 17, 40, 48], "runner": 39, "runnnig": 47, "same": [1, 40, 44], "sampl": [4, 15, 17, 48], "save": [3, 11, 12, 26, 34, 40, 45, 47], "save_model_path": [11, 40], "saved_model": 22, "savedmodel": 22, "scalar": 48, "scale": [4, 5, 44, 47], "scale_log_norm": 4, "schedul": [1, 4, 14, 16, 39], "scheduler_typ": [1, 14, 16], "schedulertyp": [14, 16], "schema": 44, "schema_vers": 44, "score": [4, 5, 6, 7, 9, 11, 15, 17, 24, 31, 47], "search": [5, 10, 13, 20, 23, 26, 28, 30, 33], "second": [47, 48], "section": 47, "see": [4, 17, 49], "seen": 48, "select": [0, 3, 6, 8, 9, 13, 38, 40, 43, 44, 45], "self": 44, "semiconductor": 49, "sensit": [5, 6, 24, 31], "sequenti": [19, 27], "serial": 13, "serialization_format": 40, "sess": 40, "session": 40, "set": [3, 11, 12, 13, 15, 17, 19, 20, 23, 24, 25, 26, 27, 28, 30, 31, 33, 34, 35, 36, 37, 40, 42, 44, 45, 47, 48], "set_log_fold": [34, 47, 48], "setup": [11, 49], "sever": [20, 23, 26, 28, 30, 33, 48], "shift_negative_activation_correct": 8, "shift_negative_params_search": 8, "shift_negative_ratio": 8, "shift_negative_threshold_recalcul": 8, "shortli": 44, "should": [3, 6, 15, 20, 21, 23, 24, 25, 26, 28, 30, 31, 33, 40, 44, 48], "show": [47, 48], "shown": 47, "side": 47, "sigma": 5, "signal": 9, "signed": 44, "signific": 7, "significantli": 47, "simd": [24, 31, 44], "simd_siz": 44, "similar": [9, 12, 35, 36, 37, 39, 49], "similarli": 44, "simpl": [19, 27], "simplic": [19, 27], "simul": 39, "simulate_schedul": 39, "simultan": 44, "singl": 44, "six": 47, "size": [1, 4, 5, 14, 15, 16, 17, 19, 20, 23, 25, 26, 27, 33, 40, 45], "skip": [12, 39, 40, 47], "slowli": 40, "small": 47, "smaller": 41, "smallereq": 41, "smooth": [1, 45], "smoothing_and_augment": [1, 14, 16], "so": 40, "softmax": 3, "softmax_shift": 8, "softquant": 4, "solut": 49, "solver": [20, 23, 26, 33], "some": [18, 19, 27, 40, 44, 46, 47, 48], "soni": 49, "sonysemiconductorsolut": 49, "sourc": 49, "specif": [0, 3, 11, 13, 24, 31, 42, 47, 48], "specifi": [6, 12, 14, 16, 19, 22, 24, 27, 31, 40, 47], "sphinx": 13, "sqnr": [12, 47], "squar": [1, 9], "stabl": 49, "stage": 48, "stages_0_blocks_0_token_mixer_mixer_conv_kxk_0_conv_bn": 47, "stages_0_blocks_0_token_mixer_mixer_conv_scale_conv_bn": 47, "standard": [24, 31, 45], "start": [19, 27, 40, 45, 49], "start_step": 4, "state": [47, 49], "state_dict": 31, "statist": [3, 20, 23, 26, 28, 30, 33, 48], "ste": [4, 43, 45], "stem_0_act": 47, "stem_1_act": 47, "stem_2_act": 47, "stem_2_conv_kxk_0_conv_bn": 47, "step": [1, 4, 45, 47], "store": [7, 45], "str": [3, 11, 12, 20, 21, 23, 24, 26, 28, 29, 30, 31, 33, 35, 36, 37, 40, 41, 44, 47], "straight": [4, 45], "strategi": [6, 24, 31], "string": 42, "structur": [13, 49], "student": 4, "success": 11, "suffer": 40, "suggest": 47, "sum": [10, 21, 24, 29, 31], "support": [4, 11, 40], "supported_input_activation_n_bit": 44, "symmetr": [20, 23, 26, 28, 30, 33, 44, 45], "t": [34, 49], "tab": 48, "tabl": [44, 47], "tag": 48, "take": [5, 23, 26, 33, 49], "target": [4, 11, 13, 18, 20, 21, 23, 24, 25, 26, 29, 31, 32, 33, 44], "target_platform_cap": [20, 21, 23, 24, 26, 28, 29, 30, 31, 33, 41, 45], "target_platform_nam": 18, "target_platform_vers": [11, 18], "target_q_fract": 4, "target_resource_util": [20, 23, 24, 26, 28, 30, 31, 33], "targetplatformcap": [13, 18, 20, 21, 23, 24, 26, 28, 29, 30, 31, 33], "teacher": 4, "tempfil": 40, "tensor": [5, 11, 12, 15, 17, 19, 21, 27, 29, 44, 45, 48, 49], "tensorboard": [39, 47, 49], "tensorflow": [3, 11, 13, 15, 19, 20, 21, 23, 24, 25, 26, 40, 42, 44, 49], "tf": [3, 11, 15, 19, 22, 25, 26], "tflite": [40, 44], "than": [5, 41, 47], "thei": 3, "them": [44, 48], "therefor": 47, "thi": [5, 7, 8, 9, 11, 13, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 30, 31, 33, 34, 40, 44, 45, 47, 49], "three": [3, 47], "threshold": [5, 8, 9, 11, 12, 20, 23, 26, 28, 30, 33, 44, 45, 47], "threshold_bitwidth_mixed_precis": 47, "threshold_bitwidth_mixed_precision_with_model_output_loss_object": [12, 47], "threshold_degrade_layer_ratio": [12, 47], "threshold_degration_layer_ratio": 47, "threshold_quantize_error": [12, 47], "threshold_ratio_unbalanced_concaten": [12, 47], "threshold_ratio_unbalanced_concatn": 47, "threshold_zscore_outlier_remov": [12, 47], "through": [4, 19, 24, 27, 45], "throughout": 4, "thu": [24, 31, 48], "time": [3, 6, 45], "togeth": [24, 31], "tool": [13, 45, 49], "toolkit": [11, 13, 19, 27, 28, 47], "torch": [17, 27, 36, 37, 40, 49], "torchscript": 40, "torchvis": [1, 16, 28, 29, 30, 31, 32, 33, 40], "total": [10, 21, 29, 47], "total_memori": 10, "tpc": [11, 18, 24, 31, 44], "tpc_minor_vers": 44, "tpc_patch_vers": 44, "tpc_platform_typ": 44, "tpc_version": 11, "trace": 40, "train": [4, 11, 13, 43, 45, 49], "train_bia": 4, "trainabl": [22, 25, 45], "trainable_infrastructur": 43, "trainablequant": 25, "transform": [1, 20, 23, 26, 28, 30, 33], "transpos": 3, "treat": 44, "troubleshoot": [13, 47], "true": [1, 5, 8, 11, 12, 15, 16, 17, 22, 32, 33, 45, 47], "try": 5, "tun": 33, "tune": [15, 17, 24, 25, 26, 31, 32], "tupl": [1, 3, 11, 14, 16, 19, 20, 23, 24, 27, 28, 30, 31, 42, 44], "tutori": 47, "two": [5, 12, 20, 23, 26, 28, 30, 33, 40, 44, 47, 48], "type": [0, 1, 2, 4, 5, 6, 7, 11, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 27, 28, 29, 30, 31, 35, 36, 37, 40, 42, 44, 47], "ui": 48, "unbalanc": 12, "unchang": 39, "under": 48, "unifi": 11, "uniform": [44, 45], "union": [1, 14, 16, 19, 20, 21, 23, 24, 26, 27, 28, 29, 30, 31, 33, 44], "uniqu": 44, "unusu": 47, "up": [6, 19, 27, 34, 44, 48], "updat": [4, 11], "upon": 45, "upper": 47, "us": [0, 1, 2, 3, 4, 5, 6, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 48, 49], "use_hessian_based_scor": [5, 11], "use_hessian_based_weight": [15, 17], "use_hessian_sample_attent": [15, 17], "use_internal_tpc": 11, "use_mixed_precis": 11, "user": [11, 13, 20, 23, 25, 26, 28, 30, 32, 33, 47], "userinform": [20, 23, 28, 30], "util": [6, 11, 13, 20, 23, 24, 25, 26, 31, 32, 33, 45], "v": 49, "v1": 11, "valid": [35, 36, 37, 44, 45, 47], "validation_dataset": [35, 36, 37, 47], "validationerror": 44, "valu": [1, 2, 3, 4, 5, 6, 9, 11, 12, 20, 23, 24, 25, 26, 31, 40, 41, 42, 44, 45, 47], "valuabl": 9, "variabl": [15, 17], "variou": [11, 19, 27, 48], "vector": [4, 48], "verbos": 34, "version": [11, 18, 19, 27, 44], "via": [40, 49], "view": 48, "visit": [43, 49], "visual": [47, 49], "wa": [2, 40, 47], "wai": [48, 49], "walk": [19, 27], "want": 3, "warn": 47, "we": [3, 19, 20, 23, 24, 26, 27, 31, 33, 40, 42, 44, 45, 47, 48], "weight": [0, 1, 3, 4, 5, 8, 10, 11, 14, 15, 16, 17, 20, 21, 24, 26, 28, 29, 30, 31, 32, 33, 40, 42, 43, 44, 45, 48], "weight_quantizer_params_overrid": 43, "weight_training_method": 43, "weights_bias_correct": [8, 11], "weights_channels_axi": 45, "weights_compression_ratio": 11, "weights_error_method": 8, "weights_memori": [6, 10, 20, 23, 24, 26, 31, 33], "weights_n_bit": [42, 44, 45], "weights_per_channel_threshold": [44, 45], "weights_quantization_candid": 45, "weights_quantization_method": [42, 44, 45], "weights_quantization_param": 45, "weights_quantization_params_fn": 42, "weights_second_moment_correct": 8, "were": 48, "when": [1, 2, 3, 4, 5, 6, 9, 10, 12, 13, 15, 17, 20, 23, 25, 26, 39, 40, 41, 43, 44, 45, 47, 48], "where": [7, 12, 40, 42, 47, 48], "whether": [4, 5, 7, 11, 14, 15, 16, 17, 22, 39, 40, 44, 45], "which": [4, 6, 39, 40, 41, 42, 44, 45, 47], "while": [8, 20, 23, 25, 26, 33, 44], "who": 47, "width": [0, 5, 12, 13, 20, 23, 26, 27, 33, 38, 44, 47, 49], "within": [39, 44, 49], "without": 13, "work": 49, "would": 48, "wrap": [2, 3, 22, 26, 33, 41, 44, 45], "wrapper": [26, 32, 33, 45], "writer": 48, "x": 47, "xquant": 49, "xquant_config": [12, 35, 36, 37, 47], "xquant_report_keras_experiment": [13, 35], "xquant_report_pytorch_experiment": [13, 36, 47], "xquant_report_troubleshoot_pytorch_experiment": [12, 13, 37, 47], "xquantconfig": [12, 13, 35, 36, 37], "y": 47, "yield": [20, 21, 23, 24, 25, 26, 28, 29, 30, 31, 32, 33, 40], "you": [8, 40, 47, 48, 49], "your": 40, "z": [11, 47], "z_score": [12, 47], "z_threshold": [8, 11, 47], "zero": [5, 44], "zscore": 47}, "titles": ["BitWidthConfig", "Data Generation Configuration", "DefaultDict Class", "FrameworkInfo Class", "GradientPTQConfig Class", "MixedPrecisionQuantizationConfig", "Pruning Configuration", "Pruning Information", "QuantizationConfig", "QuantizationErrorMethod", "ResourceUtilization", "wrapper", "XQuant Configuration", "API Docs", "Get DataGenerationConfig for Keras Models", "Get GradientPTQConfig for Keras Models", "Get DataGenerationConfig for Pytorch Models", "Get GradientPTQConfig for Pytorch Models", "Get FrameworkQuantizationCapabilities", "Keras Data Generation", "Keras Gradient Based Post Training Quantization", "Get Resource Utilization information for Keras Models", "Load Quantized Keras Model", "Keras Post Training Quantization", "Keras Structured Pruning", "Keras Quantization Aware Training Model Finalize", "Keras Quantization Aware Training Model Init", "Pytorch Data Generation", "Pytorch Gradient Based Post Training Quantization", "Get Resource Utilization information for PyTorch Models", "Pytorch Post Training Quantization", "Pytorch Structured Pruning", "PyTorch Quantization Aware Training Model Finalize", "PyTorch Quantization Aware Training Model Init", "Enable a Logger", "XQuant Report Keras", "XQuant Report Pytorch", "XQuant Report Troubleshoot Pytorch", "CoreConfig", "debug_config Module", "exporter Module", "Layer Attributes Filters", "network_editor Module", "qat_config Module", "target_platform_capabilities Module", "trainable_infrastructure Module", "<no title>", "XQuant Extension Tool", "Visualization within TensorBoard", "Model Compression Toolkit User Guide"], "titleterms": {"about": 47, "action": 42, "activ": 47, "api": [13, 49], "attribut": 41, "attributequantizationconfig": 44, "awar": [25, 26, 32, 33], "base": [20, 28], "basekerastrainablequant": 45, "basepytorchtrainablequant": 45, "batchnormalignemntlosstyp": 1, "bit": 48, "bitwidthconfig": 0, "bnlayerweightingtyp": 1, "channelaxi": 3, "channelsfilteringstrategi": 6, "class": [2, 3, 4], "comparison": 48, "compress": 49, "concatn": 47, "configur": [1, 6, 12, 48], "constraint": 49, "core": 13, "coreconfig": 38, "cosin": 48, "data": [1, 19, 27], "data_gener": 13, "datagenerationconfig": [14, 16], "datainittyp": 1, "debug_config": 39, "debugconfig": 39, "defaultdict": 2, "doc": 13, "document": 49, "editrul": 42, "enabl": 34, "error": 47, "exampl": 47, "export": [13, 40], "extens": 47, "featur": 49, "filter": [41, 42], "final": [25, 32], "flow": 47, "format": [40, 47], "frameworkinfo": 3, "frameworkquantizationcap": 18, "fuse": 44, "gener": [1, 19, 27], "get": [14, 15, 16, 17, 18, 21, 29], "gptq": 13, "gptqhessianscoresconfig": 4, "gradient": [20, 28], "gradientptqconfig": [4, 15, 17], "gradualactivationquantizationconfig": 4, "graph": 47, "guid": 49, "how": 47, "imagegranular": 1, "imagenormalizationtyp": 1, "imagepipelinetyp": 1, "importancemetr": 6, "indic": 13, "infer": 40, "inform": [7, 21, 29], "init": [26, 33], "instal": 49, "judgment": 47, "kera": [14, 15, 19, 20, 21, 22, 23, 24, 25, 26, 35, 40], "keras_export_model": 40, "keras_load_quantized_model": 13, "kerasexportserializationformat": 40, "layer": 41, "load": 22, "logger": 34, "loss": 47, "manualbitwidthselect": 0, "mctq": 40, "mix": [47, 48], "mixedprecisionquantizationconfig": 5, "model": [14, 15, 16, 17, 21, 22, 25, 26, 29, 32, 33, 40, 47, 49], "modul": [39, 40, 42, 43, 44, 45], "mpdistanceweight": 5, "mpmetricnorm": 5, "name": 40, "neg": 47, "network_editor": 42, "object": 47, "onnx": 40, "operatorsetgroup": 44, "operatorsset": 44, "opquantizationconfig": 44, "opset": 40, "outlier": 47, "output": [40, 47], "outputlosstyp": 1, "overal": 47, "overview": 49, "paramet": 47, "post": [20, 23, 28, 30], "precis": [47, 48], "process": 47, "prune": [6, 7, 13, 24, 31], "ptq": 13, "pytorch": [16, 17, 27, 28, 29, 30, 31, 32, 33, 36, 37, 40], "pytorch_export_model": 40, "pytorchexportserializationformat": 40, "qat": 13, "qat_config": 43, "qatconfig": 43, "qfractionlinearannealingconfig": 4, "quantiz": [20, 22, 23, 25, 26, 28, 30, 32, 33, 40, 47], "quantizationconfig": 8, "quantizationconfigopt": 44, "quantizationerrormethod": 9, "quantizationformat": 40, "quantizationmethod": 44, "quickstart": 49, "refer": 49, "remov": 47, "report": [35, 36, 37], "resourc": [21, 29], "resourceutil": 10, "result": 47, "roundingtyp": 4, "run": 47, "schedulertyp": 1, "serial": 40, "set_log_fold": 13, "shift": 47, "similar": 48, "structur": [24, 31], "support": 49, "tabl": 13, "target_platform_cap": [13, 44], "targetplatformcap": 44, "technic": 49, "tensorboard": 48, "tool": 47, "toolkit": 49, "train": [20, 23, 25, 26, 28, 30, 32, 33], "trainable_infrastructur": [13, 45], "trainablequantizeractivationconfig": 45, "trainablequantizerweightsconfig": 45, "trainingmethod": [43, 45], "troubleshoot": 37, "tutori": 40, "unbalanc": 47, "understand": 47, "us": 40, "user": 49, "util": [21, 29], "version": 40, "visual": 48, "width": 48, "within": 48, "wrapper": [11, 13], "xquant": [12, 13, 35, 36, 37, 47], "xquantconfig": 47}}) \ No newline at end of file +Search.setIndex({"alltitles": {"API Docs": [[13, null]], "API Documentation": [[50, "api-documentation"]], "About XQuant Extension Tool": [[48, "about-xquant-extension-tool"]], "Actions": [[43, "actions"]], "Attribute Filters": [[42, "attribute-filters"]], "AttributeQuantizationConfig": [[45, "attributequantizationconfig"]], "BNLayerWeightingType": [[1, "bnlayerweightingtype"]], "BaseKerasTrainableQuantizer": [[46, "basekerastrainablequantizer"]], "BasePytorchTrainableQuantizer": [[46, "basepytorchtrainablequantizer"]], "BatchNormAlignemntLossType": [[1, "batchnormalignemntlosstype"]], "BitWidthConfig": [[0, null]], "ChannelAxis": [[3, "channelaxis"]], "ChannelsFilteringStrategy": [[6, "channelsfilteringstrategy"]], "CoreConfig": [[39, null]], "Cosine Similarity Comparison": [[49, "cosine-similarity-comparison"]], "Data Generation Configuration": [[1, null]], "DataInitType": [[1, "datainittype"]], "DebugConfig": [[40, "debugconfig"]], "DefaultDict Class": [[2, null]], "EditRule": [[43, "editrule"]], "Enable a Logger": [[35, null]], "Filters": [[43, "filters"]], "FrameworkInfo Class": [[3, null]], "Fusing": [[45, "fusing"]], "GPTQHessianScoresConfig Class": [[4, "gptqhessianscoresconfig-class"]], "Get DataGenerationConfig for Keras Models": [[14, null]], "Get DataGenerationConfig for Pytorch Models": [[16, null]], "Get GradientPTQConfig for Keras Models": [[15, null]], "Get GradientPTQConfig for Pytorch Models": [[17, null]], "Get Resource Utilization information for Keras Models": [[22, null]], "Get Resource Utilization information for PyTorch Models": [[30, null]], "Get TargetPlatformCapabilities for sdsp converter version": [[19, null]], "Get TargetPlatformCapabilities for tpc version": [[18, null]], "GradientPTQConfig Class": [[4, null]], "GradualActivationQuantizationConfig": [[4, "gradualactivationquantizationconfig"]], "How to Run": [[48, "how-to-run"]], "ImageGranularity": [[1, "imagegranularity"]], "ImageNormalizationType": [[1, "imagenormalizationtype"]], "ImagePipelineType": [[1, "imagepipelinetype"]], "ImportanceMetric": [[6, "importancemetric"]], "Indices and tables": [[13, "indices-and-tables"]], "Install": [[50, "install"]], "Keras Data Generation": [[20, null]], "Keras Gradient Based Post Training Quantization": [[21, null]], "Keras Post Training Quantization": [[24, null]], "Keras Quantization Aware Training Model Finalize": [[26, null]], "Keras Quantization Aware Training Model Init": [[27, null]], "Keras Structured Pruning": [[25, null]], "Keras Tutorial": [[41, "keras-tutorial"]], "KerasExportSerializationFormat": [[41, "kerasexportserializationformat"]], "Layer Attributes Filters": [[42, null]], "Load Quantized Keras Model": [[23, null]], "MCTQ": [[41, "mctq"]], "MCTQ Quantization Format": [[41, "mctq-quantization-format"]], "ManualBitWidthSelection": [[0, "manualbitwidthselection"]], "Mixed Precision with model output loss objective": [[48, "mixed-precision-with-model-output-loss-objective"]], "Mixed-precision Configuration Bit-width": [[49, "mixed-precision-configuration-bit-width"]], "MixedPrecisionQuantizationConfig": [[5, null]], "Model Compression Toolkit User Guide": [[50, null]], "MpDistanceWeighting": [[5, "mpdistanceweighting"]], "MpMetricNormalization": [[5, "mpmetricnormalization"]], "ONNX": [[41, "onnx"]], "ONNX model output names": [[41, "onnx-model-output-names"]], "ONNX opset version": [[41, "onnx-opset-version"]], "OpQuantizationConfig": [[45, "opquantizationconfig"]], "OperatorSetGroup": [[45, "operatorsetgroup"]], "OperatorsSet": [[45, "operatorsset"]], "Outlier Removal": [[48, "outlier-removal"]], "OutputLossType": [[1, "outputlosstype"]], "Overall Process Flow": [[48, "overall-process-flow"]], "Overview": [[50, "overview"]], "Pruning Configuration": [[6, null]], "Pruning Information": [[7, null]], "PyTorch Quantization Aware Training Model Finalize": [[33, null]], "PyTorch Quantization Aware Training Model Init": [[34, null]], "Pytorch Data Generation": [[28, null]], "Pytorch Gradient Based Post Training Quantization": [[29, null]], "Pytorch Post Training Quantization": [[31, null]], "Pytorch Structured Pruning": [[32, null]], "Pytorch Tutorial": [[41, "pytorch-tutorial"]], "PytorchExportSerializationFormat": [[41, "pytorchexportserializationformat"]], "QATConfig": [[44, "qatconfig"]], "QFractionLinearAnnealingConfig": [[4, "qfractionlinearannealingconfig"]], "QuantizationConfig": [[8, null]], "QuantizationConfigOptions": [[45, "quantizationconfigoptions"]], "QuantizationErrorMethod": [[9, null]], "QuantizationFormat": [[41, "quantizationformat"]], "QuantizationMethod": [[45, "quantizationmethod"]], "Quickstart": [[50, "quickstart"]], "References": [[50, "references"]], "ResourceUtilization": [[10, null]], "RoundingType": [[4, "roundingtype"]], "SchedulerType": [[1, "schedulertype"]], "Shift Negative Activation": [[48, "shift-negative-activation"]], "Supported Features": [[50, "supported-features"]], "TargetPlatformCapabilities": [[45, "targetplatformcapabilities"]], "Technical Constraints": [[50, "technical-constraints"]], "TrainableQuantizerActivationConfig": [[46, "trainablequantizeractivationconfig"]], "TrainableQuantizerWeightsConfig": [[46, "trainablequantizerweightsconfig"]], "TrainingMethod": [[44, "trainingmethod"], [46, "trainingmethod"]], "Unbalanced Concatnation": [[48, "unbalanced-concatnation"]], "Understanding the Quantization Error Graph": [[48, "understanding-the-quantization-error-graph"]], "Understanding the judgment result": [[48, "understanding-the-judgment-result"]], "Use exported model for inference": [[41, "use-exported-model-for-inference"]], "Visualization within TensorBoard": [[49, null]], "XQuant Configuration": [[12, null]], "XQuant Extension Tool": [[48, null]], "XQuant Report Keras": [[36, null]], "XQuant Report Pytorch": [[37, null]], "XQuant Report Troubleshoot Pytorch": [[38, null]], "XQuantConfig Format and Examples": [[48, "xquantconfig-format-and-examples"]], "XQuantConfig parameter": [[48, "id1"]], "core": [[13, "core"]], "data_generation": [[13, "data-generation"]], "debug_config Module": [[40, null]], "exporter": [[13, "exporter"]], "exporter Module": [[41, null]], "gptq": [[13, "gptq"]], "keras serialization format": [[41, "keras-serialization-format"]], "keras_export_model": [[41, "keras-export-model"]], "keras_load_quantized_model": [[13, "keras-load-quantized-model"]], "network_editor Module": [[43, null]], "pruning": [[13, "pruning"]], "ptq": [[13, "ptq"]], "pytorch_export_model": [[41, "pytorch-export-model"]], "qat": [[13, "qat"]], "qat_config Module": [[44, null]], "set_log_folder": [[13, "set-log-folder"]], "target_platform_capabilities": [[13, "target-platform-capabilities"]], "target_platform_capabilities Module": [[45, null]], "trainable_infrastructure": [[13, "trainable-infrastructure"]], "trainable_infrastructure Module": [[46, null]], "wrapper": [[11, null], [13, "wrapper"]], "xquant": [[13, "xquant"]]}, "docnames": ["api/api_docs/classes/BitWidthConfig", "api/api_docs/classes/DataGenerationConfig", "api/api_docs/classes/DefaultDict", "api/api_docs/classes/FrameworkInfo", "api/api_docs/classes/GradientPTQConfig", "api/api_docs/classes/MixedPrecisionQuantizationConfig", "api/api_docs/classes/PruningConfig", "api/api_docs/classes/PruningInfo", "api/api_docs/classes/QuantizationConfig", "api/api_docs/classes/QuantizationErrorMethod", "api/api_docs/classes/ResourceUtilization", "api/api_docs/classes/Wrapper", "api/api_docs/classes/XQuantConfig", "api/api_docs/index", "api/api_docs/methods/get_keras_data_generation_config", "api/api_docs/methods/get_keras_gptq_config", "api/api_docs/methods/get_pytorch_data_generation_config", "api/api_docs/methods/get_pytroch_gptq_config", "api/api_docs/methods/get_target_platform_capabilities", "api/api_docs/methods/get_target_platform_capabilities_sdsp", "api/api_docs/methods/keras_data_generation_experimental", "api/api_docs/methods/keras_gradient_post_training_quantization", "api/api_docs/methods/keras_kpi_data", "api/api_docs/methods/keras_load_quantizad_model", "api/api_docs/methods/keras_post_training_quantization", "api/api_docs/methods/keras_pruning_experimental", "api/api_docs/methods/keras_quantization_aware_training_finalize_experimental", "api/api_docs/methods/keras_quantization_aware_training_init_experimental", "api/api_docs/methods/pytorch_data_generation_experimental", "api/api_docs/methods/pytorch_gradient_post_training_quantization", "api/api_docs/methods/pytorch_kpi_data", "api/api_docs/methods/pytorch_post_training_quantization", "api/api_docs/methods/pytorch_pruning_experimental", "api/api_docs/methods/pytorch_quantization_aware_training_finalize_experimental", "api/api_docs/methods/pytorch_quantization_aware_training_init_experimental", "api/api_docs/methods/set_logger_path", "api/api_docs/methods/xquant_report_keras_experimental", "api/api_docs/methods/xquant_report_pytorch_experimental", "api/api_docs/methods/xquant_report_troubleshoot_pytorch_experimental", "api/api_docs/modules/core_config", "api/api_docs/modules/debug_config", "api/api_docs/modules/exporter", "api/api_docs/modules/layer_filters", "api/api_docs/modules/network_editor", "api/api_docs/modules/qat_config", "api/api_docs/modules/target_platform_capabilities", "api/api_docs/modules/trainable_infrastructure", "api/api_docs/notes/tpc_note", "guidelines/XQuant_Extension_Tool", "guidelines/visualization", "index"], "envversion": {"sphinx": 64, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2}, "filenames": ["api/api_docs/classes/BitWidthConfig.rst", "api/api_docs/classes/DataGenerationConfig.rst", "api/api_docs/classes/DefaultDict.rst", "api/api_docs/classes/FrameworkInfo.rst", "api/api_docs/classes/GradientPTQConfig.rst", "api/api_docs/classes/MixedPrecisionQuantizationConfig.rst", "api/api_docs/classes/PruningConfig.rst", "api/api_docs/classes/PruningInfo.rst", "api/api_docs/classes/QuantizationConfig.rst", "api/api_docs/classes/QuantizationErrorMethod.rst", "api/api_docs/classes/ResourceUtilization.rst", "api/api_docs/classes/Wrapper.rst", "api/api_docs/classes/XQuantConfig.rst", "api/api_docs/index.rst", "api/api_docs/methods/get_keras_data_generation_config.rst", "api/api_docs/methods/get_keras_gptq_config.rst", "api/api_docs/methods/get_pytorch_data_generation_config.rst", "api/api_docs/methods/get_pytroch_gptq_config.rst", "api/api_docs/methods/get_target_platform_capabilities.rst", "api/api_docs/methods/get_target_platform_capabilities_sdsp.rst", "api/api_docs/methods/keras_data_generation_experimental.rst", "api/api_docs/methods/keras_gradient_post_training_quantization.rst", "api/api_docs/methods/keras_kpi_data.rst", "api/api_docs/methods/keras_load_quantizad_model.rst", "api/api_docs/methods/keras_post_training_quantization.rst", "api/api_docs/methods/keras_pruning_experimental.rst", "api/api_docs/methods/keras_quantization_aware_training_finalize_experimental.rst", "api/api_docs/methods/keras_quantization_aware_training_init_experimental.rst", "api/api_docs/methods/pytorch_data_generation_experimental.rst", "api/api_docs/methods/pytorch_gradient_post_training_quantization.rst", "api/api_docs/methods/pytorch_kpi_data.rst", "api/api_docs/methods/pytorch_post_training_quantization.rst", "api/api_docs/methods/pytorch_pruning_experimental.rst", "api/api_docs/methods/pytorch_quantization_aware_training_finalize_experimental.rst", "api/api_docs/methods/pytorch_quantization_aware_training_init_experimental.rst", "api/api_docs/methods/set_logger_path.rst", "api/api_docs/methods/xquant_report_keras_experimental.rst", "api/api_docs/methods/xquant_report_pytorch_experimental.rst", "api/api_docs/methods/xquant_report_troubleshoot_pytorch_experimental.rst", "api/api_docs/modules/core_config.rst", "api/api_docs/modules/debug_config.rst", "api/api_docs/modules/exporter.rst", "api/api_docs/modules/layer_filters.rst", "api/api_docs/modules/network_editor.rst", "api/api_docs/modules/qat_config.rst", "api/api_docs/modules/target_platform_capabilities.rst", "api/api_docs/modules/trainable_infrastructure.rst", "api/api_docs/notes/tpc_note.rst", "guidelines/XQuant_Extension_Tool.rst", "guidelines/visualization.rst", "index.rst"], "indexentries": {"add_metadata (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.add_metadata", false]], "attributefilter (class in model_compression_toolkit.target_platform_capabilities)": [[42, "model_compression_toolkit.target_platform_capabilities.AttributeFilter", false]], "attributequantizationconfig (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig", false]], "base_config (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.quantizationconfigoptions attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.QuantizationConfigOptions.base_config", false]], "basekerastrainablequantizer (class in model_compression_toolkit.trainable_infrastructure)": [[46, "model_compression_toolkit.trainable_infrastructure.BaseKerasTrainableQuantizer", false]], "basepytorchtrainablequantizer (class in model_compression_toolkit.trainable_infrastructure)": [[46, "model_compression_toolkit.trainable_infrastructure.BasePytorchTrainableQuantizer", false]], "batchnormalignemntlosstype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.BatchNormAlignemntLossType", false]], "bit_width (model_compression_toolkit.core.common.quantization.bit_width_config.manualbitwidthselection attribute)": [[0, "model_compression_toolkit.core.common.quantization.bit_width_config.ManualBitWidthSelection.bit_width", false]], "bitwidthconfig (class in model_compression_toolkit.core)": [[0, "model_compression_toolkit.core.BitWidthConfig", false]], "bnlayerweightingtype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.BNLayerWeightingType", false]], "changecandidatesactivationquantconfigattr (class in model_compression_toolkit.core.network_editor)": [[43, "model_compression_toolkit.core.network_editor.ChangeCandidatesActivationQuantConfigAttr", false]], "changecandidatesactivationquantizationmethod (class in model_compression_toolkit.core.network_editor)": [[43, "model_compression_toolkit.core.network_editor.ChangeCandidatesActivationQuantizationMethod", false]], "changecandidatesweightsquantconfigattr (class in model_compression_toolkit.core.network_editor)": [[43, "model_compression_toolkit.core.network_editor.ChangeCandidatesWeightsQuantConfigAttr", false]], "changecandidatesweightsquantizationmethod (class in model_compression_toolkit.core.network_editor)": [[43, "model_compression_toolkit.core.network_editor.ChangeCandidatesWeightsQuantizationMethod", false]], "changefinalactivationquantconfigattr (class in model_compression_toolkit.core.network_editor)": [[43, "model_compression_toolkit.core.network_editor.ChangeFinalActivationQuantConfigAttr", false]], "changefinalweightsquantconfigattr (class in model_compression_toolkit.core.network_editor)": [[43, "model_compression_toolkit.core.network_editor.ChangeFinalWeightsQuantConfigAttr", false]], "changefinalweightsquantizationmethod (class in model_compression_toolkit.core.network_editor)": [[43, "model_compression_toolkit.core.network_editor.ChangeFinalWeightsQuantizationMethod", false]], "changequantizationparamfunction (class in model_compression_toolkit.core.network_editor)": [[43, "model_compression_toolkit.core.network_editor.ChangeQuantizationParamFunction", false]], "channelaxis (class in model_compression_toolkit.core)": [[3, "model_compression_toolkit.core.ChannelAxis", false]], "channels_filtering_strategy (model_compression_toolkit.pruning.pruningconfig attribute)": [[6, "model_compression_toolkit.pruning.PruningConfig.channels_filtering_strategy", false]], "channelsfilteringstrategy (class in model_compression_toolkit.pruning)": [[6, "model_compression_toolkit.pruning.ChannelsFilteringStrategy", false]], "coreconfig (class in model_compression_toolkit.core)": [[39, "model_compression_toolkit.core.CoreConfig", false]], "datagenerationconfig (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.DataGenerationConfig", false]], "datainittype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.DataInitType", false]], "debugconfig (class in model_compression_toolkit.core)": [[40, "model_compression_toolkit.core.DebugConfig", false]], "default_qco (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.default_qco", false]], "defaultdict (class in model_compression_toolkit)": [[2, "model_compression_toolkit.DefaultDict", false]], "editrule (class in model_compression_toolkit.core.network_editor)": [[43, "model_compression_toolkit.core.network_editor.EditRule", false]], "enable_weights_quantization (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.attributequantizationconfig attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig.enable_weights_quantization", false]], "eq (class in model_compression_toolkit.target_platform_capabilities)": [[42, "model_compression_toolkit.target_platform_capabilities.Eq", false]], "filter (model_compression_toolkit.core.common.quantization.bit_width_config.manualbitwidthselection attribute)": [[0, "model_compression_toolkit.core.common.quantization.bit_width_config.ManualBitWidthSelection.filter", false]], "frameworkinfo (class in model_compression_toolkit.core)": [[3, "model_compression_toolkit.core.FrameworkInfo", false]], "fuse_op_quantization_config (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.fusing attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.Fusing.fuse_op_quantization_config", false]], "fusing (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.Fusing", false]], "fusing_patterns (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.fusing_patterns", false]], "get() (model_compression_toolkit.defaultdict method)": [[2, "model_compression_toolkit.DefaultDict.get", false]], "get_keras_data_generation_config() (in module model_compression_toolkit.data_generation)": [[14, "model_compression_toolkit.data_generation.get_keras_data_generation_config", false]], "get_keras_gptq_config() (in module model_compression_toolkit.gptq)": [[15, "model_compression_toolkit.gptq.get_keras_gptq_config", false]], "get_pytorch_data_generation_config() (in module model_compression_toolkit.data_generation)": [[16, "model_compression_toolkit.data_generation.get_pytorch_data_generation_config", false]], "get_pytorch_gptq_config() (in module model_compression_toolkit.gptq)": [[17, "model_compression_toolkit.gptq.get_pytorch_gptq_config", false]], "get_target_platform_capabilities() (in module model_compression_toolkit)": [[18, "model_compression_toolkit.get_target_platform_capabilities", false]], "get_target_platform_capabilities_sdsp() (in module model_compression_toolkit)": [[19, "model_compression_toolkit.get_target_platform_capabilities_sdsp", false]], "gptqhessianscoresconfig (class in model_compression_toolkit.gptq)": [[4, "model_compression_toolkit.gptq.GPTQHessianScoresConfig", false]], "gradientptqconfig (class in model_compression_toolkit.gptq)": [[4, "model_compression_toolkit.gptq.GradientPTQConfig", false]], "gradualactivationquantizationconfig (class in model_compression_toolkit.gptq)": [[4, "model_compression_toolkit.gptq.GradualActivationQuantizationConfig", false]], "greater (class in model_compression_toolkit.target_platform_capabilities)": [[42, "model_compression_toolkit.target_platform_capabilities.Greater", false]], "greatereq (class in model_compression_toolkit.target_platform_capabilities)": [[42, "model_compression_toolkit.target_platform_capabilities.GreaterEq", false]], "imagegranularity (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.ImageGranularity", false]], "imagenormalizationtype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.ImageNormalizationType", false]], "imagepipelinetype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.ImagePipelineType", false]], "importance_metric (model_compression_toolkit.pruning.pruningconfig attribute)": [[6, "model_compression_toolkit.pruning.PruningConfig.importance_metric", false]], "importance_scores (model_compression_toolkit.pruning.pruninginfo property)": [[7, "model_compression_toolkit.pruning.PruningInfo.importance_scores", false]], "importancemetric (class in model_compression_toolkit.pruning)": [[6, "model_compression_toolkit.pruning.ImportanceMetric", false]], "insert_preserving_quantizers (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.insert_preserving_quantizers", false]], "is_simd_padding (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.is_simd_padding", false]], "keras_data_generation_experimental() (in module model_compression_toolkit.data_generation)": [[20, "model_compression_toolkit.data_generation.keras_data_generation_experimental", false]], "keras_export_model (class in model_compression_toolkit.exporter)": [[41, "model_compression_toolkit.exporter.keras_export_model", false]], "keras_gradient_post_training_quantization() (in module model_compression_toolkit.gptq)": [[21, "model_compression_toolkit.gptq.keras_gradient_post_training_quantization", false]], "keras_load_quantized_model() (in module model_compression_toolkit)": [[23, "model_compression_toolkit.keras_load_quantized_model", false]], "keras_post_training_quantization() (in module model_compression_toolkit.ptq)": [[24, "model_compression_toolkit.ptq.keras_post_training_quantization", false]], "keras_pruning_experimental() (in module model_compression_toolkit.pruning)": [[25, "model_compression_toolkit.pruning.keras_pruning_experimental", false]], "keras_quantization_aware_training_finalize_experimental() (in module model_compression_toolkit.qat)": [[26, "model_compression_toolkit.qat.keras_quantization_aware_training_finalize_experimental", false]], "keras_quantization_aware_training_init_experimental() (in module model_compression_toolkit.qat)": [[27, "model_compression_toolkit.qat.keras_quantization_aware_training_init_experimental", false]], "keras_resource_utilization_data() (in module model_compression_toolkit.core)": [[22, "model_compression_toolkit.core.keras_resource_utilization_data", false]], "kerasexportserializationformat (class in model_compression_toolkit.exporter)": [[41, "model_compression_toolkit.exporter.KerasExportSerializationFormat", false]], "keys() (model_compression_toolkit.defaultdict method)": [[2, "model_compression_toolkit.DefaultDict.keys", false]], "lut_values_bitwidth (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.attributequantizationconfig attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig.lut_values_bitwidth", false]], "manual_activation_bit_width_selection_list (model_compression_toolkit.core.bitwidthconfig attribute)": [[0, "model_compression_toolkit.core.BitWidthConfig.manual_activation_bit_width_selection_list", false]], "manual_weights_bit_width_selection_list (model_compression_toolkit.core.bitwidthconfig attribute)": [[0, "model_compression_toolkit.core.BitWidthConfig.manual_weights_bit_width_selection_list", false]], "manualbitwidthselection (class in model_compression_toolkit.core.common.quantization.bit_width_config)": [[0, "model_compression_toolkit.core.common.quantization.bit_width_config.ManualBitWidthSelection", false]], "mctwrapper (class in model_compression_toolkit.wrapper.mct_wrapper)": [[11, "model_compression_toolkit.wrapper.mct_wrapper.MCTWrapper", false]], "mixedprecisionquantizationconfig (class in model_compression_toolkit.core)": [[5, "model_compression_toolkit.core.MixedPrecisionQuantizationConfig", false]], "mpdistanceweighting (class in model_compression_toolkit.core)": [[5, "model_compression_toolkit.core.MpDistanceWeighting", false]], "mpmetricnormalization (class in model_compression_toolkit.core)": [[5, "model_compression_toolkit.core.MpMetricNormalization", false]], "name (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.fusing attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.Fusing.name", false]], "name (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.operatorsetgroup attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorSetGroup.name", false]], "name (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.operatorsset attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorsSet.name", false]], "name (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.name", false]], "nodenamefilter (class in model_compression_toolkit.core.network_editor)": [[43, "model_compression_toolkit.core.network_editor.NodeNameFilter", false]], "nodenamescopefilter (class in model_compression_toolkit.core.network_editor)": [[43, "model_compression_toolkit.core.network_editor.NodeNameScopeFilter", false]], "nodetypefilter (class in model_compression_toolkit.core.network_editor)": [[43, "model_compression_toolkit.core.network_editor.NodeTypeFilter", false]], "noteq (class in model_compression_toolkit.target_platform_capabilities)": [[42, "model_compression_toolkit.target_platform_capabilities.NotEq", false]], "num_score_approximations (model_compression_toolkit.pruning.pruningconfig attribute)": [[6, "model_compression_toolkit.pruning.PruningConfig.num_score_approximations", false]], "operator_groups (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.fusing attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.Fusing.operator_groups", false]], "operator_set (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.operator_set", false]], "operators_set (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.operatorsetgroup attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorSetGroup.operators_set", false]], "operatorsetgroup (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorSetGroup", false]], "operatorsset (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorsSet", false]], "opquantizationconfig (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OpQuantizationConfig", false]], "outputlosstype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.OutputLossType", false]], "pruning_masks (model_compression_toolkit.pruning.pruninginfo property)": [[7, "model_compression_toolkit.pruning.PruningInfo.pruning_masks", false]], "pruningconfig (class in model_compression_toolkit.pruning)": [[6, "model_compression_toolkit.pruning.PruningConfig", false]], "pruninginfo (class in model_compression_toolkit.pruning)": [[7, "model_compression_toolkit.pruning.PruningInfo", false]], "pytorch_data_generation_experimental() (in module model_compression_toolkit.data_generation)": [[28, "model_compression_toolkit.data_generation.pytorch_data_generation_experimental", false]], "pytorch_export_model (class in model_compression_toolkit.exporter)": [[41, "model_compression_toolkit.exporter.pytorch_export_model", false]], "pytorch_gradient_post_training_quantization() (in module model_compression_toolkit.gptq)": [[29, "model_compression_toolkit.gptq.pytorch_gradient_post_training_quantization", false]], "pytorch_post_training_quantization() (in module model_compression_toolkit.ptq)": [[31, "model_compression_toolkit.ptq.pytorch_post_training_quantization", false]], "pytorch_pruning_experimental() (in module model_compression_toolkit.pruning)": [[32, "model_compression_toolkit.pruning.pytorch_pruning_experimental", false]], "pytorch_quantization_aware_training_finalize_experimental() (in module model_compression_toolkit.qat)": [[33, "model_compression_toolkit.qat.pytorch_quantization_aware_training_finalize_experimental", false]], "pytorch_quantization_aware_training_init_experimental() (in module model_compression_toolkit.qat)": [[34, "model_compression_toolkit.qat.pytorch_quantization_aware_training_init_experimental", false]], "pytorch_resource_utilization_data() (in module model_compression_toolkit.core)": [[30, "model_compression_toolkit.core.pytorch_resource_utilization_data", false]], "pytorchexportserializationformat (class in model_compression_toolkit.exporter)": [[41, "model_compression_toolkit.exporter.PytorchExportSerializationFormat", false]], "qatconfig (class in model_compression_toolkit.qat)": [[44, "model_compression_toolkit.qat.QATConfig", false]], "qc_options (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.operatorsset attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorsSet.qc_options", false]], "qfractionlinearannealingconfig (class in model_compression_toolkit.gptq)": [[4, "model_compression_toolkit.gptq.QFractionLinearAnnealingConfig", false]], "quantization_configurations (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.quantizationconfigoptions attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.QuantizationConfigOptions.quantization_configurations", false]], "quantizationconfig (class in model_compression_toolkit.core)": [[8, "model_compression_toolkit.core.QuantizationConfig", false]], "quantizationconfigoptions (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.QuantizationConfigOptions", false]], "quantizationerrormethod (class in model_compression_toolkit.core)": [[9, "model_compression_toolkit.core.QuantizationErrorMethod", false]], "quantizationformat (class in model_compression_toolkit.exporter)": [[41, "model_compression_toolkit.exporter.QuantizationFormat", false]], "quantizationmethod (class in model_compression_toolkit.target_platform_capabilities)": [[45, "model_compression_toolkit.target_platform_capabilities.QuantizationMethod", false]], "quantize_and_export() (model_compression_toolkit.wrapper.mct_wrapper.mctwrapper method)": [[11, "model_compression_toolkit.wrapper.mct_wrapper.MCTWrapper.quantize_and_export", false]], "resourceutilization (class in model_compression_toolkit.core)": [[10, "model_compression_toolkit.core.ResourceUtilization", false]], "roundingtype (class in model_compression_toolkit.gptq)": [[4, "model_compression_toolkit.gptq.RoundingType", false]], "schedulertype (class in model_compression_toolkit.data_generation)": [[1, "model_compression_toolkit.data_generation.SchedulerType", false]], "schema_version (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.SCHEMA_VERSION", false]], "set_log_folder() (in module model_compression_toolkit)": [[35, "model_compression_toolkit.set_log_folder", false]], "smaller (class in model_compression_toolkit.target_platform_capabilities)": [[42, "model_compression_toolkit.target_platform_capabilities.Smaller", false]], "smallereq (class in model_compression_toolkit.target_platform_capabilities)": [[42, "model_compression_toolkit.target_platform_capabilities.SmallerEq", false]], "targetplatformcapabilities (class in model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities", false]], "tpc_minor_version (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.tpc_minor_version", false]], "tpc_patch_version (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.tpc_patch_version", false]], "tpc_platform_type (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.targetplatformcapabilities attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities.tpc_platform_type", false]], "trainablequantizeractivationconfig (class in model_compression_toolkit.trainable_infrastructure)": [[46, "model_compression_toolkit.trainable_infrastructure.TrainableQuantizerActivationConfig", false]], "trainablequantizerweightsconfig (class in model_compression_toolkit.trainable_infrastructure)": [[46, "model_compression_toolkit.trainable_infrastructure.TrainableQuantizerWeightsConfig", false]], "trainingmethod (class in model_compression_toolkit.trainable_infrastructure)": [[46, "model_compression_toolkit.trainable_infrastructure.TrainingMethod", false]], "type (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.operatorsset attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorsSet.type", false]], "weights_n_bits (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.attributequantizationconfig attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig.weights_n_bits", false]], "weights_per_channel_threshold (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.attributequantizationconfig attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig.weights_per_channel_threshold", false]], "weights_quantization_method (model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.attributequantizationconfig attribute)": [[45, "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig.weights_quantization_method", false]], "xquant_report_keras_experimental() (in module model_compression_toolkit.xquant.keras.facade_xquant_report)": [[36, "model_compression_toolkit.xquant.keras.facade_xquant_report.xquant_report_keras_experimental", false]], "xquant_report_pytorch_experimental() (in module model_compression_toolkit.xquant.pytorch.facade_xquant_report)": [[37, "model_compression_toolkit.xquant.pytorch.facade_xquant_report.xquant_report_pytorch_experimental", false]], "xquant_report_troubleshoot_pytorch_experimental() (in module model_compression_toolkit.xquant.pytorch.facade_xquant_report)": [[38, "model_compression_toolkit.xquant.pytorch.facade_xquant_report.xquant_report_troubleshoot_pytorch_experimental", false]], "xquantconfig (class in model_compression_toolkit.xquant.common.xquant_config)": [[12, "model_compression_toolkit.xquant.common.xquant_config.XQuantConfig", false]]}, "objects": {"model_compression_toolkit": [[2, 0, 1, "", "DefaultDict"], [18, 3, 1, "", "get_target_platform_capabilities"], [19, 3, 1, "", "get_target_platform_capabilities_sdsp"], [23, 3, 1, "", "keras_load_quantized_model"], [35, 3, 1, "", "set_log_folder"]], "model_compression_toolkit.DefaultDict": [[2, 1, 1, "", "get"], [2, 1, 1, "", "keys"]], "model_compression_toolkit.core": [[0, 0, 1, "", "BitWidthConfig"], [3, 0, 1, "", "ChannelAxis"], [39, 0, 1, "", "CoreConfig"], [40, 0, 1, "", "DebugConfig"], [3, 0, 1, "", "FrameworkInfo"], [5, 0, 1, "", "MixedPrecisionQuantizationConfig"], [5, 0, 1, "", "MpDistanceWeighting"], [5, 0, 1, "", "MpMetricNormalization"], [8, 0, 1, "", "QuantizationConfig"], [9, 0, 1, "", "QuantizationErrorMethod"], [10, 0, 1, "", "ResourceUtilization"], [22, 3, 1, "", "keras_resource_utilization_data"], [30, 3, 1, "", "pytorch_resource_utilization_data"]], "model_compression_toolkit.core.BitWidthConfig": [[0, 2, 1, "", "manual_activation_bit_width_selection_list"], [0, 2, 1, "", "manual_weights_bit_width_selection_list"]], "model_compression_toolkit.core.common.quantization.bit_width_config": [[0, 0, 1, "", "ManualBitWidthSelection"]], "model_compression_toolkit.core.common.quantization.bit_width_config.ManualBitWidthSelection": [[0, 2, 1, "", "bit_width"], [0, 2, 1, "", "filter"]], "model_compression_toolkit.core.network_editor": [[43, 0, 1, "", "ChangeCandidatesActivationQuantConfigAttr"], [43, 0, 1, "", "ChangeCandidatesActivationQuantizationMethod"], [43, 0, 1, "", "ChangeCandidatesWeightsQuantConfigAttr"], [43, 0, 1, "", "ChangeCandidatesWeightsQuantizationMethod"], [43, 0, 1, "", "ChangeFinalActivationQuantConfigAttr"], [43, 0, 1, "", "ChangeFinalWeightsQuantConfigAttr"], [43, 0, 1, "", "ChangeFinalWeightsQuantizationMethod"], [43, 0, 1, "", "ChangeQuantizationParamFunction"], [43, 0, 1, "", "EditRule"], [43, 0, 1, "", "NodeNameFilter"], [43, 0, 1, "", "NodeNameScopeFilter"], [43, 0, 1, "", "NodeTypeFilter"]], "model_compression_toolkit.data_generation": [[1, 0, 1, "", "BNLayerWeightingType"], [1, 0, 1, "", "BatchNormAlignemntLossType"], [1, 0, 1, "", "DataGenerationConfig"], [1, 0, 1, "", "DataInitType"], [1, 0, 1, "", "ImageGranularity"], [1, 0, 1, "", "ImageNormalizationType"], [1, 0, 1, "", "ImagePipelineType"], [1, 0, 1, "", "OutputLossType"], [1, 0, 1, "", "SchedulerType"], [14, 3, 1, "", "get_keras_data_generation_config"], [16, 3, 1, "", "get_pytorch_data_generation_config"], [20, 3, 1, "", "keras_data_generation_experimental"], [28, 3, 1, "", "pytorch_data_generation_experimental"]], "model_compression_toolkit.exporter": [[41, 0, 1, "", "KerasExportSerializationFormat"], [41, 0, 1, "", "PytorchExportSerializationFormat"], [41, 0, 1, "", "QuantizationFormat"], [41, 0, 1, "", "keras_export_model"], [41, 0, 1, "", "pytorch_export_model"]], "model_compression_toolkit.gptq": [[4, 0, 1, "", "GPTQHessianScoresConfig"], [4, 0, 1, "", "GradientPTQConfig"], [4, 0, 1, "", "GradualActivationQuantizationConfig"], [4, 0, 1, "", "QFractionLinearAnnealingConfig"], [4, 0, 1, "", "RoundingType"], [15, 3, 1, "", "get_keras_gptq_config"], [17, 3, 1, "", "get_pytorch_gptq_config"], [21, 3, 1, "", "keras_gradient_post_training_quantization"], [29, 3, 1, "", "pytorch_gradient_post_training_quantization"]], "model_compression_toolkit.pruning": [[6, 0, 1, "", "ChannelsFilteringStrategy"], [6, 0, 1, "", "ImportanceMetric"], [6, 0, 1, "", "PruningConfig"], [7, 0, 1, "", "PruningInfo"], [25, 3, 1, "", "keras_pruning_experimental"], [32, 3, 1, "", "pytorch_pruning_experimental"]], "model_compression_toolkit.pruning.PruningConfig": [[6, 2, 1, "", "channels_filtering_strategy"], [6, 2, 1, "", "importance_metric"], [6, 2, 1, "", "num_score_approximations"]], "model_compression_toolkit.pruning.PruningInfo": [[7, 4, 1, "", "importance_scores"], [7, 4, 1, "", "pruning_masks"]], "model_compression_toolkit.ptq": [[24, 3, 1, "", "keras_post_training_quantization"], [31, 3, 1, "", "pytorch_post_training_quantization"]], "model_compression_toolkit.qat": [[44, 0, 1, "", "QATConfig"], [26, 3, 1, "", "keras_quantization_aware_training_finalize_experimental"], [27, 3, 1, "", "keras_quantization_aware_training_init_experimental"], [33, 3, 1, "", "pytorch_quantization_aware_training_finalize_experimental"], [34, 3, 1, "", "pytorch_quantization_aware_training_init_experimental"]], "model_compression_toolkit.target_platform_capabilities": [[42, 0, 1, "", "AttributeFilter"], [42, 0, 1, "", "Eq"], [42, 0, 1, "", "Greater"], [42, 0, 1, "", "GreaterEq"], [42, 0, 1, "", "NotEq"], [45, 0, 1, "", "QuantizationMethod"], [42, 0, 1, "", "Smaller"], [42, 0, 1, "", "SmallerEq"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema": [[45, 0, 1, "", "AttributeQuantizationConfig"], [45, 0, 1, "", "Fusing"], [45, 0, 1, "", "OpQuantizationConfig"], [45, 0, 1, "", "OperatorSetGroup"], [45, 0, 1, "", "OperatorsSet"], [45, 0, 1, "", "QuantizationConfigOptions"], [45, 0, 1, "", "TargetPlatformCapabilities"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.AttributeQuantizationConfig": [[45, 2, 1, "", "enable_weights_quantization"], [45, 2, 1, "", "lut_values_bitwidth"], [45, 2, 1, "", "weights_n_bits"], [45, 2, 1, "", "weights_per_channel_threshold"], [45, 2, 1, "", "weights_quantization_method"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.Fusing": [[45, 2, 1, "", "fuse_op_quantization_config"], [45, 2, 1, "", "name"], [45, 2, 1, "", "operator_groups"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorSetGroup": [[45, 2, 1, "", "name"], [45, 2, 1, "", "operators_set"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.OperatorsSet": [[45, 2, 1, "", "name"], [45, 2, 1, "", "qc_options"], [45, 2, 1, "", "type"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.QuantizationConfigOptions": [[45, 2, 1, "", "base_config"], [45, 2, 1, "", "quantization_configurations"]], "model_compression_toolkit.target_platform_capabilities.schema.mct_current_schema.TargetPlatformCapabilities": [[45, 2, 1, "", "SCHEMA_VERSION"], [45, 2, 1, "", "add_metadata"], [45, 2, 1, "", "default_qco"], [45, 2, 1, "", "fusing_patterns"], [45, 2, 1, "", "insert_preserving_quantizers"], [45, 2, 1, "", "is_simd_padding"], [45, 2, 1, "", "name"], [45, 2, 1, "", "operator_set"], [45, 2, 1, "", "tpc_minor_version"], [45, 2, 1, "", "tpc_patch_version"], [45, 2, 1, "", "tpc_platform_type"]], "model_compression_toolkit.trainable_infrastructure": [[46, 0, 1, "", "BaseKerasTrainableQuantizer"], [46, 0, 1, "", "BasePytorchTrainableQuantizer"], [46, 0, 1, "", "TrainableQuantizerActivationConfig"], [46, 0, 1, "", "TrainableQuantizerWeightsConfig"], [46, 0, 1, "", "TrainingMethod"]], "model_compression_toolkit.wrapper.mct_wrapper": [[11, 0, 1, "", "MCTWrapper"]], "model_compression_toolkit.wrapper.mct_wrapper.MCTWrapper": [[11, 1, 1, "", "quantize_and_export"]], "model_compression_toolkit.xquant.common.xquant_config": [[12, 0, 1, "", "XQuantConfig"]], "model_compression_toolkit.xquant.keras.facade_xquant_report": [[36, 3, 1, "", "xquant_report_keras_experimental"]], "model_compression_toolkit.xquant.pytorch.facade_xquant_report": [[37, 3, 1, "", "xquant_report_pytorch_experimental"], [38, 3, 1, "", "xquant_report_troubleshoot_pytorch_experimental"]]}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "method", "Python method"], "2": ["py", "attribute", "Python attribute"], "3": ["py", "function", "Python function"], "4": ["py", "property", "Python property"]}, "objtypes": {"0": "py:class", "1": "py:method", "2": "py:attribute", "3": "py:function", "4": "py:property"}, "terms": {"": [3, 6, 8, 10, 21, 24, 25, 26, 27, 29, 31, 32, 34, 35, 41, 42, 43, 45, 46, 48, 50], "0": [1, 3, 4, 5, 7, 8, 11, 12, 14, 15, 16, 21, 24, 25, 26, 27, 32, 41, 46, 48], "05": 8, "06": 5, "08153": 46, "1": [1, 3, 4, 5, 7, 8, 12, 17, 20, 21, 22, 24, 25, 26, 28, 29, 30, 31, 32, 33, 41, 48, 50], "10": [20, 21, 24, 27, 28, 29, 31, 34], "10000000000": 5, "15": [41, 48], "16": [12, 41, 48], "1902": 46, "1e": 5, "1st": 15, "2": [3, 8, 12, 15, 20, 28, 45, 46, 48, 50], "20": 49, "2021": 50, "2023": 50, "224": [21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 41], "228137651975462": 48, "2nd": 15, "3": [3, 15, 17, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 41, 46, 48], "32": [4, 5], "3rd": 15, "4": [15, 20, 21, 24, 25, 27, 28, 29, 31, 32, 34], "4th": 15, "5": [11, 12, 15, 17, 25, 32, 48], "50": [25, 32], "52587890625e": 8, "6": [28, 48], "75": [21, 24, 26, 27], "758747418625537": 48, "8": [20, 21, 24, 26, 27, 28, 41, 45, 46], "9": [43, 48], "A": [0, 3, 4, 5, 7, 8, 13, 15, 17, 21, 22, 23, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 36, 37, 38, 39, 40, 43, 44, 45, 48, 50], "As": [5, 48, 49], "By": [4, 5, 25, 29, 31, 32, 41, 48, 49], "For": [3, 8, 12, 18, 19, 20, 21, 24, 26, 27, 28, 34, 41, 45, 46, 47, 48, 49, 50], "If": [2, 3, 4, 5, 12, 15, 17, 21, 24, 26, 27, 29, 31, 39, 41, 42, 45, 48], "In": [5, 20, 21, 24, 27, 28, 29, 31, 34, 41, 42, 44, 48], "It": [2, 11, 12, 45, 46, 48], "No": 1, "Not": 48, "One": 49, "The": [0, 1, 3, 4, 5, 6, 7, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 24, 25, 26, 27, 28, 29, 31, 32, 34, 36, 37, 38, 41, 43, 45, 46, 48, 49], "Then": [3, 21, 24, 27, 29, 31, 34, 43, 49], "There": [41, 48, 49], "These": [48, 49], "To": [41, 48, 49], "With": 48, "_": [21, 24, 27, 29, 31, 34, 41, 48], "_input_data": 41, "_model_input_nam": 41, "_model_output_nam": 41, "_with_model_output_loss_object": 48, "about": [3, 4, 7, 13, 15, 17, 21, 24, 26, 27, 41, 45, 46], "abov": [12, 48], "absolut": 9, "abstract": [13, 46], "accept": [15, 45], "access": 7, "accord": [13, 21, 22, 24, 25, 27, 29, 30, 31, 32, 34, 41, 42], "accordingli": 45, "accuraci": [12, 48], "achiev": 25, "act": 7, "act_hessian_default_batch_s": [15, 17], "action": 40, "activ": [0, 3, 4, 5, 8, 10, 11, 21, 22, 24, 27, 29, 30, 31, 34, 41, 43, 44, 45, 46, 49], "activation_bias_correct": 8, "activation_bias_correction_threshold": 8, "activation_channel_equ": 8, "activation_error_method": [8, 11], "activation_memori": 10, "activation_min_max_map": 3, "activation_n_bit": [45, 46], "activation_op": 3, "activation_quantization_candid": 46, "activation_quantization_method": [43, 45, 46], "activation_quantization_param": 46, "activation_quantization_params_fn": 43, "activation_quantizer_map": 3, "activation_quantizer_params_overrid": 44, "activation_training_method": 44, "ad": 45, "adam": [14, 17], "add": [1, 3, 12, 14, 16, 23, 46, 48], "add_metadata": 45, "addit": [23, 41, 48], "addition": 48, "address": 45, "advanc": 3, "affect": [21, 24, 26, 27], "after": [13, 21, 23, 24, 27, 34, 48, 50], "aim": [25, 32], "algorithm": 5, "align": [1, 14, 16], "all": [1, 3, 4, 5, 8, 43, 46, 49], "allimag": [1, 16], "allow": [6, 12, 20, 28, 41, 45, 48], "along": [48, 49], "also": [25, 32, 45, 48], "an": [1, 2, 3, 4, 7, 11, 13, 21, 24, 27, 34, 36, 37, 38, 41, 42, 43, 45, 46, 48, 50], "analysi": [25, 32], "analyz": [25, 32, 38], "analyze_similar": 40, "ani": [1, 2, 3, 5, 11, 36, 37, 38, 41, 42, 46], "anneal": 4, "api": [3, 4, 24, 27, 34, 44], "appear": 48, "appli": [0, 1, 5, 8, 13, 41, 42, 43, 45, 48], "applic": [21, 22, 24, 25, 26, 27, 41], "approach": 6, "appropri": 48, "approxim": [6, 25, 32], "ar": [3, 5, 12, 18, 19, 21, 24, 25, 27, 29, 31, 32, 34, 41, 45, 46, 47, 48, 49], "architectur": [25, 32], "argument": [4, 41, 45, 48], "arrai": [7, 11], "art": 50, "arxiv": [46, 50], "assess": [25, 32], "associ": [25, 32], "assum": [25, 32], "astyp": 41, "attach": 48, "attent": [4, 15, 17, 46], "attirbut": 3, "attr": 42, "attr_nam": 43, "attr_valu": 43, "attr_weights_configs_map": 45, "attribut": [43, 45, 46], "attributefilt": 42, "auto": 13, "auxiliri": [15, 17], "avail": 41, "averag": [1, 5, 14, 15, 16, 17, 48], "avg": 5, "awar": [13, 44, 46, 50], "axi": [3, 46, 48], "backend": 45, "base": [1, 4, 5, 8, 9, 11, 13, 15, 17, 18, 19, 20, 25, 28, 31, 32, 46, 48, 50], "base_config": 45, "basenod": 7, "basenodematch": 0, "basic": 46, "batch": [1, 4, 5, 14, 15, 16, 17, 20, 21, 24, 27, 28, 29, 31, 34], "batchnorm": [1, 14, 16, 20, 21, 24, 27, 29, 31, 34], "batchnorm2d": 28, "batchnormalignemntlosstyp": [14, 16], "batchwis": [1, 14], "been": [7, 48], "befor": 48, "begin": 4, "behavior": 40, "being": [21, 24, 27, 29, 31, 34, 45, 46], "below": [12, 48], "between": [4, 5, 12, 21, 29, 31, 45, 48, 49], "bia": [4, 11, 15, 17, 21, 24, 26, 27], "bidwidth": 5, "bin": 48, "bit": [0, 5, 10, 13, 21, 24, 26, 27, 34, 39, 41, 43, 45, 46, 48, 50], "bit_width": 0, "bit_width_config": [0, 39], "bitwidth": [5, 12, 21, 24, 26, 27, 48], "bitwidthconfig": [13, 39], "black": 48, "block": [46, 49], "bn_alignment_loss_typ": [1, 14, 16], "bn_layer_typ": [1, 14, 16], "bnlayerweightingtyp": [14, 16], "bool": [1, 4, 5, 11, 12, 14, 15, 16, 17, 40, 45, 46, 48], "boolean": 23, "bop": 10, "both": [11, 21, 24, 29, 31, 33, 46, 48, 49], "build": [22, 30, 46, 50], "built": [27, 34, 46], "bypass": 40, "byte": [10, 21, 24, 25, 27, 32, 34, 49], "c": [12, 48], "calcul": [5, 6, 13, 21, 22, 24, 25, 27, 29, 30, 31, 32, 34, 48], "calibr": [11, 21, 22, 24, 27, 29, 30, 31, 34], "call": [22, 30, 35, 45, 48, 49], "callabl": [3, 5, 11, 12, 15, 17, 21, 22, 24, 25, 27, 29, 30, 31, 32, 34, 36, 37, 38, 41, 42, 48], "can": [3, 4, 8, 11, 13, 15, 17, 20, 22, 25, 28, 30, 32, 40, 41, 43, 45, 46, 48, 49, 50], "candid": [5, 21, 24, 26, 27, 43], "cannot": 45, "capabl": [11, 18, 19, 25, 30, 32], "case": [5, 48], "caus": [12, 13, 38, 48], "chang": [20, 28, 41, 43, 49], "changecandidatesactivationquantconfigattr": 43, "changecandidatesactivationquantizationmethod": 43, "changecandidatesweightsquantconfigattr": 43, "changecandidatesweightsquantizationmethod": 43, "changefinalactivationquantconfigattr": 43, "changefinalweightsquantconfigattr": 43, "changefinalweightsquantizationmethod": 43, "changequantizationmethod": 43, "changequantizationparamfunct": 43, "channel": [3, 6, 7, 13, 25, 32, 45, 46, 49], "channels_filtering_strategi": 6, "check": [5, 41, 42, 43], "choos": [1, 4, 41], "chosen": 49, "circl": 48, "class": [0, 1, 5, 6, 7, 8, 9, 10, 11, 12, 13, 23, 39, 40, 41, 42, 43, 44, 45, 46, 48], "clibrat": 31, "click": 49, "clip": [1, 14, 16], "clone": 50, "code": 48, "coeffici": [3, 21, 24, 26, 27, 29, 31, 45, 46], "cohen": 50, "collaps": 11, "collect": [3, 21, 24, 27, 29, 31, 34, 36, 37, 38, 49], "com": 50, "combin": 45, "common": [0, 12], "compar": [5, 21, 29, 31, 48, 49], "comparison": 50, "compat": 41, "compil": 23, "complet": [4, 11], "compon": [45, 46, 48], "compress": [11, 13, 20, 25, 28, 29, 32, 48], "comput": [3, 4, 5, 9, 12, 13, 15, 17, 22, 30, 36, 40, 49], "compute_distance_fn": 5, "concat_threshold_upd": 8, "concaten": [12, 45, 48], "concatn": 12, "config": [4, 20, 21, 24, 25, 26, 27, 28, 29, 32, 33, 34, 39, 43, 46], "configur": [0, 4, 5, 8, 10, 11, 13, 14, 15, 16, 17, 20, 21, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 37, 38, 39, 40, 42, 43, 44, 45, 46, 48, 50], "configuration_overwrit": 5, "confirm": 48, "connect": [11, 48], "consid": [6, 14, 16, 25, 32, 45, 48], "consol": 48, "constant": [6, 43, 46], "constraint": [21, 24, 25, 29, 31, 32], "consult": 48, "contain": [7, 13, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 38, 46, 48], "conv": 48, "conv2d": [3, 20, 21, 24, 26, 27, 28, 43, 45], "conveni": 35, "convent": 48, "convert": [13, 26, 33, 45], "core": [0, 3, 5, 8, 9, 10, 11, 21, 22, 24, 25, 26, 27, 29, 30, 32, 33, 34, 39, 40, 43, 48], "core_config": [21, 22, 24, 26, 27, 29, 30, 31, 33, 34, 48], "coreconfig": [13, 21, 22, 24, 26, 27, 29, 30, 31, 33, 34, 48], "correct": 11, "correspond": [7, 48], "cosin": 50, "count_param": [21, 24, 25, 26, 27], "countermeasur": 48, "cpuexecutionprovid": 41, "creat": [3, 4, 8, 11, 13, 14, 15, 16, 17, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 41, 42, 43, 45, 48], "creation": 41, "crop": 1, "cudaexecutionprovid": 41, "current": [4, 41], "custom": [5, 12, 20, 23, 27, 28, 41, 48], "custom_metric_fn": 5, "custom_object": [23, 26, 27], "custom_similarity_metr": [12, 48], "custom_tpc_opset_to_lay": 8, "cut": 40, "dash": 48, "data": [13, 14, 16, 22, 25, 30, 32, 36, 37, 38, 41, 45, 48, 49, 50], "data_gen_batch_s": [1, 14, 16, 20, 28], "data_gener": [1, 14, 16, 20, 28], "data_generation_config": [20, 28], "data_init_typ": [1, 14, 16], "dataclass": [39, 40], "datagenerationconfig": [1, 13, 20, 28], "datainittyp": [14, 16], "dataset": [4, 11, 15, 17, 21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 36, 37, 38, 41, 48, 49], "debug": [39, 40], "debug_config": 39, "debugconfig": 39, "deeper": 49, "def": [21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 41], "default": [1, 2, 4, 5, 6, 11, 14, 15, 16, 17, 21, 24, 25, 29, 31, 32, 39, 41, 44, 45, 48, 49], "default_data_gen_b": [14, 16], "default_factori": 2, "default_keras_extra_pixel": 14, "default_keras_initial_lr": 14, "default_keras_output_loss_multipli": 14, "default_keras_tpc": [21, 24, 25, 27], "default_n_it": [14, 16], "default_onnx_opset_vers": 41, "default_pytorch_bn_layer_typ": 16, "default_pytorch_extra_pixel": 16, "default_pytorch_initial_lr": 16, "default_pytorch_last_layer_typ": 16, "default_pytorch_output_loss_multipli": 16, "default_pytorch_tpc": [29, 31, 32, 34], "default_qco": 45, "default_valu": 2, "default_weight_attr_config": 45, "defaultdict": [3, 13], "defin": [0, 4, 5, 15, 17, 20, 21, 24, 25, 26, 27, 28, 29, 31, 32, 45, 46], "degrad": [12, 13, 38, 48], "degrat": 48, "demonstr": [41, 45], "dens": [3, 20], "dense_nparam": [25, 32], "depend": [1, 21, 24, 27, 29, 31, 34], "describ": 48, "descript": 11, "desir": [13, 21, 22, 24, 26, 27, 29, 30, 31, 34], "detail": [41, 45, 48], "detect": [12, 13, 38, 48], "determin": [6, 25, 32, 45], "develop": 50, "deviat": 48, "devic": [13, 18], "device_typ": 18, "diagram": 45, "diamant": 50, "dict": [3, 7, 12, 36, 37, 38, 41, 45, 46, 48], "dictionari": [2, 3, 4, 12, 26, 27, 36, 37, 38, 41, 43, 44, 46], "differ": [1, 8, 13, 21, 24, 26, 27, 41, 45, 48, 49], "dikstein": 50, "dir": [12, 48, 49], "directori": [12, 13, 35, 48], "disabl": [15, 17, 48], "displai": [48, 49], "distanc": 5, "distance_weighting_method": 5, "distil": [4, 50], "distribut": 9, "diverg": [9, 49], "divers": 1, "divid": [3, 48], "divis": 49, "dnn": 46, "do": [1, 49], "document": [13, 24, 27, 34, 48], "doe": 48, "doesn": 50, "don": 35, "done": 49, "dot": 49, "dqa": 46, "dror": 50, "dtype": 41, "due": 48, "dummi": 17, "durat": [25, 32], "dure": [4, 13, 14, 15, 16, 17, 18, 19, 36, 37, 38, 41, 43, 45, 46, 47, 49], "e": [3, 5, 11, 21, 24, 27, 29, 31, 34, 50], "each": [5, 6, 7, 12, 21, 24, 25, 27, 29, 31, 32, 34, 43, 45, 46, 48, 49], "easi": 48, "easili": [13, 50], "edit": [39, 40, 43], "editrul": 40, "either": 45, "element": [7, 45], "empti": 2, "emul": 46, "enabl": [1, 5, 8, 11, 13, 15, 17, 40, 46, 50], "enable_activation_quant": [45, 46], "enable_weights_quant": [45, 46], "encapsul": [0, 8], "end": 48, "end_step": 4, "engin": 50, "enhanc": 50, "ensur": 5, "entir": 13, "enum": [1, 3, 4, 6, 9, 46], "epoch": [4, 11, 15, 17], "epsilon": 5, "eptq": 50, "eq": 42, "equal": [42, 48], "er_list": 43, "error": [9, 11, 12], "estim": [4, 46], "etc": [3, 10, 13, 21, 24, 27, 29, 31, 34, 49], "euclidean": 49, "evalu": [5, 36, 37, 38], "even": 48, "exact": 17, "exampl": [3, 8, 11, 15, 17, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 43, 45, 46, 50], "exce": 48, "exceed": 48, "execut": 48, "exist": [2, 43, 48], "exp": 5, "exp_distance_weighting_sigma": 5, "expect": [4, 49], "experiment": [13, 20, 28, 50], "explain": [12, 13, 36, 37, 38, 46, 48], "explicitli": 45, "expon": 5, "exponenti": 5, "export": 11, "extend": [25, 32], "extens": [41, 50], "extra": [1, 14, 16], "extra_pixel": [1, 14, 16], "extrem": 48, "facade_xquant_report": [36, 37, 38], "factor": [4, 5, 9, 15, 17, 48], "factori": [0, 4, 39, 40], "fake": 41, "fake_qu": [27, 34], "fakely_qu": 41, "fallback": 45, "fals": [4, 5, 8, 11, 12, 14, 15, 17, 40, 46, 48], "familiar": 48, "featur": 48, "fetch": 45, "few": [49, 50], "field": [18, 19, 42, 45, 47], "figur": [40, 49], "file": [23, 26, 27, 35, 41], "filepath": 23, "filter": [0, 1, 6], "final": [4, 5, 12, 13, 20, 28, 43, 48, 49, 50], "find": [21, 24, 27, 34], "fine": [15, 17, 25, 26, 27, 32, 33, 34, 48], "first": [1, 21, 24, 27, 29, 31, 34, 41, 48, 49], "first_layer_multipli": 1, "fix": 45, "fixed_scal": [18, 19, 45, 47], "fixed_zero_point": [18, 19, 45, 47], "flag": [1, 11, 40, 45], "flatten": [20, 28], "flip": 1, "float": [1, 4, 5, 11, 12, 14, 15, 16, 17, 21, 27, 29, 31, 34, 36, 37, 38, 41, 45, 46, 48, 49], "float32": [25, 32, 41], "float_model": [11, 36, 37, 38, 41, 48], "fold": [21, 24, 27, 29, 31, 34], "folder": [35, 48], "follow": [3, 4, 11, 12, 46, 48, 49], "footprint": [25, 32], "form": 45, "format": [3, 13], "found": 48, "fraction": 4, "framework": [3, 11, 46], "frameworkquantizationcap": [22, 29, 30, 31], "free": [6, 20, 25, 28, 32, 50], "freez": 46, "freeze_quant_param": 46, "friendli": [25, 32, 50], "from": [3, 4, 11, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 41, 43, 45, 46, 47, 48, 49, 50], "from_config": 46, "function": [3, 4, 5, 11, 12, 13, 14, 15, 16, 17, 20, 23, 25, 28, 32, 35, 43, 45, 46, 48], "further": 48, "fuse_op_quantization_config": 45, "fusing_pattern": 45, "futur": [18, 19, 20, 28, 45, 47], "g": [3, 11, 21, 24, 27, 29, 31, 34], "gather": [45, 49], "gaussian": [1, 14, 16], "gelu": 48, "gener": [2, 12, 13, 14, 16, 21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 36, 37, 38, 45, 48, 49, 50], "generated_imag": [20, 28], "get": [2, 3, 4, 5, 13, 21, 24, 26, 27, 29, 31, 33, 34, 45, 49], "get_config": 46, "get_input": 41, "get_keras_data_generation_config": [13, 14, 20], "get_keras_gptq_config": [13, 15, 21], "get_ort_session_opt": 41, "get_output": 41, "get_pytorch_data_generation_config": [13, 16, 28], "get_pytorch_gptq_config": [13, 17], "get_target_platform_cap": [13, 18, 45], "get_target_platform_capabilities_sdsp": [13, 19, 45], "git": 50, "github": [41, 50], "given": [2, 21, 22, 24, 27, 29, 30, 31, 34], "gordon": 50, "gptq": [4, 11, 15, 17, 21, 29], "gptq_conf": [15, 17, 29], "gptq_config": [21, 29, 31], "gptq_quantizer_params_overrid": 4, "gptq_representative_data_gen": [21, 29], "grad": 1, "gradient": [1, 4, 11, 13, 31, 50], "gradientptq": [4, 13], "gradientptqconfig": [13, 21, 29], "gradual": 4, "gradual_activation_quant": [15, 17], "gradual_activation_quantization_config": 4, "gradualactivationquant": [15, 17], "gradualactivationquantizationconfig": [15, 17], "granular": [1, 14, 16], "graph": [22, 30, 43, 49], "greater": 42, "greatereq": 42, "greedi": [5, 6], "group": [3, 6, 25, 32, 45], "h": 50, "ha": [7, 41, 42, 43, 48], "habi": 50, "handl": [11, 21, 24, 27, 29, 31, 34], "handler": 35, "hardwar": [13, 25, 32, 45, 46, 50], "have": [3, 41, 42, 48, 49], "henc": 45, "here": [12, 25, 32, 41, 45, 48, 50], "hessian": [4, 5, 6, 9, 11, 15, 17, 25, 32, 50], "hessian_batch_s": [4, 5, 15, 17], "hessian_weights_config": 4, "hessians_num_sampl": 4, "higher": [25, 32], "highlight": 48, "hight": 28, "histogram": [21, 24, 27, 29, 31, 34, 48, 49], "hmse": 9, "hold": [3, 39, 42, 45], "holder": 46, "how": [3, 6, 21, 22, 24, 27, 29, 31, 34, 41, 46, 50], "howev": 41, "hptq": [45, 50], "http": [46, 50], "hw": 22, "i": [1, 2, 3, 4, 5, 6, 7, 9, 12, 13, 15, 17, 20, 21, 24, 25, 26, 27, 28, 29, 31, 32, 34, 35, 39, 40, 41, 42, 43, 45, 46, 48, 49, 50], "ident": [1, 5], "identifi": [25, 32, 45, 48], "ignor": [18, 19, 45, 47], "ilp": [21, 24, 27, 34], "imag": [1, 4, 5, 11, 14, 16, 20, 21, 24, 27, 28, 29, 31, 34, 48, 49], "image_clip": [1, 14, 16], "image_granular": [1, 14, 16], "image_normalization_typ": [1, 14, 16], "image_pipeline_typ": [1, 14, 16], "imagegranular": [14, 16], "imagenet": 1, "imagenet1k_v1": 32, "imagenormalizationtyp": [14, 16], "imagepipelinetyp": [14, 16], "imagewis": 1, "impact": [25, 32], "implement": [12, 46], "implment": 46, "import": [3, 6, 7, 8, 11, 13, 15, 17, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 41, 43, 46, 48, 49], "importance_metr": 6, "importance_scor": 7, "improv": [5, 25, 32, 48], "imx500": [41, 45], "imx500_tp_model": 18, "in_model": [21, 22, 24, 26, 27, 30, 33, 34], "in_modul": [31, 48], "includ": [4, 7, 11, 21, 24, 27, 29, 31, 34, 45, 46], "increas": [4, 5], "index": [3, 13], "indic": [3, 7, 25, 32, 45, 48], "individu": 48, "induc": 9, "inf": [8, 10, 11], "infer": [13, 26, 33, 45, 46], "inferablequant": [26, 33], "inferencesess": 41, "info": [6, 35], "inform": [3, 4, 13, 15, 17, 18, 19, 21, 24, 25, 27, 29, 31, 32, 34, 40, 45, 46, 47], "infrastructur": 46, "init": [13, 43, 50], "initi": [1, 2, 4, 6, 11, 12, 14, 16, 27, 34, 46, 48], "initial_lr": [1, 14, 16], "initial_q_fract": 4, "inner": 2, "input": [1, 5, 11, 14, 16, 21, 24, 27, 29, 31, 34, 40, 45, 48], "input_sc": 8, "input_shap": 20, "insert": 49, "insert_preserving_quant": 45, "instal": 41, "instanc": [4, 11, 13, 15, 17, 43, 45, 49], "instanti": [4, 8, 44], "instead": 48, "instruct": [45, 48], "insuffici": [12, 48], "int": [0, 1, 4, 5, 6, 12, 14, 15, 16, 17, 20, 28, 35, 41, 45, 46, 48], "int8": 41, "integ": [5, 41, 45], "interest": 5, "interfac": [4, 11, 17], "internal_tpc": 11, "introduc": 46, "inverse_min_max_diff": 1, "involv": [20, 25, 28, 32], "is_detect_under_threshold_quantize_error": [12, 48], "is_keras_layer_export": 41, "is_layer_exportable_fn": 41, "is_pytorch_layer_export": 41, "is_simd_pad": 45, "issu": [5, 41, 48], "item": 48, "iter": [1, 14, 16, 20, 21, 24, 27, 28, 29, 31, 34], "its": [2, 3, 13, 23, 25, 32, 42, 45, 49], "jen": 50, "judg": [12, 13, 38, 48], "just": 50, "keep": [33, 50], "kei": [2, 11, 12, 25, 32, 42], "kept": [7, 27, 34], "ker": 27, "kera": [3, 11, 13, 43, 46, 50], "keras_appl": [1, 14], "keras_data_generation_experiment": [13, 20], "keras_default_tpc": 22, "keras_file_path": 41, "keras_gradient_post_training_quant": [13, 15, 21], "keras_load_quantized_model": 23, "keras_post_training_quant": [13, 24, 41, 43, 49], "keras_pruning_experiment": [13, 25], "keras_quantization_aware_training_finalize_experiment": [13, 26], "keras_quantization_aware_training_init_experiment": [13, 26, 27], "keras_resource_utilization_data": [13, 22], "kernel": [3, 21, 24, 26, 27, 43, 46], "kernel_channels_map": 3, "kernel_op": 3, "kernel_ops_attributes_map": 3, "keyword": 45, "kl": [9, 49], "know": [3, 13], "knowledg": [4, 50], "known_dict": 2, "kwarg": 43, "l": [25, 50], "l2": 1, "l2_squar": [1, 14, 16], "l_p_valu": 8, "label": [6, 25, 32, 45, 50], "lambda": 41, "larg": [12, 48], "larger": 5, "last": [3, 4, 5, 48], "last_lay": 5, "last_layer_typ": [1, 16], "latenc": 41, "latest": 50, "launch": 49, "layaer": [13, 38], "layer": [1, 3, 5, 7, 11, 12, 14, 15, 16, 17, 20, 21, 24, 25, 26, 27, 29, 31, 32, 33, 34, 40, 41, 43, 45, 46, 48, 49], "layer_min_max_map": 3, "layer_weighting_typ": [1, 14, 16], "layerfilterparam": 42, "learn": [1, 14, 15, 16, 46], "learnabl": 46, "least": 6, "less": 48, "let": 41, "level": 35, "lfh": [6, 25, 32], "librari": [3, 8], "like": [8, 45], "limit": [6, 21, 24, 26, 27, 29, 31, 34], "line": 48, "linear": [4, 11, 28], "linear_collaps": [8, 11, 48], "linearli": 4, "link": 48, "list": [0, 1, 3, 5, 11, 14, 15, 16, 20, 28, 40, 41, 43, 48, 50], "liter": 45, "ll": [20, 28], "load": [13, 26, 27, 41, 46], "load_model": [26, 27], "loadopt": 23, "log": [4, 12, 13, 15, 17, 35, 48, 49], "log_funct": [4, 15, 17], "log_norm": 4, "log_tensorboard_xqu": 48, "logdir": 49, "logger": [13, 40, 49], "longer": 41, "look": [24, 27, 34, 45, 50], "lookup": 45, "loss": [1, 4, 12, 14, 15, 16, 17, 21, 25, 29, 31, 32], "lower": 48, "lp": 9, "lsq": 46, "lut_pot_quant": 45, "lut_sym_quant": 45, "lut_values_bitwidth": 45, "mae": [9, 49], "mai": [20, 21, 24, 27, 28, 29, 31, 34, 42, 49], "main": [11, 45, 48, 49], "major": 48, "make": 9, "manag": [0, 11], "mandatori": 41, "mani": 49, "manipul": [0, 1], "manner": 45, "manual": [0, 13, 39, 48], "manual_activation_bit_width_selection_list": 0, "manual_weights_bit_width_selection_list": 0, "manualweightsbitwidthselect": 0, "map": [3, 45], "mask": 7, "match": [18, 19, 42, 43], "mathemat": 49, "max": [1, 3, 5, 8, 9, 21, 22, 24, 27, 29, 30, 31, 34, 49], "maxbit": 5, "maxim": [21, 24, 27, 34], "maximum": 48, "mct": [3, 8, 11, 13, 15, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 39, 40, 41, 43, 45, 46, 47, 48, 49, 50], "mct_current_schema": 45, "mct_quantiz": 41, "mct_wrapper": 11, "mctwrapper": 11, "mean": [1, 4, 9, 49], "measur": [6, 10, 12, 48, 49], "meet": [25, 32], "memori": [10, 25, 32, 49], "messag": 48, "metadata": [7, 45], "method": [4, 5, 6, 9, 11, 13, 25, 32, 35, 41, 43, 44, 45, 46, 48], "metric": [4, 5, 6, 12, 36, 37, 38, 48], "metric_epsilon": 5, "metric_norm": 5, "metric_normalization_threshold": 5, "min": [1, 3, 5, 8, 9, 21, 24, 27, 29, 31, 34, 49], "min_threshold": [8, 46], "minbit": 5, "minim": [5, 9, 21, 25, 29, 31, 32], "minimum": 46, "minor": 45, "minut": 50, "mix": [5, 10, 11, 12, 13, 21, 22, 24, 26, 27, 29, 30, 31, 34, 39, 45, 50], "mixed_precis": 11, "mixed_precision_config": [21, 22, 24, 26, 27, 39], "mixedprecisionquantizationconfig": [13, 21, 22, 24, 26, 27, 39], "mkstemp": 41, "mobilenet": [21, 22], "mobilenet_v2": [24, 26, 27, 29, 30, 31, 33, 34, 41], "mobilenetv2": [24, 26, 27, 41, 49], "model": [3, 4, 5, 7, 8, 10, 11, 12, 13, 18, 19, 20, 21, 24, 25, 28, 29, 31, 32, 36, 37, 38, 39, 40, 43, 44, 45, 46, 49], "model_compression_toolkit": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 48, 49], "model_fil": [26, 27], "model_format_onnx_mctq": 41, "model_mp": 5, "model_output": 41, "modifi": [13, 43], "modul": [13, 28, 29, 30, 31, 32, 37, 38], "more": [9, 18, 19, 24, 25, 27, 32, 34, 41, 45, 47, 48, 49], "most": 48, "move": 48, "mse": [8, 9, 11, 12, 48, 49], "multipl": [3, 5, 35, 45], "multiple_tensors_mse_loss": 4, "multipli": [1, 12, 14, 16, 48], "must": [25, 32, 45], "n_epoch": [4, 11, 15, 17, 21], "n_imag": [20, 28], "n_iter": [1, 14, 16, 20, 28], "nadam": 15, "name": [12, 43, 45, 48, 49], "nchw": 3, "ndarrai": 7, "necessari": [4, 41, 46, 48], "need": [3, 11, 13, 21, 24, 27, 29, 31, 34, 41, 42, 46], "neg": [1, 5], "negative_min_max_diff": [1, 16], "network": [3, 6, 11, 33, 39, 40, 43, 49, 50], "network_editor": [13, 40], "netzer": 50, "neural": [6, 11, 50], "neuron": 7, "new": [43, 45], "next": [20, 28, 41, 42, 48], "nhwc": 3, "nn": [28, 37, 38], "no_norm": 1, "no_quantization_op": 3, "noclip": [8, 9], "node": [0, 27, 34, 41, 43, 46, 49], "node_nam": 43, "node_name_scop": 43, "node_typ": 43, "nodenamefilt": 43, "nodenamescopefilt": 43, "nodetypefilt": 43, "nois": 9, "non": [5, 15, 17, 45], "none": [1, 2, 4, 5, 8, 11, 12, 15, 17, 21, 23, 24, 27, 29, 31, 34, 35, 39, 41, 43, 44, 45, 46, 48], "norm": [9, 49], "norm_scor": [4, 5], "normal": [1, 4, 5, 14, 16], "note": [21, 24, 26, 27], "notebook": 50, "noteq": 42, "notic": [20, 25, 28, 32, 41], "now": [6, 18, 19, 34, 41, 45, 46, 47, 49], "np": [7, 11, 21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 41], "num_calibration_batch": [21, 24, 27, 29, 31, 34], "num_interest_points_factor": 5, "num_of_imag": [5, 11, 21, 24], "num_score_approxim": [6, 25, 32], "number": [1, 4, 5, 6, 11, 12, 14, 15, 16, 17, 20, 21, 24, 25, 27, 28, 29, 31, 32, 34, 45, 46, 48], "numel": 32, "numer": 5, "numpi": [21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 41], "o": 50, "object": [0, 3, 4, 5, 6, 10, 12, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 26, 27, 29, 30, 31, 34, 41, 43, 45, 46], "observ": [21, 29, 31, 45, 49], "one": [5, 42, 49], "onli": [3, 4, 5, 6, 12, 21, 24, 26, 27, 41, 45], "onlin": [27, 34], "onnx": 11, "onnx_file_path": 41, "onnx_opset_vers": 41, "onnxruntim": 41, "op": [42, 45], "open": [41, 49, 50], "oper": [3, 10, 40, 42, 45, 48], "operator_group": 45, "operator_set": 45, "operators_set": 45, "operatorsetnam": 45, "opquantizationconfig": [18, 19, 47], "optim": [1, 3, 4, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 24, 27, 29, 30, 31, 34, 39, 45, 46, 47, 48, 50], "optimizer_bia": 4, "optimizer_quantization_paramet": 4, "optimizer_rest": [4, 15, 17], "optimizerv2": 15, "option": [11, 13, 21, 23, 24, 25, 27, 29, 31, 32, 34, 41, 45], "order": [15, 17, 21, 24, 27, 34, 40, 41, 42, 44, 48], "org": 46, "orient": [13, 46], "origin": [25, 35, 36, 37, 38, 49], "ort": 41, "other": [1, 11, 15, 17], "otherwis": 45, "our": [21, 24, 26, 27, 34, 50], "out": [3, 6], "out1": 50, "out2": 50, "out3": 50, "out_channel_axis_map": 3, "outlier": 12, "outlier_histgram": 48, "outlin": 48, "output": [1, 3, 12, 14, 16, 20, 21, 24, 27, 28, 29, 31, 33, 34, 45, 49, 50], "output_image_s": [20, 28], "output_loss_multipli": [1, 14, 16], "output_loss_typ": [1, 14, 16], "output_nam": 41, "outputlosstyp": [14, 16], "over": 5, "overrid": [4, 44], "overwrit": 5, "p": 32, "packag": [41, 46, 50], "pad": 45, "page": 13, "pair": 49, "param": [17, 40, 43, 46], "param_item": 11, "paramet": [1, 2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46], "pars": 45, "part": [41, 48], "pass": [2, 3, 5, 15, 17, 21, 24, 25, 26, 27, 29, 31, 32, 33, 34, 43], "patch": 45, "path": [11, 13, 23, 35, 41, 48, 49], "pattern": 45, "pdf": 46, "per": [1, 3, 4, 21, 24, 27, 34, 45, 46, 49], "per_sampl": 4, "percentag": 5, "peretz": 50, "perform": [6, 10, 11, 20, 25, 28, 32], "phase": 49, "pinpoint": 40, "pip": [41, 50], "pipelin": [1, 11, 14, 16], "pixel": [1, 14, 16], "place": 45, "plan": 41, "platform": [11, 18, 19, 21, 24, 25, 26, 27, 30, 32, 45], "pleas": [24, 27, 34, 41, 44, 48, 50], "plot": [40, 49], "png": 48, "point": [4, 5, 15, 17, 21, 29, 31, 36, 37, 38, 45, 49], "posit": 45, "possibl": [9, 21, 24, 27, 34, 45, 48, 49], "post": [4, 11, 13, 25, 27, 32, 34, 50], "power": [21, 24, 27, 29, 31, 34, 45], "power_of_two": 45, "poweroftwo": 46, "pre": 5, "preced": [21, 24, 27, 29, 31, 34], "precis": [5, 10, 11, 12, 13, 21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 34, 39, 45, 50], "predefin": [5, 6], "predict": 41, "prepar": [11, 13, 27, 34], "preprint": 50, "present": [2, 48, 49], "preserv": 45, "pretrain": [33, 34], "prevent": 5, "primari": 48, "prior": 5, "problemat": 40, "procedur": 48, "process": [4, 5, 8, 13, 14, 15, 16, 17, 18, 19, 20, 25, 28, 32, 39, 40, 43, 44, 45, 47, 49], "product": 49, "project": [41, 50], "properti": 7, "propos": [46, 48], "provid": [2, 11, 20, 25, 28, 32, 41, 45, 46, 48, 49], "prune": [10, 50], "pruned_model": [25, 32], "pruning_config": [25, 32], "pruning_info": [25, 32], "pruning_mask": 7, "pruning_num_score_approxim": 6, "pruningconfig": [6, 13, 25, 32], "pruninginfo": [7, 13, 25, 32], "ptq": [11, 24, 31, 41, 48], "purpos": [20, 28, 40], "py": 50, "pydantic_cor": 45, "pypi": 50, "python": [35, 50], "pytorch": [11, 13, 45, 46, 50], "pytorch_data_generation_experiment": [13, 28], "pytorch_default_tpc": 30, "pytorch_gradient_post_training_quant": [13, 17, 29], "pytorch_post_training_quant": [13, 31, 41, 48], "pytorch_pruning_experiment": [13, 32], "pytorch_quantization_aware_training_finalize_experiment": [13, 33], "pytorch_quantization_aware_training_init_experiment": [13, 33, 34], "pytorch_resource_utilization_data": [13, 30], "q": 41, "q_fraction_scheduler_polici": 4, "qat": [26, 27, 33, 34, 44], "qat_config": [13, 27, 34], "qatconfig": [27, 34], "qc": 8, "qc_option": 45, "qmodel": 11, "qnnpack": 45, "quant": 41, "quantifi": [7, 49], "quantiz": [0, 3, 4, 5, 8, 9, 11, 12, 13, 15, 17, 20, 22, 28, 30, 36, 37, 38, 39, 40, 43, 44, 45, 46, 49, 50], "quantization_config": [39, 46], "quantization_configur": 45, "quantization_format": 41, "quantization_info": [21, 24, 26, 27, 29, 31, 33, 34], "quantization_preserv": [18, 19, 45, 47], "quantizationconfig": [13, 39, 48], "quantizationerrormethod": [8, 11, 13], "quantizationmethod": [3, 46], "quantize_and_export": 11, "quantize_reported_dir": [12, 48], "quantized_exportable_model": 41, "quantized_info": 48, "quantized_model": [11, 21, 24, 26, 27, 33, 34, 36, 37, 38, 48], "quantized_modul": [29, 31], "quantizewrapp": [13, 27, 33, 34], "question": 41, "r": 50, "radam": 16, "rais": 45, "random": [21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 41], "random_data_gen": 48, "rang": [3, 12, 21, 24, 27, 29, 31, 34, 48], "rate": [1, 14, 15, 16], "ratio": [11, 12, 48], "readi": 33, "readm": 41, "recent": 48, "recommend": 48, "recov": [25, 32], "red": 48, "reduc": [5, 25, 32], "reduce_on_plateau": [1, 14], "reduce_on_plateau_with_reset": 16, "reduceonplateau": 1, "refer": [41, 48], "refine_mp_solut": 5, "regard": 42, "regular": [1, 4, 15, 17], "regularization_factor": [4, 15, 17], "regularized_min_max_diff": [1, 14], "relat": [3, 7, 13, 45], "releas": 50, "relev": [41, 48], "relu": 3, "relu_bound_to_power_of_2": 8, "remov": [12, 25, 32, 33], "replac": [26, 48], "report": [12, 13, 48], "report_dir": [12, 48], "repositori": 41, "repr_datagen": [21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34], "repr_dataset": [36, 37, 38, 41], "repres": [4, 5, 10, 11, 15, 17, 21, 24, 25, 26, 27, 29, 31, 32, 33, 34, 36, 37, 38, 41, 43, 45, 48, 49], "representative_data_gen": [21, 22, 24, 25, 27, 29, 30, 31, 32, 34, 41, 48], "representative_dataset": 11, "request": 2, "requir": [21, 24, 27, 29, 31, 34, 46, 48, 49], "research": 50, "reshap": [3, 20], "residu": 11, "residual_collaps": [8, 11, 48], "resnet50": [25, 32, 41], "resnet50_weight": 32, "resolv": 48, "resourc": [6, 10, 11, 13, 21, 24, 25, 26, 27, 32, 33, 34, 49], "resourceutil": [13, 21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 34], "respectivli": 3, "rest": 4, "retrain": [25, 32], "retriev": [18, 19, 45], "return": [2, 4, 5, 7, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 41], "round": 4, "rounding_typ": 4, "ru": [21, 24, 26, 27], "ru_data": [22, 30], "rule": [40, 43], "run": [4, 15, 17, 41, 49], "runner": 40, "runnnig": 48, "same": [1, 41, 45], "sampl": [4, 15, 17, 49], "save": [3, 11, 12, 27, 35, 41, 46, 48], "save_model_path": [11, 41], "saved_model": 23, "savedmodel": 23, "scalar": 49, "scale": [4, 5, 45, 48], "scale_log_norm": 4, "schedul": [1, 4, 14, 16, 40], "scheduler_typ": [1, 14, 16], "schedulertyp": [14, 16], "schema": 45, "schema_vers": 45, "score": [4, 5, 6, 7, 9, 11, 15, 17, 25, 32, 48], "sdsp": [13, 45], "sdsp_v3_14": 19, "sdsp_version": 19, "search": [5, 10, 13, 21, 24, 27, 29, 31, 34], "second": [48, 49], "section": 48, "see": [4, 17, 50], "seen": 49, "select": [0, 3, 6, 8, 9, 13, 39, 41, 44, 45, 46], "self": 45, "semiconductor": 50, "sensit": [5, 6, 25, 32], "sequenti": [20, 28], "serial": 13, "serialization_format": 41, "sess": 41, "session": 41, "set": [3, 11, 12, 13, 15, 17, 20, 21, 24, 25, 26, 27, 28, 29, 31, 32, 34, 35, 36, 37, 38, 41, 43, 45, 46, 48, 49], "set_log_fold": [35, 48, 49], "setup": [11, 50], "sever": [21, 24, 27, 29, 31, 34, 49], "shift_negative_activation_correct": 8, "shift_negative_params_search": 8, "shift_negative_ratio": 8, "shift_negative_threshold_recalcul": 8, "shortli": 45, "should": [3, 6, 15, 21, 22, 24, 25, 26, 27, 29, 31, 32, 34, 41, 45, 49], "show": [48, 49], "shown": 48, "side": 48, "sigma": 5, "signal": 9, "signed": 45, "signific": 7, "significantli": 48, "simd": [25, 32, 45], "simd_siz": 45, "similar": [9, 12, 36, 37, 38, 40, 50], "similarli": 45, "simpl": [20, 28], "simplic": [20, 28], "simul": 40, "simulate_schedul": 40, "simultan": 45, "singl": 45, "six": 48, "size": [1, 4, 5, 14, 15, 16, 17, 20, 21, 24, 26, 27, 28, 34, 41, 46], "skip": [12, 40, 41, 48], "slowli": 41, "small": 48, "smaller": 42, "smallereq": 42, "smooth": [1, 46], "smoothing_and_augment": [1, 14, 16], "so": 41, "softmax": 3, "softmax_shift": 8, "softquant": 4, "solut": 50, "solver": [21, 24, 27, 34], "some": [18, 19, 20, 28, 41, 45, 47, 48, 49], "soni": 50, "sonysemiconductorsolut": 50, "sourc": 50, "specif": [0, 3, 11, 13, 25, 32, 43, 48, 49], "specifi": [6, 12, 14, 16, 18, 20, 23, 25, 28, 32, 41, 45, 48], "sphinx": 13, "sqnr": [12, 48], "squar": [1, 9], "stabl": 50, "stage": 49, "stages_0_blocks_0_token_mixer_mixer_conv_kxk_0_conv_bn": 48, "stages_0_blocks_0_token_mixer_mixer_conv_scale_conv_bn": 48, "standard": [25, 32, 46], "start": [20, 28, 41, 46, 50], "start_step": 4, "state": [48, 50], "state_dict": 32, "statist": [3, 21, 24, 27, 29, 31, 34, 49], "ste": [4, 44, 46], "stem_0_act": 48, "stem_1_act": 48, "stem_2_act": 48, "stem_2_conv_kxk_0_conv_bn": 48, "step": [1, 4, 46, 48], "store": [7, 46], "str": [3, 11, 12, 18, 19, 21, 22, 24, 25, 27, 29, 30, 31, 32, 34, 35, 36, 37, 38, 41, 42, 45, 48], "straight": [4, 46], "strategi": [6, 25, 32], "string": 43, "structur": [13, 50], "student": 4, "success": 11, "suffer": 41, "suggest": 48, "sum": [10, 22, 25, 30, 32], "support": [4, 11, 41], "supported_input_activation_n_bit": 45, "symmetr": [21, 24, 27, 29, 31, 34, 45, 46], "t": [35, 50], "tab": 49, "tabl": [45, 48], "tag": 49, "take": [5, 24, 27, 34, 50], "target": [4, 11, 13, 18, 19, 21, 22, 24, 25, 26, 27, 30, 32, 33, 34, 45], "target_platform_cap": [21, 22, 24, 25, 27, 29, 30, 31, 32, 34, 42, 46], "target_platform_vers": 11, "target_q_fract": 4, "target_resource_util": [21, 24, 25, 27, 29, 31, 32, 34], "targetplatformcap": [13, 21, 22, 24, 25, 27, 29, 30, 31, 32, 34], "teacher": 4, "tempfil": 41, "tensor": [5, 11, 12, 15, 17, 20, 22, 28, 30, 45, 46, 49, 50], "tensorboard": [40, 48, 50], "tensorflow": [3, 11, 13, 15, 20, 21, 22, 24, 25, 26, 27, 41, 43, 45, 50], "tf": [3, 11, 15, 20, 23, 26, 27], "tflite": [41, 45], "than": [5, 42, 48], "thei": 3, "them": [45, 49], "therefor": 48, "thi": [5, 7, 8, 9, 11, 13, 20, 21, 23, 24, 25, 26, 27, 28, 29, 31, 32, 34, 35, 41, 45, 46, 48, 50], "three": [3, 48], "threshold": [5, 8, 9, 11, 12, 21, 24, 27, 29, 31, 34, 45, 46, 48], "threshold_bitwidth_mixed_precis": 48, "threshold_bitwidth_mixed_precision_with_model_output_loss_object": [12, 48], "threshold_degrade_layer_ratio": [12, 48], "threshold_degration_layer_ratio": 48, "threshold_quantize_error": [12, 48], "threshold_ratio_unbalanced_concaten": [12, 48], "threshold_ratio_unbalanced_concatn": 48, "threshold_zscore_outlier_remov": [12, 48], "through": [4, 20, 25, 28, 46], "throughout": 4, "thu": [25, 32, 49], "time": [3, 6, 46], "togeth": [25, 32], "tool": [13, 46, 50], "toolkit": [11, 13, 20, 28, 29, 48], "torch": [17, 28, 37, 38, 41, 50], "torchscript": 41, "torchvis": [1, 16, 29, 30, 31, 32, 33, 34, 41], "total": [10, 22, 30, 48], "total_memori": 10, "tpc": [11, 13, 25, 32, 45], "tpc_minor_vers": 45, "tpc_patch_vers": 45, "tpc_platform_typ": 45, "tpc_v1_0": 18, "tpc_version": [11, 18], "trace": 41, "train": [4, 11, 13, 44, 46, 50], "train_bia": 4, "trainabl": [23, 26, 46], "trainable_infrastructur": 44, "trainablequant": 26, "transform": [1, 21, 24, 27, 29, 31, 34], "transpos": 3, "treat": 45, "troubleshoot": [13, 48], "true": [1, 5, 8, 11, 12, 15, 16, 17, 23, 33, 34, 46, 48], "try": 5, "tun": 34, "tune": [15, 17, 25, 26, 27, 32, 33], "tupl": [1, 3, 11, 14, 16, 20, 21, 24, 25, 28, 29, 31, 32, 43, 45], "tutori": 48, "two": [5, 12, 21, 24, 27, 29, 31, 34, 41, 45, 48, 49], "type": [0, 1, 2, 4, 5, 6, 7, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 28, 29, 30, 31, 32, 35, 36, 37, 38, 41, 43, 45, 48], "ui": 49, "unbalanc": 12, "unchang": 40, "under": 49, "unifi": 11, "uniform": [45, 46], "union": [1, 14, 16, 20, 21, 22, 24, 25, 27, 28, 29, 30, 31, 32, 34, 45], "uniqu": 45, "unusu": 48, "up": [6, 20, 28, 35, 45, 49], "updat": [4, 11], "upon": 46, "upper": 48, "us": [0, 1, 2, 3, 4, 5, 6, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50], "use_hessian_based_scor": [5, 11], "use_hessian_based_weight": [15, 17], "use_hessian_sample_attent": [15, 17], "use_internal_tpc": 11, "use_mixed_precis": 11, "user": [11, 13, 21, 24, 26, 27, 29, 31, 33, 34, 48], "userinform": [21, 24, 29, 31], "util": [6, 11, 13, 21, 24, 25, 26, 27, 32, 33, 34, 46], "v": 50, "v1": 11, "valid": [36, 37, 38, 45, 46, 48], "validation_dataset": [36, 37, 38, 48], "validationerror": 45, "valu": [1, 2, 3, 4, 5, 6, 9, 11, 12, 21, 24, 25, 26, 27, 32, 41, 42, 43, 45, 46, 48], "valuabl": 9, "variabl": [15, 17], "variou": [11, 20, 28, 49], "vector": [4, 49], "verbos": 35, "version": [11, 13, 20, 28, 45], "via": [41, 50], "view": 49, "visit": [44, 50], "visual": [48, 50], "wa": [2, 41, 48], "wai": [49, 50], "walk": [20, 28], "want": 3, "warn": 48, "we": [3, 20, 21, 24, 25, 27, 28, 32, 34, 41, 43, 45, 46, 48, 49], "weight": [0, 1, 3, 4, 5, 8, 10, 11, 14, 15, 16, 17, 21, 22, 25, 27, 29, 30, 31, 32, 33, 34, 41, 43, 44, 45, 46, 49], "weight_quantizer_params_overrid": 44, "weight_training_method": 44, "weights_bias_correct": [8, 11], "weights_channels_axi": 46, "weights_compression_ratio": 11, "weights_error_method": 8, "weights_memori": [6, 10, 21, 24, 25, 27, 32, 34], "weights_n_bit": [43, 45, 46], "weights_per_channel_threshold": [45, 46], "weights_quantization_candid": 46, "weights_quantization_method": [43, 45, 46], "weights_quantization_param": 46, "weights_quantization_params_fn": 43, "weights_second_moment_correct": 8, "were": 49, "when": [1, 2, 3, 4, 5, 6, 9, 10, 12, 13, 15, 17, 21, 24, 26, 27, 40, 41, 42, 44, 45, 46, 48, 49], "where": [7, 12, 41, 43, 48, 49], "whether": [4, 5, 7, 11, 14, 15, 16, 17, 23, 40, 41, 45, 46], "which": [4, 6, 40, 41, 42, 43, 45, 46, 48], "while": [8, 21, 24, 26, 27, 34, 45], "who": 48, "width": [0, 5, 12, 13, 21, 24, 27, 28, 34, 39, 45, 48, 50], "within": [40, 45, 50], "without": 13, "work": 50, "would": 49, "wrap": [2, 3, 23, 27, 34, 42, 45, 46], "wrapper": [27, 33, 34, 46], "writer": 49, "x": 48, "xquant": 50, "xquant_config": [12, 36, 37, 38, 48], "xquant_report_keras_experiment": [13, 36], "xquant_report_pytorch_experiment": [13, 37, 48], "xquant_report_troubleshoot_pytorch_experiment": [12, 13, 38, 48], "xquantconfig": [12, 13, 36, 37, 38], "y": 48, "yield": [21, 22, 24, 25, 26, 27, 29, 30, 31, 32, 33, 34, 41], "you": [8, 41, 45, 48, 49, 50], "your": 41, "z": [11, 48], "z_score": [12, 48], "z_threshold": [8, 11, 48], "zero": [5, 45], "zscore": 48}, "titles": ["BitWidthConfig", "Data Generation Configuration", "DefaultDict Class", "FrameworkInfo Class", "GradientPTQConfig Class", "MixedPrecisionQuantizationConfig", "Pruning Configuration", "Pruning Information", "QuantizationConfig", "QuantizationErrorMethod", "ResourceUtilization", "wrapper", "XQuant Configuration", "API Docs", "Get DataGenerationConfig for Keras Models", "Get GradientPTQConfig for Keras Models", "Get DataGenerationConfig for Pytorch Models", "Get GradientPTQConfig for Pytorch Models", "Get TargetPlatformCapabilities for tpc version", "Get TargetPlatformCapabilities for sdsp converter version", "Keras Data Generation", "Keras Gradient Based Post Training Quantization", "Get Resource Utilization information for Keras Models", "Load Quantized Keras Model", "Keras Post Training Quantization", "Keras Structured Pruning", "Keras Quantization Aware Training Model Finalize", "Keras Quantization Aware Training Model Init", "Pytorch Data Generation", "Pytorch Gradient Based Post Training Quantization", "Get Resource Utilization information for PyTorch Models", "Pytorch Post Training Quantization", "Pytorch Structured Pruning", "PyTorch Quantization Aware Training Model Finalize", "PyTorch Quantization Aware Training Model Init", "Enable a Logger", "XQuant Report Keras", "XQuant Report Pytorch", "XQuant Report Troubleshoot Pytorch", "CoreConfig", "debug_config Module", "exporter Module", "Layer Attributes Filters", "network_editor Module", "qat_config Module", "target_platform_capabilities Module", "trainable_infrastructure Module", "<no title>", "XQuant Extension Tool", "Visualization within TensorBoard", "Model Compression Toolkit User Guide"], "titleterms": {"about": 48, "action": 43, "activ": 48, "api": [13, 50], "attribut": 42, "attributequantizationconfig": 45, "awar": [26, 27, 33, 34], "base": [21, 29], "basekerastrainablequant": 46, "basepytorchtrainablequant": 46, "batchnormalignemntlosstyp": 1, "bit": 49, "bitwidthconfig": 0, "bnlayerweightingtyp": 1, "channelaxi": 3, "channelsfilteringstrategi": 6, "class": [2, 3, 4], "comparison": 49, "compress": 50, "concatn": 48, "configur": [1, 6, 12, 49], "constraint": 50, "convert": 19, "core": 13, "coreconfig": 39, "cosin": 49, "data": [1, 20, 28], "data_gener": 13, "datagenerationconfig": [14, 16], "datainittyp": 1, "debug_config": 40, "debugconfig": 40, "defaultdict": 2, "doc": 13, "document": 50, "editrul": 43, "enabl": 35, "error": 48, "exampl": 48, "export": [13, 41], "extens": 48, "featur": 50, "filter": [42, 43], "final": [26, 33], "flow": 48, "format": [41, 48], "frameworkinfo": 3, "fuse": 45, "gener": [1, 20, 28], "get": [14, 15, 16, 17, 18, 19, 22, 30], "gptq": 13, "gptqhessianscoresconfig": 4, "gradient": [21, 29], "gradientptqconfig": [4, 15, 17], "gradualactivationquantizationconfig": 4, "graph": 48, "guid": 50, "how": 48, "imagegranular": 1, "imagenormalizationtyp": 1, "imagepipelinetyp": 1, "importancemetr": 6, "indic": 13, "infer": 41, "inform": [7, 22, 30], "init": [27, 34], "instal": 50, "judgment": 48, "kera": [14, 15, 20, 21, 22, 23, 24, 25, 26, 27, 36, 41], "keras_export_model": 41, "keras_load_quantized_model": 13, "kerasexportserializationformat": 41, "layer": 42, "load": 23, "logger": 35, "loss": 48, "manualbitwidthselect": 0, "mctq": 41, "mix": [48, 49], "mixedprecisionquantizationconfig": 5, "model": [14, 15, 16, 17, 22, 23, 26, 27, 30, 33, 34, 41, 48, 50], "modul": [40, 41, 43, 44, 45, 46], "mpdistanceweight": 5, "mpmetricnorm": 5, "name": 41, "neg": 48, "network_editor": 43, "object": 48, "onnx": 41, "operatorsetgroup": 45, "operatorsset": 45, "opquantizationconfig": 45, "opset": 41, "outlier": 48, "output": [41, 48], "outputlosstyp": 1, "overal": 48, "overview": 50, "paramet": 48, "post": [21, 24, 29, 31], "precis": [48, 49], "process": 48, "prune": [6, 7, 13, 25, 32], "ptq": 13, "pytorch": [16, 17, 28, 29, 30, 31, 32, 33, 34, 37, 38, 41], "pytorch_export_model": 41, "pytorchexportserializationformat": 41, "qat": 13, "qat_config": 44, "qatconfig": 44, "qfractionlinearannealingconfig": 4, "quantiz": [21, 23, 24, 26, 27, 29, 31, 33, 34, 41, 48], "quantizationconfig": 8, "quantizationconfigopt": 45, "quantizationerrormethod": 9, "quantizationformat": 41, "quantizationmethod": 45, "quickstart": 50, "refer": 50, "remov": 48, "report": [36, 37, 38], "resourc": [22, 30], "resourceutil": 10, "result": 48, "roundingtyp": 4, "run": 48, "schedulertyp": 1, "sdsp": 19, "serial": 41, "set_log_fold": 13, "shift": 48, "similar": 49, "structur": [25, 32], "support": 50, "tabl": 13, "target_platform_cap": [13, 45], "targetplatformcap": [18, 19, 45], "technic": 50, "tensorboard": 49, "tool": 48, "toolkit": 50, "tpc": 18, "train": [21, 24, 26, 27, 29, 31, 33, 34], "trainable_infrastructur": [13, 46], "trainablequantizeractivationconfig": 46, "trainablequantizerweightsconfig": 46, "trainingmethod": [44, 46], "troubleshoot": 38, "tutori": 41, "unbalanc": 48, "understand": 48, "us": 41, "user": 50, "util": [22, 30], "version": [18, 19, 41], "visual": 49, "width": 49, "within": 49, "wrapper": [11, 13], "xquant": [12, 13, 36, 37, 38, 48], "xquantconfig": 48}}) \ No newline at end of file diff --git a/docs/static/bizstyle.js b/docs/static/bizstyle.js index c41d70ef0..0c0229c5d 100644 --- a/docs/static/bizstyle.js +++ b/docs/static/bizstyle.js @@ -17,7 +17,7 @@ const initialiseBizStyle = () => { } window.addEventListener("resize", - () => (document.querySelector("li.nav-item-0 a").innerText = (window.innerWidth <= 776) ? "Top" : "MCT Documentation: ver 2.5.0") + () => (document.querySelector("li.nav-item-0 a").innerText = (window.innerWidth <= 776) ? "Top" : "MCT Documentation: ver 2.5.1") ) if (document.readyState !== "loading") initialiseBizStyle() diff --git a/docs/static/documentation_options.js b/docs/static/documentation_options.js index 041a37c40..af417e6d9 100644 --- a/docs/static/documentation_options.js +++ b/docs/static/documentation_options.js @@ -1,5 +1,5 @@ const DOCUMENTATION_OPTIONS = { - VERSION: '2.5.0', + VERSION: '2.5.1', LANGUAGE: 'en', COLLAPSE_INDEX: false, BUILDER: 'html', diff --git a/docsrc/source/api/api_docs/index.rst b/docsrc/source/api/api_docs/index.rst index 53a0ef9b1..9299c1f9f 100644 --- a/docsrc/source/api/api_docs/index.rst +++ b/docsrc/source/api/api_docs/index.rst @@ -109,7 +109,8 @@ keras_load_quantized_model target_platform_capabilities ============================== - :ref:`target_platform_capabilities`: Module to create and model hardware-related settings to optimize the model according to, by the hardware the optimized model will use during inference. -- :ref:`get_target_platform_capabilities`: A function to get a target platform model for Tensorflow and Pytorch. +- :ref:`get_target_platform_capabilities`: A function to get a TargetPlatformCapabilities for tpc version and device type. +- :ref:`get_target_platform_capabilities_sdsp`: A function to get a TargetPlatformCapabilities for sdsp converter version. - :ref:`DefaultDict`: Util class for creating a TargetPlatformCapabilities. wrapper diff --git a/docsrc/source/api/api_docs/methods/get_target_platform_capabilities.rst b/docsrc/source/api/api_docs/methods/get_target_platform_capabilities.rst index e8346a359..0fbb7ff66 100644 --- a/docsrc/source/api/api_docs/methods/get_target_platform_capabilities.rst +++ b/docsrc/source/api/api_docs/methods/get_target_platform_capabilities.rst @@ -3,9 +3,9 @@ .. _ug-get_target_platform_capabilities: -======================================= -Get FrameworkQuantizationCapabilities -======================================= +===================================================== +Get TargetPlatformCapabilities for tpc version +===================================================== .. autofunction:: model_compression_toolkit.get_target_platform_capabilities diff --git a/docsrc/source/api/api_docs/methods/get_target_platform_capabilities_sdsp.rst b/docsrc/source/api/api_docs/methods/get_target_platform_capabilities_sdsp.rst new file mode 100644 index 000000000..d5b0f0f24 --- /dev/null +++ b/docsrc/source/api/api_docs/methods/get_target_platform_capabilities_sdsp.rst @@ -0,0 +1,13 @@ +:orphan: + +.. _ug-get_target_platform_capabilities_sdsp: + + +============================================================= +Get TargetPlatformCapabilities for sdsp converter version +============================================================= + +.. autofunction:: model_compression_toolkit.get_target_platform_capabilities_sdsp + + +.. include:: ../notes/tpc_note.rst \ No newline at end of file diff --git a/docsrc/source/api/api_docs/modules/target_platform_capabilities.rst b/docsrc/source/api/api_docs/modules/target_platform_capabilities.rst index f0d1eb94a..c6b0504e6 100644 --- a/docsrc/source/api/api_docs/modules/target_platform_capabilities.rst +++ b/docsrc/source/api/api_docs/modules/target_platform_capabilities.rst @@ -16,7 +16,8 @@ Conv2D `_, and can be used using :ref:`get_target_platform_capabilities function`. +Models for IMX500, TFLite and qnnpack can be observed `here `_, and can be retrieved using :ref:`get_target_platform_capabilities function`. +You can also get the model for IMX500 using :ref:`get_target_platform_capabilities_sdsp function` that specifies the sdsp converter version. | diff --git a/model_compression_toolkit/__init__.py b/model_compression_toolkit/__init__.py index 3ca04916d..e0ca0782c 100644 --- a/model_compression_toolkit/__init__.py +++ b/model_compression_toolkit/__init__.py @@ -15,7 +15,8 @@ from model_compression_toolkit.defaultdict import DefaultDict from model_compression_toolkit import target_platform_capabilities -from model_compression_toolkit.target_platform_capabilities.tpc_models.get_target_platform_capabilities import get_target_platform_capabilities +from model_compression_toolkit.target_platform_capabilities.tpc_models.get_target_platform_capabilities import get_target_platform_capabilities, \ + get_target_platform_capabilities_sdsp from model_compression_toolkit import core from model_compression_toolkit.logger import set_log_folder from model_compression_toolkit import trainable_infrastructure diff --git a/model_compression_toolkit/target_platform_capabilities/tpc_models/get_target_platform_capabilities.py b/model_compression_toolkit/target_platform_capabilities/tpc_models/get_target_platform_capabilities.py index 186abffb1..2428f4551 100644 --- a/model_compression_toolkit/target_platform_capabilities/tpc_models/get_target_platform_capabilities.py +++ b/model_compression_toolkit/target_platform_capabilities/tpc_models/get_target_platform_capabilities.py @@ -28,7 +28,7 @@ def get_target_platform_capabilities(tpc_version: str = TPC_V1_0, device_type (str): The type of device for the target platform. Returns: - TargetPlatformCapabilities: The TargetPlatformCapabilities object. + The TargetPlatformCapabilities object matching the tpc version. """ # Generate a function containing tpc configurations for the specified device type. tpc_func = generate_tpc_func(device_type=device_type) @@ -48,7 +48,7 @@ def get_target_platform_capabilities_sdsp(sdsp_version: str = SDSP_V3_14) -> Tar sdsp_version (str): Sdsp converter version. Returns: - TargetPlatformCapabilities: The TargetPlatformCapabilities object. + The TargetPlatformCapabilities object matching the sdsp converter version. """ sdsp_version = str(sdsp_version) # Get the corresponding tpc version from sdsp converter version. @@ -77,7 +77,7 @@ def get_tpc_model(name: str, tpc: TargetPlatformCapabilities): tpc (TargetPlatformCapabilities): a TargetPlatformCapabilities to return. Returns: - TargetPlatformCapabilities: The given TargetPlatformCapabilities object. + The given TargetPlatformCapabilities object. """