From 79a800ca901d408b92036486493fd59ace810536 Mon Sep 17 00:00:00 2001 From: reuvenp Date: Thu, 7 Mar 2024 16:55:01 +0200 Subject: [PATCH 1/9] remove tfmot - docsrc --- docsrc/source/index.rst | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docsrc/source/index.rst b/docsrc/source/index.rst index bd91fe81f..c6a9b0be0 100644 --- a/docsrc/source/index.rst +++ b/docsrc/source/index.rst @@ -41,7 +41,7 @@ A nightly version is also available (unstable): For using with Tensorflow please install the packages: `tensorflow `_ -`tensorflow-model-optimization `_ + For using with Pytorch please install the package: `torch `_ From 3dd18320fec3ec847bd872858be4c0ae59e64002 Mon Sep 17 00:00:00 2001 From: reuvenp Date: Thu, 7 Mar 2024 17:11:20 +0200 Subject: [PATCH 2/9] update mct internal packaging - docsrc --- .../api/api_docs/methods/keras_kpi_data.rst | 2 +- .../keras_post_training_quantization.rst | 2 +- ..._training_quantization_mixed_precision.rst | 10 -------- .../api/api_docs/methods/pytorch_kpi_data.rst | 2 +- .../pytorch_post_training_quantization.rst | 2 +- ..._training_quantization_mixed_precision.rst | 10 -------- .../mixed_precision_quantization_config.rst | 4 ++-- .../classes/FolderImageLoader.rst | 2 +- .../classes/FrameworkInfo.rst | 4 ++-- .../classes/GradientPTQConfig.rst | 9 ------- .../keras_data_generation_experimental.rst | 4 ++-- ...ost_training_quantization_experimental.rst | 4 ++-- .../methods/keras_kpi_data_experimental.rst | 4 ++-- ...ost_training_quantization_experimental.rst | 4 ++-- ...s_quantization_aware_training_finalize.rst | 4 ++-- ...keras_quantization_aware_training_init.rst | 4 ++-- ...ost_training_quantization_experimental.rst | 4 ++-- .../methods/pytorch_kpi_data_experimental.rst | 4 ++-- ...ost_training_quantization_experimental.rst | 4 ++-- ...h_quantization_aware_training_finalize.rst | 4 ++-- ...torch_quantization_aware_training_init.rst | 4 ++-- .../modules/debug_config.rst | 2 +- .../mixed_precision_quantization_config.rst | 4 ++-- .../modules/network_editor.rst | 24 +++++++++---------- .../modules/quantization_config.rst | 4 ++-- 25 files changed, 48 insertions(+), 77 deletions(-) delete mode 100644 docsrc/source/api/api_docs/methods/keras_post_training_quantization_mixed_precision.rst delete mode 100644 docsrc/source/api/api_docs/methods/pytorch_post_training_quantization_mixed_precision.rst diff --git a/docsrc/source/api/api_docs/methods/keras_kpi_data.rst b/docsrc/source/api/api_docs/methods/keras_kpi_data.rst index d1af078dc..a0205814f 100644 --- a/docsrc/source/api/api_docs/methods/keras_kpi_data.rst +++ b/docsrc/source/api/api_docs/methods/keras_kpi_data.rst @@ -7,4 +7,4 @@ Get KPI information for Keras Models ======================================= -.. autofunction:: model_compression_toolkit.keras_kpi_data +.. autofunction:: model_compression_toolkit.core.keras_kpi_data diff --git a/docsrc/source/api/api_docs/methods/keras_post_training_quantization.rst b/docsrc/source/api/api_docs/methods/keras_post_training_quantization.rst index 9a14b4510..82a351716 100644 --- a/docsrc/source/api/api_docs/methods/keras_post_training_quantization.rst +++ b/docsrc/source/api/api_docs/methods/keras_post_training_quantization.rst @@ -7,4 +7,4 @@ Keras Post Training Quantization ================================= -.. autofunction:: model_compression_toolkit.keras_post_training_quantization +.. 
autofunction:: model_compression_toolkit.ptq.keras_post_training_quantization diff --git a/docsrc/source/api/api_docs/methods/keras_post_training_quantization_mixed_precision.rst b/docsrc/source/api/api_docs/methods/keras_post_training_quantization_mixed_precision.rst deleted file mode 100644 index 650cc4c70..000000000 --- a/docsrc/source/api/api_docs/methods/keras_post_training_quantization_mixed_precision.rst +++ /dev/null @@ -1,10 +0,0 @@ -:orphan: - -.. _ug-keras_post_training_quantization_mixed_precision: - - -================================================================== -Keras Post Training Mixed Precision Quantization -================================================================== - -.. autofunction:: model_compression_toolkit.keras_post_training_quantization_mixed_precision diff --git a/docsrc/source/api/api_docs/methods/pytorch_kpi_data.rst b/docsrc/source/api/api_docs/methods/pytorch_kpi_data.rst index be83da8d2..86f512eae 100644 --- a/docsrc/source/api/api_docs/methods/pytorch_kpi_data.rst +++ b/docsrc/source/api/api_docs/methods/pytorch_kpi_data.rst @@ -7,4 +7,4 @@ Get KPI information for PyTorch Models ======================================= -.. autofunction:: model_compression_toolkit.pytorch_kpi_data +.. autofunction:: model_compression_toolkit.core.pytorch_kpi_data diff --git a/docsrc/source/api/api_docs/methods/pytorch_post_training_quantization.rst b/docsrc/source/api/api_docs/methods/pytorch_post_training_quantization.rst index e3ddfb201..46feca7ba 100644 --- a/docsrc/source/api/api_docs/methods/pytorch_post_training_quantization.rst +++ b/docsrc/source/api/api_docs/methods/pytorch_post_training_quantization.rst @@ -7,4 +7,4 @@ Pytorch Post Training Quantization ===================================== -.. autofunction:: model_compression_toolkit.pytorch_post_training_quantization +.. autofunction:: model_compression_toolkit.ptq.pytorch_post_training_quantization diff --git a/docsrc/source/api/api_docs/methods/pytorch_post_training_quantization_mixed_precision.rst b/docsrc/source/api/api_docs/methods/pytorch_post_training_quantization_mixed_precision.rst deleted file mode 100644 index 72d318522..000000000 --- a/docsrc/source/api/api_docs/methods/pytorch_post_training_quantization_mixed_precision.rst +++ /dev/null @@ -1,10 +0,0 @@ -:orphan: - -.. _ug-pytorch_post_training_quantization_mixed_precision: - - -================================================================== -PyTorch Post Training Mixed Precision Quantization -================================================================== - -.. autofunction:: model_compression_toolkit.pytorch_post_training_quantization_mixed_precision diff --git a/docsrc/source/api/api_docs/modules/mixed_precision_quantization_config.rst b/docsrc/source/api/api_docs/modules/mixed_precision_quantization_config.rst index e48b66381..4745b0b69 100644 --- a/docsrc/source/api/api_docs/modules/mixed_precision_quantization_config.rst +++ b/docsrc/source/api/api_docs/modules/mixed_precision_quantization_config.rst @@ -12,7 +12,7 @@ KPI ================================ **Object to configure resources to use when searching for a mixed-precision configuration for a model:** -.. autoclass:: model_compression_toolkit.KPI +.. autoclass:: model_compression_toolkit.core.KPI :noindex: @@ -23,5 +23,5 @@ MixedPrecisionQuantizationConfig ================================= **Class to configure the quantization process of the model when quantizing in mixed-precision:** -.. autoclass:: model_compression_toolkit.MixedPrecisionQuantizationConfig +.. 
autoclass:: model_compression_toolkit.core.MixedPrecisionQuantizationConfig diff --git a/docsrc/source/api/experimental_api_docs/classes/FolderImageLoader.rst b/docsrc/source/api/experimental_api_docs/classes/FolderImageLoader.rst index e9fda9d43..6897e353f 100644 --- a/docsrc/source/api/experimental_api_docs/classes/FolderImageLoader.rst +++ b/docsrc/source/api/experimental_api_docs/classes/FolderImageLoader.rst @@ -8,7 +8,7 @@ Folder Image Loader API **The following API can be used to load a folder of images to create a representative dataset for PTQ calibration** -.. autoclass:: model_compression_toolkit.FolderImageLoader +.. autoclass:: model_compression_toolkit.core.FolderImageLoader :members: diff --git a/docsrc/source/api/experimental_api_docs/classes/FrameworkInfo.rst b/docsrc/source/api/experimental_api_docs/classes/FrameworkInfo.rst index 8aa3bcd52..2338a7dd4 100644 --- a/docsrc/source/api/experimental_api_docs/classes/FrameworkInfo.rst +++ b/docsrc/source/api/experimental_api_docs/classes/FrameworkInfo.rst @@ -9,7 +9,7 @@ FrameworkInfo Class **The following API can be used to pass MCT framework-related information to use when optimizing the network** -.. autoclass:: model_compression_toolkit.FrameworkInfo +.. autoclass:: model_compression_toolkit.core.FrameworkInfo | @@ -19,5 +19,5 @@ ChannelAxis ========================== **Enum to select the output channels format in the model:** -.. autoclass:: model_compression_toolkit.ChannelAxis +.. autoclass:: model_compression_toolkit.core.ChannelAxis diff --git a/docsrc/source/api/experimental_api_docs/classes/GradientPTQConfig.rst b/docsrc/source/api/experimental_api_docs/classes/GradientPTQConfig.rst index caea133e0..11a79e1c8 100644 --- a/docsrc/source/api/experimental_api_docs/classes/GradientPTQConfig.rst +++ b/docsrc/source/api/experimental_api_docs/classes/GradientPTQConfig.rst @@ -2,15 +2,6 @@ .. _ug-GradientPTQConfig: -================================= -GradientPTQConfigV2 Class -================================= - -**The following API can be used to create a GradientPTQConfigV2 instance which can be used for post training quantization using knowledge distillation from a teacher (float model) to a student (the quantized model). This is experimental and subject to future changes.** - -.. autoclass:: model_compression_toolkit.gptq.GradientPTQConfigV2 - :members: - ================================= GradientPTQConfig Class diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_data_generation_experimental.rst b/docsrc/source/api/experimental_api_docs/methods/keras_data_generation_experimental.rst index 20865d616..66dfa8dcf 100644 --- a/docsrc/source/api/experimental_api_docs/methods/keras_data_generation_experimental.rst +++ b/docsrc/source/api/experimental_api_docs/methods/keras_data_generation_experimental.rst @@ -1,10 +1,10 @@ :orphan: -.. _ug-tensorflow_data_generation_experimental: +.. _ug-keras_data_generation_experimental: ===================================== Keras Data Generation ===================================== -.. autofunction:: model_compression_toolkit.data_generation.tensorflow_data_generation_experimental +.. 
autofunction:: model_compression_toolkit.data_generation.keras_data_generation_experimental diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_gradient_post_training_quantization_experimental.rst b/docsrc/source/api/experimental_api_docs/methods/keras_gradient_post_training_quantization_experimental.rst index fa99048f1..afd2eabf6 100644 --- a/docsrc/source/api/experimental_api_docs/methods/keras_gradient_post_training_quantization_experimental.rst +++ b/docsrc/source/api/experimental_api_docs/methods/keras_gradient_post_training_quantization_experimental.rst @@ -1,10 +1,10 @@ :orphan: -.. _ug-keras_gradient_post_training_quantization_experimental: +.. _ug-keras_gradient_post_training_quantization: ================================================ Keras Gradient Based Post Training Quantization ================================================ -.. autofunction:: model_compression_toolkit.gptq.keras_gradient_post_training_quantization_experimental +.. autofunction:: model_compression_toolkit.gptq.keras_gradient_post_training_quantization diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_kpi_data_experimental.rst b/docsrc/source/api/experimental_api_docs/methods/keras_kpi_data_experimental.rst index 608808bca..a0205814f 100644 --- a/docsrc/source/api/experimental_api_docs/methods/keras_kpi_data_experimental.rst +++ b/docsrc/source/api/experimental_api_docs/methods/keras_kpi_data_experimental.rst @@ -1,10 +1,10 @@ :orphan: -.. _ug-keras_kpi_data_experimental: +.. _ug-keras_kpi_data: ======================================= Get KPI information for Keras Models ======================================= -.. autofunction:: model_compression_toolkit.core.keras_kpi_data_experimental +.. autofunction:: model_compression_toolkit.core.keras_kpi_data diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_post_training_quantization_experimental.rst b/docsrc/source/api/experimental_api_docs/methods/keras_post_training_quantization_experimental.rst index ca1e912ee..82a351716 100644 --- a/docsrc/source/api/experimental_api_docs/methods/keras_post_training_quantization_experimental.rst +++ b/docsrc/source/api/experimental_api_docs/methods/keras_post_training_quantization_experimental.rst @@ -1,10 +1,10 @@ :orphan: -.. _ug-keras_post_training_quantization_experimental: +.. _ug-keras_post_training_quantization: ================================= Keras Post Training Quantization ================================= -.. autofunction:: model_compression_toolkit.ptq.keras_post_training_quantization_experimental +.. autofunction:: model_compression_toolkit.ptq.keras_post_training_quantization diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_quantization_aware_training_finalize.rst b/docsrc/source/api/experimental_api_docs/methods/keras_quantization_aware_training_finalize.rst index 1e2bac84a..54ff74a3f 100644 --- a/docsrc/source/api/experimental_api_docs/methods/keras_quantization_aware_training_finalize.rst +++ b/docsrc/source/api/experimental_api_docs/methods/keras_quantization_aware_training_finalize.rst @@ -1,10 +1,10 @@ :orphan: -.. _ug-keras_quantization_aware_training_finalize: +.. _ug-keras_quantization_aware_training_finalize_experimental: ================================================ Keras Quantization Aware Training Model Finalize ================================================ -.. autofunction:: model_compression_toolkit.qat.keras_quantization_aware_training_finalize +.. 
autofunction:: model_compression_toolkit.qat.keras_quantization_aware_training_finalize_experimental diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_quantization_aware_training_init.rst b/docsrc/source/api/experimental_api_docs/methods/keras_quantization_aware_training_init.rst index f055e1621..b89c3367e 100644 --- a/docsrc/source/api/experimental_api_docs/methods/keras_quantization_aware_training_init.rst +++ b/docsrc/source/api/experimental_api_docs/methods/keras_quantization_aware_training_init.rst @@ -1,10 +1,10 @@ :orphan: -.. _ug-keras_quantization_aware_training_init: +.. _ug-keras_quantization_aware_training_init_experimental: ================================================ Keras Quantization Aware Training Model Init ================================================ -.. autofunction:: model_compression_toolkit.qat.keras_quantization_aware_training_init +.. autofunction:: model_compression_toolkit.qat.keras_quantization_aware_training_init_experimental diff --git a/docsrc/source/api/experimental_api_docs/methods/pytorch_gradient_post_training_quantization_experimental.rst b/docsrc/source/api/experimental_api_docs/methods/pytorch_gradient_post_training_quantization_experimental.rst index 4c30d210b..95dcf10f0 100644 --- a/docsrc/source/api/experimental_api_docs/methods/pytorch_gradient_post_training_quantization_experimental.rst +++ b/docsrc/source/api/experimental_api_docs/methods/pytorch_gradient_post_training_quantization_experimental.rst @@ -1,10 +1,10 @@ :orphan: -.. _ug-pytorch_gradient_post_training_quantization_experimental: +.. _ug-pytorch_gradient_post_training_quantization: ==================================================== Pytorch Gradient Based Post Training Quantization ==================================================== -.. autofunction:: model_compression_toolkit.gptq.pytorch_gradient_post_training_quantization_experimental +.. autofunction:: model_compression_toolkit.gptq.pytorch_gradient_post_training_quantization diff --git a/docsrc/source/api/experimental_api_docs/methods/pytorch_kpi_data_experimental.rst b/docsrc/source/api/experimental_api_docs/methods/pytorch_kpi_data_experimental.rst index 155a7e1c0..86f512eae 100644 --- a/docsrc/source/api/experimental_api_docs/methods/pytorch_kpi_data_experimental.rst +++ b/docsrc/source/api/experimental_api_docs/methods/pytorch_kpi_data_experimental.rst @@ -1,10 +1,10 @@ :orphan: -.. _ug-pytorch_kpi_data_experimental: +.. _ug-pytorch_kpi_data: ======================================= Get KPI information for PyTorch Models ======================================= -.. autofunction:: model_compression_toolkit.core.pytorch_kpi_data_experimental +.. autofunction:: model_compression_toolkit.core.pytorch_kpi_data diff --git a/docsrc/source/api/experimental_api_docs/methods/pytorch_post_training_quantization_experimental.rst b/docsrc/source/api/experimental_api_docs/methods/pytorch_post_training_quantization_experimental.rst index 48fcdfa6f..46feca7ba 100644 --- a/docsrc/source/api/experimental_api_docs/methods/pytorch_post_training_quantization_experimental.rst +++ b/docsrc/source/api/experimental_api_docs/methods/pytorch_post_training_quantization_experimental.rst @@ -1,10 +1,10 @@ :orphan: -.. _ug-pytorch_post_training_quantization_experimental: +.. _ug-pytorch_post_training_quantization: ===================================== Pytorch Post Training Quantization ===================================== -.. autofunction:: model_compression_toolkit.ptq.pytorch_post_training_quantization_experimental +.. 
autofunction:: model_compression_toolkit.ptq.pytorch_post_training_quantization diff --git a/docsrc/source/api/experimental_api_docs/methods/pytorch_quantization_aware_training_finalize.rst b/docsrc/source/api/experimental_api_docs/methods/pytorch_quantization_aware_training_finalize.rst index b1e5dcd8c..e391be8d7 100644 --- a/docsrc/source/api/experimental_api_docs/methods/pytorch_quantization_aware_training_finalize.rst +++ b/docsrc/source/api/experimental_api_docs/methods/pytorch_quantization_aware_training_finalize.rst @@ -1,10 +1,10 @@ :orphan: -.. _ug-pytorch_quantization_aware_training_finalize: +.. _ug-pytorch_quantization_aware_training_finalize_experimental: =================================================== PyTorch Quantization Aware Training Model Finalize =================================================== -.. autofunction:: model_compression_toolkit.qat.pytorch_quantization_aware_training_finalize +.. autofunction:: model_compression_toolkit.qat.pytorch_quantization_aware_training_finalize_experimental diff --git a/docsrc/source/api/experimental_api_docs/methods/pytorch_quantization_aware_training_init.rst b/docsrc/source/api/experimental_api_docs/methods/pytorch_quantization_aware_training_init.rst index 899379d6b..4e14c7478 100644 --- a/docsrc/source/api/experimental_api_docs/methods/pytorch_quantization_aware_training_init.rst +++ b/docsrc/source/api/experimental_api_docs/methods/pytorch_quantization_aware_training_init.rst @@ -1,10 +1,10 @@ :orphan: -.. _ug-pytorch_quantization_aware_training_init: +.. _ug-pytorch_quantization_aware_training_init_experimental: ================================================ PyTorch Quantization Aware Training Model Init ================================================ -.. autofunction:: model_compression_toolkit.qat.pytorch_quantization_aware_training_init +.. autofunction:: model_compression_toolkit.qat.pytorch_quantization_aware_training_init_experimental diff --git a/docsrc/source/api/experimental_api_docs/modules/debug_config.rst b/docsrc/source/api/experimental_api_docs/modules/debug_config.rst index f1da2735b..16654f433 100644 --- a/docsrc/source/api/experimental_api_docs/modules/debug_config.rst +++ b/docsrc/source/api/experimental_api_docs/modules/debug_config.rst @@ -12,6 +12,6 @@ DebugConfig ========================== **Class to configure params for debugging purposes:** -.. autoclass:: model_compression_toolkit.DebugConfig +.. autoclass:: model_compression_toolkit.core.DebugConfig diff --git a/docsrc/source/api/experimental_api_docs/modules/mixed_precision_quantization_config.rst b/docsrc/source/api/experimental_api_docs/modules/mixed_precision_quantization_config.rst index 996479716..f3d6aba8c 100644 --- a/docsrc/source/api/experimental_api_docs/modules/mixed_precision_quantization_config.rst +++ b/docsrc/source/api/experimental_api_docs/modules/mixed_precision_quantization_config.rst @@ -12,7 +12,7 @@ KPI ================================ **Object to configure resources to use when searching for a mixed-precision configuration for a model:** -.. autoclass:: model_compression_toolkit.KPI +.. autoclass:: model_compression_toolkit.core.KPI | @@ -22,5 +22,5 @@ MixedPrecisionQuantizationConfigV2 =================================== **Class to configure the quantization process of the model when quantizing in mixed-precision:** -.. autoclass:: model_compression_toolkit.core.MixedPrecisionQuantizationConfigV2 +.. 
autoclass:: model_compression_toolkit.core.MixedPrecisionQuantizationConfig diff --git a/docsrc/source/api/experimental_api_docs/modules/network_editor.rst b/docsrc/source/api/experimental_api_docs/modules/network_editor.rst index a97594e39..8df62a390 100644 --- a/docsrc/source/api/experimental_api_docs/modules/network_editor.rst +++ b/docsrc/source/api/experimental_api_docs/modules/network_editor.rst @@ -11,52 +11,52 @@ network_editor Module EditRule ========== -.. autoclass:: model_compression_toolkit.network_editor.EditRule +.. autoclass:: model_compression_toolkit.core.network_editor.EditRule Filters ========== -.. autoclass:: model_compression_toolkit.network_editor.NodeTypeFilter +.. autoclass:: model_compression_toolkit.core.network_editor.NodeTypeFilter | -.. autoclass:: model_compression_toolkit.network_editor.NodeNameFilter +.. autoclass:: model_compression_toolkit.core.network_editor.NodeNameFilter | -.. autoclass:: model_compression_toolkit.network_editor.NodeNameScopeFilter +.. autoclass:: model_compression_toolkit.core.network_editor.NodeNameScopeFilter Actions ========== -.. autoclass:: model_compression_toolkit.network_editor.ChangeFinalWeightsQuantConfigAttr +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeFinalWeightsQuantConfigAttr | -.. autoclass:: model_compression_toolkit.network_editor.ChangeCandidatesWeightsQuantConfigAttr +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeCandidatesWeightsQuantConfigAttr | -.. autoclass:: model_compression_toolkit.network_editor.ChangeFinalActivationQuantConfigAttr +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeFinalActivationQuantConfigAttr | -.. autoclass:: model_compression_toolkit.network_editor.ChangeCandidatesActivationQuantConfigAttr +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeCandidatesActivationQuantConfigAttr | -.. autoclass:: model_compression_toolkit.network_editor.ChangeQuantizationParamFunction +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeQuantizationParamFunction | -.. autoclass:: model_compression_toolkit.network_editor.ChangeFinalWeightsQuantizationMethod +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeFinalWeightsQuantizationMethod | -.. autoclass:: model_compression_toolkit.network_editor.ChangeCandidatesWeightsQuantizationMethod +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeCandidatesWeightsQuantizationMethod | -.. autoclass:: model_compression_toolkit.network_editor.ChangeCandidatesActivationQuantizationMethod +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeCandidatesActivationQuantizationMethod diff --git a/docsrc/source/api/experimental_api_docs/modules/quantization_config.rst b/docsrc/source/api/experimental_api_docs/modules/quantization_config.rst index 68b9599eb..7997f6f1b 100644 --- a/docsrc/source/api/experimental_api_docs/modules/quantization_config.rst +++ b/docsrc/source/api/experimental_api_docs/modules/quantization_config.rst @@ -11,7 +11,7 @@ QuantizationErrorMethod ========================== **Enum to select a method for quantization parameters' selection:** -.. autoclass:: model_compression_toolkit.QuantizationErrorMethod +.. autoclass:: model_compression_toolkit.core.QuantizationErrorMethod | @@ -21,5 +21,5 @@ QuantizationConfig ========================== **Class to configure the quantization process of the model:** -.. autoclass:: model_compression_toolkit.QuantizationConfig +.. 
autoclass:: model_compression_toolkit.core.QuantizationConfig From 0e242ac2948c6078df1311a239031a57173657e4 Mon Sep 17 00:00:00 2001 From: reuvenp Date: Thu, 7 Mar 2024 17:52:05 +0200 Subject: [PATCH 3/9] update docsrc --- .../classes/DefaultDict.rst | 0 .../classes/FolderImageLoader.rst | 0 .../classes/FrameworkInfo.rst | 0 .../classes/GradientPTQConfig.rst | 0 .../api/api_docs/classes/PruningConfig.rst | 9 +++ .../api/api_docs/classes/PruningInfo.rst | 10 +++ docsrc/source/api/api_docs/index.rst | 54 ++++++++++---- .../get_keras_data_generation_config.rst | 0 .../methods/get_keras_gptq_config.rst | 0 .../get_pytorch_data_generation_config.rst | 0 .../methods/get_pytroch_gptq_config.rst | 0 .../get_target_platform_capabilities.rst | 0 .../keras_data_generation_experimental.rst | 0 ...ost_training_quantization_experimental.rst | 0 .../api/api_docs/methods/keras_kpi_data.rst | 10 --- .../methods/keras_kpi_data_experimental.rst | 0 .../methods/keras_load_quantizad_model.rst | 0 .../keras_post_training_quantization.rst | 10 --- ...ost_training_quantization_experimental.rst | 0 .../methods/keras_pruning_experimental.rst | 12 ++++ ...s_quantization_aware_training_finalize.rst | 0 ...keras_quantization_aware_training_init.rst | 0 .../pytorch_data_generation_experimental.rst | 0 ...ost_training_quantization_experimental.rst | 0 .../api/api_docs/methods/pytorch_kpi_data.rst | 10 --- .../methods/pytorch_kpi_data_experimental.rst | 0 .../pytorch_post_training_quantization.rst | 10 --- ...ost_training_quantization_experimental.rst | 0 .../methods/pytorch_pruning_experimental.rst | 15 ++++ ...h_quantization_aware_training_finalize.rst | 0 ...torch_quantization_aware_training_init.rst | 0 .../methods/set_logger_path.rst | 0 .../modules/core_config.rst | 0 .../modules/debug_config.rst | 0 .../modules/exporter.rst | 0 .../modules/layer_filters.rst | 0 .../mixed_precision_quantization_config.rst | 11 ++- .../modules/network_editor.rst | 0 .../modules/qat_config.rst | 0 .../modules/quantization_config.rst | 0 .../modules/target_platform.rst | 0 .../modules/trainable_infrastructure.rst | 0 .../notes/experimental_api_note.rst | 0 .../notes/tpc_note.rst | 0 .../api/experimental_api_docs/index.rst | 70 ------------------- .../methods/keras_pruning_experimental.rst | 25 ------- .../methods/pytorch_pruning_experimental.rst | 25 ------- .../mixed_precision_quantization_config.rst | 26 ------- docsrc/source/index.rst | 26 +++---- 49 files changed, 105 insertions(+), 218 deletions(-) rename docsrc/source/api/{experimental_api_docs => api_docs}/classes/DefaultDict.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/classes/FolderImageLoader.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/classes/FrameworkInfo.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/classes/GradientPTQConfig.rst (100%) create mode 100644 docsrc/source/api/api_docs/classes/PruningConfig.rst create mode 100644 docsrc/source/api/api_docs/classes/PruningInfo.rst rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/get_keras_data_generation_config.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/get_keras_gptq_config.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/get_pytorch_data_generation_config.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/get_pytroch_gptq_config.rst (100%) rename docsrc/source/api/{experimental_api_docs => 
api_docs}/methods/get_target_platform_capabilities.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/keras_data_generation_experimental.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/keras_gradient_post_training_quantization_experimental.rst (100%) delete mode 100644 docsrc/source/api/api_docs/methods/keras_kpi_data.rst rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/keras_kpi_data_experimental.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/keras_load_quantizad_model.rst (100%) delete mode 100644 docsrc/source/api/api_docs/methods/keras_post_training_quantization.rst rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/keras_post_training_quantization_experimental.rst (100%) create mode 100644 docsrc/source/api/api_docs/methods/keras_pruning_experimental.rst rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/keras_quantization_aware_training_finalize.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/keras_quantization_aware_training_init.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/pytorch_data_generation_experimental.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/pytorch_gradient_post_training_quantization_experimental.rst (100%) delete mode 100644 docsrc/source/api/api_docs/methods/pytorch_kpi_data.rst rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/pytorch_kpi_data_experimental.rst (100%) delete mode 100644 docsrc/source/api/api_docs/methods/pytorch_post_training_quantization.rst rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/pytorch_post_training_quantization_experimental.rst (100%) create mode 100644 docsrc/source/api/api_docs/methods/pytorch_pruning_experimental.rst rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/pytorch_quantization_aware_training_finalize.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/pytorch_quantization_aware_training_init.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/methods/set_logger_path.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/modules/core_config.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/modules/debug_config.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/modules/exporter.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/modules/layer_filters.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/modules/network_editor.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/modules/qat_config.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/modules/quantization_config.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/modules/target_platform.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/modules/trainable_infrastructure.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/notes/experimental_api_note.rst (100%) rename docsrc/source/api/{experimental_api_docs => api_docs}/notes/tpc_note.rst (100%) delete mode 100644 docsrc/source/api/experimental_api_docs/index.rst delete mode 100644 docsrc/source/api/experimental_api_docs/methods/keras_pruning_experimental.rst delete mode 100644 docsrc/source/api/experimental_api_docs/methods/pytorch_pruning_experimental.rst delete mode 
100644 docsrc/source/api/experimental_api_docs/modules/mixed_precision_quantization_config.rst diff --git a/docsrc/source/api/experimental_api_docs/classes/DefaultDict.rst b/docsrc/source/api/api_docs/classes/DefaultDict.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/classes/DefaultDict.rst rename to docsrc/source/api/api_docs/classes/DefaultDict.rst diff --git a/docsrc/source/api/experimental_api_docs/classes/FolderImageLoader.rst b/docsrc/source/api/api_docs/classes/FolderImageLoader.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/classes/FolderImageLoader.rst rename to docsrc/source/api/api_docs/classes/FolderImageLoader.rst diff --git a/docsrc/source/api/experimental_api_docs/classes/FrameworkInfo.rst b/docsrc/source/api/api_docs/classes/FrameworkInfo.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/classes/FrameworkInfo.rst rename to docsrc/source/api/api_docs/classes/FrameworkInfo.rst diff --git a/docsrc/source/api/experimental_api_docs/classes/GradientPTQConfig.rst b/docsrc/source/api/api_docs/classes/GradientPTQConfig.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/classes/GradientPTQConfig.rst rename to docsrc/source/api/api_docs/classes/GradientPTQConfig.rst diff --git a/docsrc/source/api/api_docs/classes/PruningConfig.rst b/docsrc/source/api/api_docs/classes/PruningConfig.rst new file mode 100644 index 000000000..0b57b743a --- /dev/null +++ b/docsrc/source/api/api_docs/classes/PruningConfig.rst @@ -0,0 +1,9 @@ +:orphan: + +.. _ug-PruningConfig: + +================================================ +Pruning Configuration +================================================ + +.. autofunction:: model_compression_toolkit.pruning.PruningConfig \ No newline at end of file diff --git a/docsrc/source/api/api_docs/classes/PruningInfo.rst b/docsrc/source/api/api_docs/classes/PruningInfo.rst new file mode 100644 index 000000000..7bd02336c --- /dev/null +++ b/docsrc/source/api/api_docs/classes/PruningInfo.rst @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-PruningInfo: + +================================================ +Pruning Information +================================================ + +.. autofunction:: model_compression_toolkit.pruning.PruningInfo + diff --git a/docsrc/source/api/api_docs/index.rst b/docsrc/source/api/api_docs/index.rst index 28f078466..072f21f1e 100644 --- a/docsrc/source/api/api_docs/index.rst +++ b/docsrc/source/api/api_docs/index.rst @@ -7,8 +7,6 @@ API Docs ========= -.. note:: This API will be removed in future releases. Please switch to the :ref:`new API` - **Init module for MCT API.** .. code-block:: python @@ -17,30 +15,60 @@ API Docs | +.. include:: ./notes/experimental_api_note.rst + +| + + Functions ========= -- :ref:`pytorch_post_training_quantization`: Function to use for post training quantization of Pytorch models. -- :ref:`pytorch_post_training_quantization_mixed_precision`: Function to use for mixed-precision post training quantization of Pytorch models (experimental). -- :ref:`keras_post_training_quantization`: Function to use for post training quantization of Keras models. -- :ref:`keras_post_training_quantization_mixed_precision`: Function to use for mixed-precision post training quantization of Keras models (experimental). -- :ref:`get_keras_gptq_config`: Function to create a GradientPTQConfig instance to use for Keras models when using GPTQ (experimental). 
-- :ref:`get_target_platform_capabilities`: Function to get a target platform model for Tensorflow and Pytorch. -- :ref:`keras_kpi_data`: Function to compute KPI data that can be used to calculate the desired target KPI for mixed-precision quantization of Keras models. -- :ref:`pytorch_kpi_data`: Function to compute KPI data that can be used to calculate the desired target KPI for mixed-precision quantization of PyTorch models. +- :ref:`pytorch_post_training_quantization`: A function to use for post training quantization of PyTorch models. +- :ref:`keras_post_training_quantization`: A function to use for post training quantization of Keras models. + +- :ref:`keras_gradient_post_training_quantization`: A function to use for gradient-based post training quantization of Keras models. +- :ref:`get_keras_gptq_config`: A function to create a GradientPTQConfig instance to use for Keras models when using GPTQ. + +- :ref:`pytorch_gradient_post_training_quantization`: A function to use for gradient-based post training quantization of Pytorch models. +- :ref:`get_pytorch_gptq_config`: A function to create a GradientPTQConfig instance to use for Pytorch models when using GPTQ. + +- :ref:`keras_quantization_aware_training_init`: A function to use for preparing a model for Quantization Aware Training (Experimental) +- :ref:`keras_quantization_aware_training_finalize`: A function to finalize a model after Quantization Aware Training to a model without QuantizeWrappers (Experimental) + +- :ref:`keras_data_generation_experimental`: A function to generate data for a Keras model (experimental). +- :ref:`get_keras_data_generation_config`: A function to generate a DataGenerationConfig for Tensorflow data generation(experimental). + +- :ref:`pytorch_data_generation_experimental`: A function to generate data for a Pytorch model (experimental). +- :ref:`get_pytorch_data_generation_config`: A function to load a DataGenerationConfig for Pytorch data generation (experimental). + +- :ref:`keras_pruning_experimental`: A function to apply structured pruning for Keras models (experimental). +- :ref:`pytorch_pruning_experimental`: A function to apply structured pruning for Pytorch models (experimental). + +- :ref:`keras_kpi_data`: A function to compute KPI data that can be used to calculate the desired target KPI for mixed-precision quantization of Keras models. +- :ref:`pytorch_kpi_data`: A function to compute KPI data that can be used to calculate the desired target KPI for mixed-precision quantization of PyTorch models. + +- :ref:`get_target_platform_capabilities`: A function to get a target platform model for Tensorflow and Pytorch. +- :ref:`keras_load_quantized_model`: A function to load a quantized keras model. Modules ========= +- :ref:`core_config`: Module to contain configurations of the optimization process. - :ref:`quantization_config`: Module to configure the quantization process. -- :ref:`mixed_precision_quantization_config`: Module to configure the quantization process when using mixed-precision PTQ. -- :ref:`network_editor`: Module to edit your model during the quantization process. +- :ref:`mixed_precision_quantization_config`: Module to configure the quantization process when using mixed-precision PTQ. +- :ref:`debug_config`: Module to configure options for debugging the optimization process. - :ref:`target_platform`: Module to create and model hardware-related settings to optimize the model according to, by the hardware the optimized model will use during inference. 
+- :ref:`qat_config`: Module to create quantization configuration for Quantization-aware Training. +- :ref:`exporter`: Module that enables to export a quantized model in different serialization formats. +- :ref:`trainable_infrastructure`: Module that contains quantization abstraction and quantizers for hardware-oriented model optimization tools. Classes ========= -- :ref:`GradientPTQConfig`: Class to configure GradientPTQC options for gradient based post training quantization. +- :ref:`GradientPTQConfig`: Class to configure GradientPTQ options for gradient based post training quantization. - :ref:`FolderImageLoader`: Class to use an images directory as a representative dataset. - :ref:`FrameworkInfo`: Class to wrap framework information to be used by MCT when optimizing models. +- :ref:`PruningConfig`: PruningConfig +- :ref:`PruningInfo`: PruningInfo + Indices and tables ================== diff --git a/docsrc/source/api/experimental_api_docs/methods/get_keras_data_generation_config.rst b/docsrc/source/api/api_docs/methods/get_keras_data_generation_config.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/get_keras_data_generation_config.rst rename to docsrc/source/api/api_docs/methods/get_keras_data_generation_config.rst diff --git a/docsrc/source/api/experimental_api_docs/methods/get_keras_gptq_config.rst b/docsrc/source/api/api_docs/methods/get_keras_gptq_config.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/get_keras_gptq_config.rst rename to docsrc/source/api/api_docs/methods/get_keras_gptq_config.rst diff --git a/docsrc/source/api/experimental_api_docs/methods/get_pytorch_data_generation_config.rst b/docsrc/source/api/api_docs/methods/get_pytorch_data_generation_config.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/get_pytorch_data_generation_config.rst rename to docsrc/source/api/api_docs/methods/get_pytorch_data_generation_config.rst diff --git a/docsrc/source/api/experimental_api_docs/methods/get_pytroch_gptq_config.rst b/docsrc/source/api/api_docs/methods/get_pytroch_gptq_config.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/get_pytroch_gptq_config.rst rename to docsrc/source/api/api_docs/methods/get_pytroch_gptq_config.rst diff --git a/docsrc/source/api/experimental_api_docs/methods/get_target_platform_capabilities.rst b/docsrc/source/api/api_docs/methods/get_target_platform_capabilities.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/get_target_platform_capabilities.rst rename to docsrc/source/api/api_docs/methods/get_target_platform_capabilities.rst diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_data_generation_experimental.rst b/docsrc/source/api/api_docs/methods/keras_data_generation_experimental.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/keras_data_generation_experimental.rst rename to docsrc/source/api/api_docs/methods/keras_data_generation_experimental.rst diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_gradient_post_training_quantization_experimental.rst b/docsrc/source/api/api_docs/methods/keras_gradient_post_training_quantization_experimental.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/keras_gradient_post_training_quantization_experimental.rst rename to docsrc/source/api/api_docs/methods/keras_gradient_post_training_quantization_experimental.rst diff --git 
a/docsrc/source/api/api_docs/methods/keras_kpi_data.rst b/docsrc/source/api/api_docs/methods/keras_kpi_data.rst deleted file mode 100644 index a0205814f..000000000 --- a/docsrc/source/api/api_docs/methods/keras_kpi_data.rst +++ /dev/null @@ -1,10 +0,0 @@ -:orphan: - -.. _ug-keras_kpi_data: - - -======================================= -Get KPI information for Keras Models -======================================= - -.. autofunction:: model_compression_toolkit.core.keras_kpi_data diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_kpi_data_experimental.rst b/docsrc/source/api/api_docs/methods/keras_kpi_data_experimental.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/keras_kpi_data_experimental.rst rename to docsrc/source/api/api_docs/methods/keras_kpi_data_experimental.rst diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_load_quantizad_model.rst b/docsrc/source/api/api_docs/methods/keras_load_quantizad_model.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/keras_load_quantizad_model.rst rename to docsrc/source/api/api_docs/methods/keras_load_quantizad_model.rst diff --git a/docsrc/source/api/api_docs/methods/keras_post_training_quantization.rst b/docsrc/source/api/api_docs/methods/keras_post_training_quantization.rst deleted file mode 100644 index 82a351716..000000000 --- a/docsrc/source/api/api_docs/methods/keras_post_training_quantization.rst +++ /dev/null @@ -1,10 +0,0 @@ -:orphan: - -.. _ug-keras_post_training_quantization: - - -================================= -Keras Post Training Quantization -================================= - -.. autofunction:: model_compression_toolkit.ptq.keras_post_training_quantization diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_post_training_quantization_experimental.rst b/docsrc/source/api/api_docs/methods/keras_post_training_quantization_experimental.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/keras_post_training_quantization_experimental.rst rename to docsrc/source/api/api_docs/methods/keras_post_training_quantization_experimental.rst diff --git a/docsrc/source/api/api_docs/methods/keras_pruning_experimental.rst b/docsrc/source/api/api_docs/methods/keras_pruning_experimental.rst new file mode 100644 index 000000000..508a11e47 --- /dev/null +++ b/docsrc/source/api/api_docs/methods/keras_pruning_experimental.rst @@ -0,0 +1,12 @@ +:orphan: + +.. _ug-keras_pruning_experimental: + + +================================================ +Keras Structured Pruning +================================================ + +.. 
autofunction:: model_compression_toolkit.pruning.keras_pruning_experimental + + diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_quantization_aware_training_finalize.rst b/docsrc/source/api/api_docs/methods/keras_quantization_aware_training_finalize.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/keras_quantization_aware_training_finalize.rst rename to docsrc/source/api/api_docs/methods/keras_quantization_aware_training_finalize.rst diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_quantization_aware_training_init.rst b/docsrc/source/api/api_docs/methods/keras_quantization_aware_training_init.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/keras_quantization_aware_training_init.rst rename to docsrc/source/api/api_docs/methods/keras_quantization_aware_training_init.rst diff --git a/docsrc/source/api/experimental_api_docs/methods/pytorch_data_generation_experimental.rst b/docsrc/source/api/api_docs/methods/pytorch_data_generation_experimental.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/pytorch_data_generation_experimental.rst rename to docsrc/source/api/api_docs/methods/pytorch_data_generation_experimental.rst diff --git a/docsrc/source/api/experimental_api_docs/methods/pytorch_gradient_post_training_quantization_experimental.rst b/docsrc/source/api/api_docs/methods/pytorch_gradient_post_training_quantization_experimental.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/pytorch_gradient_post_training_quantization_experimental.rst rename to docsrc/source/api/api_docs/methods/pytorch_gradient_post_training_quantization_experimental.rst diff --git a/docsrc/source/api/api_docs/methods/pytorch_kpi_data.rst b/docsrc/source/api/api_docs/methods/pytorch_kpi_data.rst deleted file mode 100644 index 86f512eae..000000000 --- a/docsrc/source/api/api_docs/methods/pytorch_kpi_data.rst +++ /dev/null @@ -1,10 +0,0 @@ -:orphan: - -.. _ug-pytorch_kpi_data: - - -======================================= -Get KPI information for PyTorch Models -======================================= - -.. autofunction:: model_compression_toolkit.core.pytorch_kpi_data diff --git a/docsrc/source/api/experimental_api_docs/methods/pytorch_kpi_data_experimental.rst b/docsrc/source/api/api_docs/methods/pytorch_kpi_data_experimental.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/pytorch_kpi_data_experimental.rst rename to docsrc/source/api/api_docs/methods/pytorch_kpi_data_experimental.rst diff --git a/docsrc/source/api/api_docs/methods/pytorch_post_training_quantization.rst b/docsrc/source/api/api_docs/methods/pytorch_post_training_quantization.rst deleted file mode 100644 index 46feca7ba..000000000 --- a/docsrc/source/api/api_docs/methods/pytorch_post_training_quantization.rst +++ /dev/null @@ -1,10 +0,0 @@ -:orphan: - -.. _ug-pytorch_post_training_quantization: - - -===================================== -Pytorch Post Training Quantization -===================================== - -.. 
autofunction:: model_compression_toolkit.ptq.pytorch_post_training_quantization diff --git a/docsrc/source/api/experimental_api_docs/methods/pytorch_post_training_quantization_experimental.rst b/docsrc/source/api/api_docs/methods/pytorch_post_training_quantization_experimental.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/pytorch_post_training_quantization_experimental.rst rename to docsrc/source/api/api_docs/methods/pytorch_post_training_quantization_experimental.rst diff --git a/docsrc/source/api/api_docs/methods/pytorch_pruning_experimental.rst b/docsrc/source/api/api_docs/methods/pytorch_pruning_experimental.rst new file mode 100644 index 000000000..4f050cfe4 --- /dev/null +++ b/docsrc/source/api/api_docs/methods/pytorch_pruning_experimental.rst @@ -0,0 +1,15 @@ +:orphan: + +.. _ug-pytorch_pruning_experimental: + + +================================================ +Pytorch Structured Pruning +================================================ + +.. autofunction:: model_compression_toolkit.pruning.pytorch_pruning_experimental + + + + + diff --git a/docsrc/source/api/experimental_api_docs/methods/pytorch_quantization_aware_training_finalize.rst b/docsrc/source/api/api_docs/methods/pytorch_quantization_aware_training_finalize.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/pytorch_quantization_aware_training_finalize.rst rename to docsrc/source/api/api_docs/methods/pytorch_quantization_aware_training_finalize.rst diff --git a/docsrc/source/api/experimental_api_docs/methods/pytorch_quantization_aware_training_init.rst b/docsrc/source/api/api_docs/methods/pytorch_quantization_aware_training_init.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/pytorch_quantization_aware_training_init.rst rename to docsrc/source/api/api_docs/methods/pytorch_quantization_aware_training_init.rst diff --git a/docsrc/source/api/experimental_api_docs/methods/set_logger_path.rst b/docsrc/source/api/api_docs/methods/set_logger_path.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/methods/set_logger_path.rst rename to docsrc/source/api/api_docs/methods/set_logger_path.rst diff --git a/docsrc/source/api/experimental_api_docs/modules/core_config.rst b/docsrc/source/api/api_docs/modules/core_config.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/modules/core_config.rst rename to docsrc/source/api/api_docs/modules/core_config.rst diff --git a/docsrc/source/api/experimental_api_docs/modules/debug_config.rst b/docsrc/source/api/api_docs/modules/debug_config.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/modules/debug_config.rst rename to docsrc/source/api/api_docs/modules/debug_config.rst diff --git a/docsrc/source/api/experimental_api_docs/modules/exporter.rst b/docsrc/source/api/api_docs/modules/exporter.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/modules/exporter.rst rename to docsrc/source/api/api_docs/modules/exporter.rst diff --git a/docsrc/source/api/experimental_api_docs/modules/layer_filters.rst b/docsrc/source/api/api_docs/modules/layer_filters.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/modules/layer_filters.rst rename to docsrc/source/api/api_docs/modules/layer_filters.rst diff --git a/docsrc/source/api/api_docs/modules/mixed_precision_quantization_config.rst b/docsrc/source/api/api_docs/modules/mixed_precision_quantization_config.rst index 
4745b0b69..f3d6aba8c 100644 --- a/docsrc/source/api/api_docs/modules/mixed_precision_quantization_config.rst +++ b/docsrc/source/api/api_docs/modules/mixed_precision_quantization_config.rst @@ -1,11 +1,11 @@ :orphan: -.. _ug-mixed_precision_quantization_config: +.. _ug-mixed_precision_quantization_config_v2: -=========================================== +=========================================================== mixed_precision_quantization_config Module -=========================================== +=========================================================== KPI @@ -13,14 +13,13 @@ KPI **Object to configure resources to use when searching for a mixed-precision configuration for a model:** .. autoclass:: model_compression_toolkit.core.KPI - :noindex: | -MixedPrecisionQuantizationConfig -================================= +MixedPrecisionQuantizationConfigV2 +=================================== **Class to configure the quantization process of the model when quantizing in mixed-precision:** .. autoclass:: model_compression_toolkit.core.MixedPrecisionQuantizationConfig diff --git a/docsrc/source/api/experimental_api_docs/modules/network_editor.rst b/docsrc/source/api/api_docs/modules/network_editor.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/modules/network_editor.rst rename to docsrc/source/api/api_docs/modules/network_editor.rst diff --git a/docsrc/source/api/experimental_api_docs/modules/qat_config.rst b/docsrc/source/api/api_docs/modules/qat_config.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/modules/qat_config.rst rename to docsrc/source/api/api_docs/modules/qat_config.rst diff --git a/docsrc/source/api/experimental_api_docs/modules/quantization_config.rst b/docsrc/source/api/api_docs/modules/quantization_config.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/modules/quantization_config.rst rename to docsrc/source/api/api_docs/modules/quantization_config.rst diff --git a/docsrc/source/api/experimental_api_docs/modules/target_platform.rst b/docsrc/source/api/api_docs/modules/target_platform.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/modules/target_platform.rst rename to docsrc/source/api/api_docs/modules/target_platform.rst diff --git a/docsrc/source/api/experimental_api_docs/modules/trainable_infrastructure.rst b/docsrc/source/api/api_docs/modules/trainable_infrastructure.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/modules/trainable_infrastructure.rst rename to docsrc/source/api/api_docs/modules/trainable_infrastructure.rst diff --git a/docsrc/source/api/experimental_api_docs/notes/experimental_api_note.rst b/docsrc/source/api/api_docs/notes/experimental_api_note.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/notes/experimental_api_note.rst rename to docsrc/source/api/api_docs/notes/experimental_api_note.rst diff --git a/docsrc/source/api/experimental_api_docs/notes/tpc_note.rst b/docsrc/source/api/api_docs/notes/tpc_note.rst similarity index 100% rename from docsrc/source/api/experimental_api_docs/notes/tpc_note.rst rename to docsrc/source/api/api_docs/notes/tpc_note.rst diff --git a/docsrc/source/api/experimental_api_docs/index.rst b/docsrc/source/api/experimental_api_docs/index.rst deleted file mode 100644 index 12e023554..000000000 --- a/docsrc/source/api/experimental_api_docs/index.rst +++ /dev/null @@ -1,70 +0,0 @@ -:orphan: - -.. 
_ug-experimental_api_docs: - - -========= -API Docs -========= - -**Init module for MCT API.** - -.. code-block:: python - - import model_compression_toolkit as mct - -| - -.. include:: ./notes/experimental_api_note.rst - -| - - -Functions -========= -- :ref:`pytorch_post_training_quantization_experimental`: A function to use for post training quantization of PyTorch models (experimental). -- :ref:`keras_post_training_quantization_experimental`: A function to use for post training quantization of Keras models (experimental). -- :ref:`keras_gradient_post_training_quantization_experimental`: A function to use for gradient-based post training quantization of Keras models (experimental). -- :ref:`pytorch_gradient_post_training_quantization_experimental`: A function to use for gradient-based post training quantization of Pytorch models (experimental). -- :ref:`keras_quantization_aware_training_init`: A function to use for preparing a model for Quantization Aware Training (Experimental) -- :ref:`keras_quantization_aware_training_finalize`: A function to finalize a model after Quantization Aware Training to a model without QuantizeWrappers(Experimental) -- :ref:`get_keras_gptq_config`: A function to create a GradientPTQConfig instance to use for Keras models when using GPTQ (experimental). -- :ref:`get_pytorch_gptq_config`: A function to create a GradientPTQConfig instance to use for Pytorch models when using GPTQ (experimental). -- :ref:`get_target_platform_capabilities`: A function to get a target platform model for Tensorflow and Pytorch. -- :ref:`keras_kpi_data_experimental`: A function to compute KPI data that can be used to calculate the desired target KPI for mixed-precision quantization of Keras models (experimental). -- :ref:`pytorch_kpi_data_experimental`: A function to compute KPI data that can be used to calculate the desired target KPI for mixed-precision quantization of PyTorch models (experimental). -- :ref:`keras_load_quantized_model`: A function to load a quantized keras model (experimental). -- :ref:`tensorflow_data_generation_experimental`: A function to generate data for a Keras model (experimental). -- :ref:`get_keras_data_generation_config`: A function to generate a DataGenerationConfig for Tensorflow data generation(experimental). -- :ref:`pytorch_data_generation_experimental`: A function to generate data for a Pytorch model (experimental). -- :ref:`get_pytorch_data_generation_config`: A function to load a DataGenerationConfig for Pytorch data generation (experimental). -- :ref:`keras_pruning_experimental`: A function to apply structured pruning for Keras models (experimental). - - -Modules -========= -- :ref:`core_config`: Module to contain configurations of the optimization process. -- :ref:`quantization_config`: Module to configure the quantization process. -- :ref:`mixed_precision_quantization_config`: Module to configure the quantization process when using mixed-precision PTQ. -- :ref:`debug_config`: Module to configure options for debugging the optimization process. -- :ref:`target_platform`: Module to create and model hardware-related settings to optimize the model according to, by the hardware the optimized model will use during inference. -- :ref:`qat_config`: Module to create quantization configuration for Quantization-aware Training. -- :ref:`exporter`: Module that enables to export a quantized model in different serialization formats. 
-- :ref:`trainable_infrastructure`: Module that contains quantization abstraction and quantizers for hardware-oriented model optimization tools. - -Classes -========= -- :ref:`GradientPTQConfig`: Class to configure GradientPTQ options for gradient based post training quantization. -- :ref:`FolderImageLoader`: Class to use an images directory as a representative dataset. -- :ref:`FrameworkInfo`: Class to wrap framework information to be used by MCT when optimizing models. - - -Indices and tables -================== - -* :ref:`genindex` -* :ref:`modindex` -* :ref:`search` - -.. note:: This documentation is auto-generated using Sphinx - diff --git a/docsrc/source/api/experimental_api_docs/methods/keras_pruning_experimental.rst b/docsrc/source/api/experimental_api_docs/methods/keras_pruning_experimental.rst deleted file mode 100644 index 787bb2452..000000000 --- a/docsrc/source/api/experimental_api_docs/methods/keras_pruning_experimental.rst +++ /dev/null @@ -1,25 +0,0 @@ -:orphan: - -.. _ug-keras_pruning_experimental: - - -================================================ -Keras Structured Pruning -================================================ - -.. autofunction:: model_compression_toolkit.pruning.keras_pruning_experimental - -================================================ -Pruning Configuration -================================================ - -.. autofunction:: model_compression_toolkit.pruning.PruningConfig - - - -================================================ -Pruning Information -================================================ - -.. autofunction:: model_compression_toolkit.pruning.PruningInfo - diff --git a/docsrc/source/api/experimental_api_docs/methods/pytorch_pruning_experimental.rst b/docsrc/source/api/experimental_api_docs/methods/pytorch_pruning_experimental.rst deleted file mode 100644 index f52e130f5..000000000 --- a/docsrc/source/api/experimental_api_docs/methods/pytorch_pruning_experimental.rst +++ /dev/null @@ -1,25 +0,0 @@ -:orphan: - -.. _ug-pytorch_pruning_experimental: - - -================================================ -Pytorch Structured Pruning -================================================ - -.. autofunction:: model_compression_toolkit.pruning.pytorch_pruning_experimental - -================================================ -Pruning Configuration -================================================ - -.. autofunction:: model_compression_toolkit.pruning.PruningConfig - - - -================================================ -Pruning Information -================================================ - -.. autofunction:: model_compression_toolkit.pruning.PruningInfo - diff --git a/docsrc/source/api/experimental_api_docs/modules/mixed_precision_quantization_config.rst b/docsrc/source/api/experimental_api_docs/modules/mixed_precision_quantization_config.rst deleted file mode 100644 index f3d6aba8c..000000000 --- a/docsrc/source/api/experimental_api_docs/modules/mixed_precision_quantization_config.rst +++ /dev/null @@ -1,26 +0,0 @@ -:orphan: - -.. _ug-mixed_precision_quantization_config_v2: - - -=========================================================== -mixed_precision_quantization_config Module -=========================================================== - - -KPI -================================ -**Object to configure resources to use when searching for a mixed-precision configuration for a model:** - -.. 
autoclass:: model_compression_toolkit.core.KPI - - -| - - -MixedPrecisionQuantizationConfigV2 -=================================== -**Class to configure the quantization process of the model when quantizing in mixed-precision:** - -.. autoclass:: model_compression_toolkit.core.MixedPrecisionQuantizationConfig - diff --git a/docsrc/source/index.rst b/docsrc/source/index.rst index c6a9b0be0..2c4713162 100644 --- a/docsrc/source/index.rst +++ b/docsrc/source/index.rst @@ -52,21 +52,21 @@ Supported Features Keras: -* :ref:`Post Training Quantization` [1] -* :ref:`Gradient based post training using knowledge distillation` -* :ref:`Mixed-precision post training quantization` -* :ref:`Init model for Quantization Aware Training` (Experimental) -* :ref:`Finalize model after Quantization Aware Training` (Experimental) -* :ref:`Structured Pruning` (Experimental) +* :ref:`Post Training Quantization` [1] +* :ref:`Gradient based post training using knowledge distillation` +* :ref:`Init model for Quantization Aware Training` (Experimental) +* :ref:`Finalize model after Quantization Aware Training` (Experimental) +* :ref:`Structured pruning` (Experimental) +* :ref:`Data generation` (Experimental) Pytorch: -* :ref:`Post Training Quantization` [1] -* :ref:`Gradient based post training using knowledge distillation` -* :ref:`Mixed-precision post training quantization` -* :ref:`Init model for Quantization Aware Training` (Experimental) -* :ref:`Finalize model after Quantization Aware Training` (Experimental) - +* :ref:`Post Training Quantization` [1] +* :ref:`Gradient based post training using knowledge distillation` +* :ref:`Init model for Quantization Aware Training` (Experimental) +* :ref:`Finalize model after Quantization Aware Training` (Experimental) +* :ref:`Structured pruning` (Experimental) +* :ref:`Data generation` (Experimental) Visualization: @@ -101,7 +101,7 @@ Please visit the MCT API documentation here :titlesonly: :maxdepth: 1 - API Documentation<../api/experimental_api_docs/index> + API Documentation<../api/api_docs/index> Technical Constraints ========================= From 1ca7bbb7a8deffe159f993b3a0df78c8594e4683 Mon Sep 17 00:00:00 2001 From: reuvenp Date: Thu, 7 Mar 2024 17:52:56 +0200 Subject: [PATCH 4/9] fix comments of OperationsSetToLayers --- .../targetplatform2framework/operations_to_layers.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/model_compression_toolkit/target_platform_capabilities/target_platform/targetplatform2framework/operations_to_layers.py b/model_compression_toolkit/target_platform_capabilities/target_platform/targetplatform2framework/operations_to_layers.py index 9fdc38dc7..6a1809f12 100644 --- a/model_compression_toolkit/target_platform_capabilities/target_platform/targetplatform2framework/operations_to_layers.py +++ b/model_compression_toolkit/target_platform_capabilities/target_platform/targetplatform2framework/operations_to_layers.py @@ -35,9 +35,9 @@ def __init__(self, Args: op_set_name (str): Name of OperatorsSet to associate with layers. layers (List[Any]): List of layers/FilterLayerParams to associate with OperatorsSet. - attr_mapping (dict): A mapping between a general attribute name to a DefaultDict that maps a layer -+ type to the layer's framework name of this attribute (the dictionary type is not specified to -+ handle circular dependency). 
+ attr_mapping (dict): A mapping between a general attribute name to a DefaultDict that maps a layer type + to the layer's framework name of this attribute (the dictionary type is not specified to handle circular + dependency). """ self.layers = layers self.attr_mapping = attr_mapping From 385b9f4e7493a6355e94dc052c42a35367193531 Mon Sep 17 00:00:00 2001 From: reuvenp Date: Thu, 7 Mar 2024 18:06:11 +0200 Subject: [PATCH 5/9] automate makefile --- docsrc/Makefile | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/docsrc/Makefile b/docsrc/Makefile index a31637a91..b869c2d44 100644 --- a/docsrc/Makefile +++ b/docsrc/Makefile @@ -6,7 +6,17 @@ github: @cp -a ../docs/html/. ../docs @rm -rf ../docs/html/ @rm -rf ../docs/doctrees/ + @find ../docs -type f -exec sed -i 's|_images/|images/|g' {} + + @find ../docs -type f -exec sed -i 's|_static/|static/|g' {} + + @rm -rf ../docs/images + @rm -rf ../docs/static + @mv ../docs/_images/ ../docs/images + @mv ../docs/_static/ ../docs/static + + +#@find ../docs -type f -exec sed -i 's|_images/|images/|g' {} + +#@find ../docs -type f -exec sed -i 's|_static/|static/|g' {} + # rm -rf ../docs/images/ # rm -rf ../docs/statis/ # mv ../docs/_images/ ../docs/images From 2cc4a9b08d4c8337f8d5ac61457bab83a87d9399 Mon Sep 17 00:00:00 2001 From: reuvenp Date: Sat, 9 Mar 2024 20:08:28 +0200 Subject: [PATCH 6/9] Add export pytorch example --- docsrc/source/api/api_docs/index.rst | 4 - .../source/api/api_docs/modules/exporter.rst | 154 +++++++++++++++++- .../api_docs/notes/experimental_api_note.rst | 7 - 3 files changed, 153 insertions(+), 12 deletions(-) delete mode 100644 docsrc/source/api/api_docs/notes/experimental_api_note.rst diff --git a/docsrc/source/api/api_docs/index.rst b/docsrc/source/api/api_docs/index.rst index 072f21f1e..3b8eec621 100644 --- a/docsrc/source/api/api_docs/index.rst +++ b/docsrc/source/api/api_docs/index.rst @@ -15,10 +15,6 @@ API Docs | -.. include:: ./notes/experimental_api_note.rst - -| - Functions ========= diff --git a/docsrc/source/api/api_docs/modules/exporter.rst b/docsrc/source/api/api_docs/modules/exporter.rst index 987cbe483..7977cc700 100644 --- a/docsrc/source/api/api_docs/modules/exporter.rst +++ b/docsrc/source/api/api_docs/modules/exporter.rst @@ -9,7 +9,13 @@ exporter Module Allows to export a quantized model in different serialization formats and quantization formats. For more details about the export formats and options, please refer to the project's GitHub `README file `_. -Note that this feature is experimental and subject to future changes. If you have any questions or issues, please open an issue in this GitHub repository. +If you have any questions or issues, please open an issue in this GitHub repository. + + +QuantizationFormat +========================== + +.. autoclass:: model_compression_toolkit.exporter.QuantizationFormat KerasExportSerializationFormat @@ -39,3 +45,149 @@ Allows to export a Pytorch model that was quantized via MCT. .. autoclass:: model_compression_toolkit.exporter.pytorch_export_model + + +Pytorch Tutorial +========================== + +To export a Pytorch model as a quantized model, it is necessary to first apply quantization +to the model using MCT: + +.. code-block:: shell + + ! pip install -q mct-nightly + +In order to export your quantized model to ONNX format, and use it for inference, some additional packages are needed. Notice, this is needed only for models exported to ONNX format, so this part can be skipped if this is not planned: + +.. code-block:: shell + + ! 
pip install -q onnx onnxruntime onnxruntime-extensions
+
+Now, let's start the export demonstration by quantizing the model using MCT:
+
+.. code-block:: python
+
+    import model_compression_toolkit as mct
+    import numpy as np
+    import torch
+    from torchvision.models.mobilenetv2 import mobilenet_v2
+
+    # Create a model
+    float_model = mobilenet_v2()
+
+
+    # Notice that here the representative dataset is random for demonstration only.
+    def representative_data_gen():
+        yield [np.random.random((1, 3, 224, 224))]
+
+
+    quantized_exportable_model, _ = mct.ptq.pytorch_post_training_quantization(float_model, representative_data_gen=representative_data_gen)
+
+
+
+
+### ONNX
+
+The model will be exported in ONNX format where weights and activations are represented as float. Notice that `onnx` should be installed in order to export the model to an ONNX model.
+
+There are two optional formats to choose from: MCTQ or FAKELY_QUANT.
+
+#### MCTQ Quantization Format
+
+By default, `mct.exporter.pytorch_export_model` will export the quantized pytorch model to
+an ONNX model with custom quantizers from mct_quantizers module.
+
+
+
+.. code-block:: python
+
+    # Path of exported model
+    onnx_file_path = 'model_format_onnx_mctq.onnx'
+
+    # Export ONNX model with mctq quantizers.
+    mct.exporter.pytorch_export_model(model=quantized_exportable_model,
+                                      save_model_path=onnx_file_path,
+                                      repr_dataset=representative_data_gen)
+
+Notice that the model has the same size as the quantized exportable model as weights data types are float.
+
+#### ONNX opset version
+
+By default, the ONNX opset version used is 15, but this can be changed using `onnx_opset_version`:
+
+.. code-block:: python
+
+    # Export ONNX model with mctq quantizers.
+    mct.exporter.pytorch_export_model(model=quantized_exportable_model,
+                                      save_model_path=onnx_file_path,
+                                      repr_dataset=representative_data_gen,
+                                      onnx_opset_version=16)
+
+### Use exported model for inference
+
+To load and infer using the exported model, which was exported to an ONNX file in MCTQ format, we will use `mct_quantizers` method `get_ort_session_options` during onnxruntime session creation. **Notice**: inference on models that are exported in this format is slower and suffers from longer latency. However, inference of these models on IMX500 will not suffer from this issue.
+
+.. code-block:: python
+
+    import mct_quantizers as mctq
+    import onnxruntime as ort
+
+    sess = ort.InferenceSession(onnx_file_path,
+                                mctq.get_ort_session_options(),
+                                providers=['CUDAExecutionProvider', 'CPUExecutionProvider'])
+
+    _input_data = next(representative_data_gen())[0].astype(np.float32)
+    _model_output_name = sess.get_outputs()[0].name
+    _model_input_name = sess.get_inputs()[0].name
+
+    # Run inference
+    predictions = sess.run([_model_output_name], {_model_input_name: _input_data})
+
+#### Fakely-Quantized
+
+To export a fakely-quantized model, use QuantizationFormat.FAKELY_QUANT:
+
+.. code-block:: python
+
+    import tempfile
+
+    # Path of exported model
+    _, onnx_file_path = tempfile.mkstemp('.onnx')
+
+    # Use QuantizationFormat.FAKELY_QUANT for fakely-quantized weights and activations.
+    mct.exporter.pytorch_export_model(model=quantized_exportable_model,
+                                      save_model_path=onnx_file_path,
+                                      repr_dataset=representative_data_gen,
+                                      quantization_format=mct.exporter.QuantizationFormat.FAKELY_QUANT)
+
+
+Notice that the fakely-quantized model has the same size as the quantized
+exportable model as weights data types are float.
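+
+The fakely-quantized model can then be run for inference as well; the following is a minimal sketch, assuming the fakely-quantized graph contains only standard ONNX operators and therefore needs no mct_quantizers session options (`onnx_file_path` and `representative_data_gen` are the objects defined above):
+
+.. code-block:: python
+
+    import numpy as np
+    import onnxruntime as ort
+
+    # The fakely-quantized graph is assumed to contain only standard ONNX ops,
+    # so a default onnxruntime session (without custom quantizers) can run it.
+    sess = ort.InferenceSession(onnx_file_path, providers=['CPUExecutionProvider'])
+
+    # Reuse the representative dataset from above as a sample input.
+    _input_data = next(representative_data_gen())[0].astype(np.float32)
+    _input_name = sess.get_inputs()[0].name
+
+    # Run inference on the fakely-quantized model.
+    predictions = sess.run(None, {_input_name: _input_data})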
+ +### TorchScript + +The model will be exported in TorchScript format where weights and activations are +quantized but represented as float (fakely quant). + +.. code-block:: python + + # Path of exported model + _, torchscript_file_path = tempfile.mkstemp('.pt') + + + # Use mode PytorchExportSerializationFormat.TORCHSCRIPT a torchscript model + # and QuantizationFormat.FAKELY_QUANT for fakely-quantized weights and activations. + mct.exporter.pytorch_export_model(model=quantized_exportable_model, + save_model_path=torchscript_file_path, + repr_dataset=representative_data_gen, + serialization_format=mct.exporter.PytorchExportSerializationFormat.TORCHSCRIPT, + quantization_format=mct.exporter.QuantizationFormat.FAKELY_QUANT) + +Notice that the fakely-quantized model has the same size as the quantized exportable model as weights data types are +float. + + + + + + diff --git a/docsrc/source/api/api_docs/notes/experimental_api_note.rst b/docsrc/source/api/api_docs/notes/experimental_api_note.rst deleted file mode 100644 index 4980a5344..000000000 --- a/docsrc/source/api/api_docs/notes/experimental_api_note.rst +++ /dev/null @@ -1,7 +0,0 @@ - -.. note:: - This is an experimental new API. The previous API is still available and can be used as before (please - visit :ref:`previous API documentation ` for more information). However, we recommend using the new API as the previous API is deprecated - and will be removed in the future. - - From 8de2704c59e6bae4fde328a025a8224c81ba5c42 Mon Sep 17 00:00:00 2001 From: reuvenp Date: Sat, 9 Mar 2024 20:22:19 +0200 Subject: [PATCH 7/9] add QuantizationFormat doc --- .../model_exporter/fw_agonstic/quantization_format.py | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/model_compression_toolkit/exporter/model_exporter/fw_agonstic/quantization_format.py b/model_compression_toolkit/exporter/model_exporter/fw_agonstic/quantization_format.py index dc9c7e965..b6fedc2b2 100644 --- a/model_compression_toolkit/exporter/model_exporter/fw_agonstic/quantization_format.py +++ b/model_compression_toolkit/exporter/model_exporter/fw_agonstic/quantization_format.py @@ -16,6 +16,16 @@ class QuantizationFormat(Enum): + """ + Specify which quantization format to use for exporting a quantized model. + + FAKELY_QUANT - Weights and activations are quantized but represented using float data type. + + INT8 - Weights and activations are represented using 8-bit integer data type. + + MCTQ - Weights and activations are quantized using mct_quantizers custom quantizers. + + """ FAKELY_QUANT = 0 INT8 = 1 MCTQ = 2 From 38eb005873713ac4c328b86176cc45334f7a4e44 Mon Sep 17 00:00:00 2001 From: reuvenp Date: Sat, 9 Mar 2024 20:25:46 +0200 Subject: [PATCH 8/9] fix exporter subtitles --- .../source/api/api_docs/modules/exporter.rst | 190 ++++++++++++++++-- 1 file changed, 175 insertions(+), 15 deletions(-) diff --git a/docsrc/source/api/api_docs/modules/exporter.rst b/docsrc/source/api/api_docs/modules/exporter.rst index 7977cc700..e441eee22 100644 --- a/docsrc/source/api/api_docs/modules/exporter.rst +++ b/docsrc/source/api/api_docs/modules/exporter.rst @@ -25,6 +25,159 @@ Select the serialization format for exporting a quantized Keras model. .. autoclass:: model_compression_toolkit.exporter.KerasExportSerializationFormat +keras_export_model +========================== +Allows to export a Keras model that was quantized via MCT. + +.. 
autoclass:: model_compression_toolkit.exporter.keras_export_model
+
+
+Keras Tutorial
+==========================
+To export a TensorFlow model as a quantized model, it is necessary to first apply quantization
+to the model using MCT:
+
+.. code-block:: shell
+
+    ! pip install -q mct-nightly
+
+.. code-block:: python
+
+    import numpy as np
+    from keras.applications import ResNet50
+    import model_compression_toolkit as mct
+
+    # Create a model
+    float_model = ResNet50()
+    # Quantize the model.
+    # Notice that here the representative dataset is random for demonstration only.
+    quantized_exportable_model, _ = mct.ptq.keras_post_training_quantization(float_model,
+                                                                             representative_data_gen=lambda: [np.random.random((1, 224, 224, 3))])
+
+
+++++++++++++++++++++++++++++
+keras serialization format
+++++++++++++++++++++++++++++
+The model will be exported as a tensorflow `.keras` model where weights and activations are quantized but represented using a float32 dtype.
+Two optional quantization formats are available: MCTQ and FAKELY_QUANT.
+
+++++
+MCTQ
+++++
+
+By default, `mct.exporter.keras_export_model` will export the quantized Keras model to
+a .keras model with custom quantizers from mct_quantizers module.
+
+.. code-block:: python
+
+    import tempfile
+
+    # Path of exported model
+    _, keras_file_path = tempfile.mkstemp('.keras')
+
+    # Export a keras model with mctq custom quantizers.
+    mct.exporter.keras_export_model(model=quantized_exportable_model,
+                                    save_model_path=keras_file_path)
+
+Notice that the model has the same size as the quantized exportable model as weights data types are float.
+
++++++++++++++++++++++++++++
+Fakely-Quantized in Keras
++++++++++++++++++++++++++++
+
+.. code-block:: python
+
+    # Path of exported model
+    _, keras_file_path = tempfile.mkstemp('.keras')
+
+    # Use mode KerasExportSerializationFormat.KERAS for a .keras model
+    # and QuantizationFormat.FAKELY_QUANT for fakely-quantized weights
+    # and activations.
+    mct.exporter.keras_export_model(model=quantized_exportable_model,
+                                    save_model_path=keras_file_path,
+                                    quantization_format=mct.exporter.QuantizationFormat.FAKELY_QUANT)
+
+Notice that the fakely-quantized model has the same size as the quantized exportable model as weights data types are
+float.
+
+++++++
+TFLite
+++++++
+
+The tflite serialization format exports in two quantization formats: INT8 and FAKELY_QUANT.
+
++++++++++++
+INT8 TFLite
++++++++++++
+
+The model will be exported as a tflite model where weights and activations are represented as 8bit integers.
+
+.. code-block:: python
+
+    import tempfile
+
+    # Path of exported model
+    _, tflite_file_path = tempfile.mkstemp('.tflite')
+
+    # Use mode KerasExportSerializationFormat.TFLITE for tflite model and quantization_format.INT8.
+    mct.exporter.keras_export_model(model=quantized_exportable_model,
+                                    save_model_path=tflite_file_path,
+                                    serialization_format=mct.exporter.KerasExportSerializationFormat.TFLITE,
+                                    quantization_format=mct.exporter.QuantizationFormat.INT8)
+
+Compare size of float and quantized model:
+
+
+.. 
code-block:: python + + import os + + # Save float model to measure its size + _, float_file_path = tempfile.mkstemp('.keras') + float_model.save(float_file_path) + + print("Float model in Mb:", os.path.getsize(float_file_path) / float(2 ** 20)) + print("Quantized model in Mb:", os.path.getsize(tflite_file_path) / float(2 ** 20)) + print(f'Compression ratio: {os.path.getsize(float_file_path) / os.path.getsize(tflite_file_path)}') + + ++++++++++++++++++++++++ +Fakely-Quantized TFLite ++++++++++++++++++++++++ + +The model will be exported as a tflite model where weights and activations are quantized but represented with a float data type. + ++++++++++++++ +Usage Example ++++++++++++++ + + + +.. code-block:: python + + # Path of exported model + _, tflite_file_path = tempfile.mkstemp('.tflite') + + # Use mode KerasExportSerializationFormat.TFLITE for tflite model and QuantizationFormat.FAKELY_QUANT for fakely-quantized weights + # and activations. + mct.exporter.keras_export_model(model=quantized_exportable_model, + save_model_path=tflite_file_path, + serialization_format=mct.exporter.KerasExportSerializationFormat.TFLITE, + quantization_format=mct.exporter.QuantizationFormat.FAKELY_QUANT) + + + + + +Notice that the fakely-quantized model has the same size as the quantized exportable model as weights data types are +float. + + + + + + PytorchExportSerializationFormat ================================== Select the serialization format for exporting a quantized Pytorch model. @@ -32,11 +185,7 @@ Select the serialization format for exporting a quantized Pytorch model. .. autoclass:: model_compression_toolkit.exporter.PytorchExportSerializationFormat -keras_export_model -========================== -Allows to export a Keras model that was quantized via MCT. -.. autoclass:: model_compression_toolkit.exporter.keras_export_model pytorch_export_model @@ -85,14 +234,17 @@ Now, let's start the export demonstration by quantizing the model using MCT: - -### ONNX ++++++++++ +ONNX ++++++++++ The model will be exported in ONNX format where weights and activations are represented as float. Notice that `onnx` should be installed in order to export the model to an ONNX model. There are two optional formats to choose: MCTQ or FAKELY_QUANT. -#### MCTQ Quantization Format ++++++++++++++++++++++++++++ +MCTQ Quantization Format ++++++++++++++++++++++++++++ By default, `mct.exporter.pytorch_export_model` will export the quantized pytorch model to an ONNX model with custom quantizers from mct_quantizers module. @@ -111,7 +263,9 @@ an ONNX model with custom quantizers from mct_quantizers module. Notice that the model has the same size as the quantized exportable model as weights data types are float. -#### ONNX opset version ++++++++++++++++++++++++++++ +ONNX opset version ++++++++++++++++++++++++++++ By default, the used ONNX opset version is 15, but this can be changed using `onnx_opset_version`: @@ -123,7 +277,11 @@ By default, the used ONNX opset version is 15, but this can be changed using `on repr_dataset=representative_data_gen, onnx_opset_version=16) -### Use exported model for inference +| + +++++++++++++++++++++++++++++++++++++ +Use exported model for inference +++++++++++++++++++++++++++++++++++++ To load and infer using the exported model, which was exported to an ONNX file in MCTQ format, we will use `mct_quantizers` method `get_ort_session_options` during onnxruntime session creation. **Notice**, inference on models that are exported in this format are slowly and suffers from longer latency. 
However, inference of these models on IMX500 will not suffer from this issue. @@ -143,7 +301,11 @@ To load and infer using the exported model, which was exported to an ONNX file i # Run inference predictions = sess.run([_model_output_name], {_model_input_name: _input_data}) -#### Fakely-Quantized +| + ++++++++++++++++++++++++++++++ +Fakely-Quantized in Pytorch ++++++++++++++++++++++++++++++ To export a fakely-quantized model, use QuantizationFormat.FAKELY_QUANT: @@ -164,7 +326,9 @@ To export a fakely-quantized model, use QuantizationFormat.FAKELY_QUANT: Notice that the fakely-quantized model has the same size as the quantized exportable model as weights data types are float. -### TorchScript +++++++++++++++++++ +TorchScript +++++++++++++++++++ The model will be exported in TorchScript format where weights and activations are quantized but represented as float (fakely quant). @@ -187,7 +351,3 @@ Notice that the fakely-quantized model has the same size as the quantized export float. - - - - From 7b1d1080629c4b23b34ad2835bb45f73ae0d777f Mon Sep 17 00:00:00 2001 From: reuvenp Date: Sat, 9 Mar 2024 20:40:17 +0200 Subject: [PATCH 9/9] auto generated --- .../api/api_docs/classes/DefaultDict.rst.txt | 11 + .../classes/FolderImageLoader.rst.txt | 20 + .../api_docs/classes/FrameworkInfo.rst.txt | 23 + .../classes/GradientPTQConfig.rst.txt | 24 + .../api_docs/classes/PruningConfig.rst.txt | 9 + .../api/api_docs/classes/PruningInfo.rst.txt | 10 + docs/_sources/api/api_docs/index.rst.txt | 50 +- .../get_keras_data_generation_config.rst.txt | 10 + .../methods/get_keras_gptq_config.rst.txt | 10 + ...get_pytorch_data_generation_config.rst.txt | 10 + .../methods/get_pytroch_gptq_config.rst.txt | 10 + .../get_target_platform_capabilities.rst.txt | 13 + ...keras_data_generation_experimental.rst.txt | 10 + ...training_quantization_experimental.rst.txt | 10 + .../keras_kpi_data_experimental.rst.txt | 10 + .../keras_load_quantizad_model.rst.txt | 10 + ...training_quantization_experimental.rst.txt | 10 + .../keras_pruning_experimental.rst.txt | 12 + ...antization_aware_training_finalize.rst.txt | 10 + ...s_quantization_aware_training_init.rst.txt | 10 + ...torch_data_generation_experimental.rst.txt | 10 + ...training_quantization_experimental.rst.txt | 10 + .../pytorch_kpi_data_experimental.rst.txt | 10 + ...training_quantization_experimental.rst.txt | 10 + .../pytorch_pruning_experimental.rst.txt | 15 + ...antization_aware_training_finalize.rst.txt | 10 + ...h_quantization_aware_training_init.rst.txt | 10 + .../api_docs/methods/set_logger_path.rst.txt | 10 + .../api/api_docs/modules/core_config.rst.txt | 16 + .../api/api_docs/modules/debug_config.rst.txt | 17 + .../api/api_docs/modules/exporter.rst.txt | 353 ++++++++++++++ .../api_docs/modules/layer_filters.rst.txt | 40 ++ ...ixed_precision_quantization_config.rst.txt | 15 +- .../api_docs/modules/network_editor.rst.txt | 62 +++ .../api/api_docs/modules/qat_config.rst.txt | 26 + .../modules/quantization_config.rst.txt | 25 + .../api_docs/modules/target_platform.rst.txt | 357 ++++++++++++++ .../modules/trainable_infrastructure.rst.txt | 83 ++++ .../api/api_docs/notes/tpc_note.rst.txt | 8 + docs/_sources/index.rst.txt | 28 +- docs/api/api_docs/classes/DefaultDict.html | 44 +- .../api_docs/classes/FolderImageLoader.html | 43 +- docs/api/api_docs/classes/FrameworkInfo.html | 34 +- .../api_docs/classes/GradientPTQConfig.html | 67 ++- docs/api/api_docs/classes/PruningConfig.html | 124 +++++ docs/api/api_docs/classes/PruningInfo.html | 117 +++++ 
docs/api/api_docs/index.html | 62 ++- .../get_keras_data_generation_config.html | 122 +++++ .../methods/get_keras_gptq_config.html | 57 ++- .../get_pytorch_data_generation_config.html | 123 +++++ .../methods/get_pytroch_gptq_config.html | 123 +++++ .../get_target_platform_capabilities.html | 46 +- .../keras_data_generation_experimental.html | 109 +++++ ...st_training_quantization_experimental.html | 165 +++++++ .../methods/keras_kpi_data_experimental.html | 126 +++++ .../methods/keras_load_quantizad_model.html | 101 ++++ ...st_training_quantization_experimental.html | 156 ++++++ .../methods/keras_pruning_experimental.html | 154 ++++++ ..._quantization_aware_training_finalize.html | 144 ++++++ ...eras_quantization_aware_training_init.html | 165 +++++++ .../pytorch_data_generation_experimental.html | 109 +++++ ...st_training_quantization_experimental.html | 146 ++++++ .../pytorch_kpi_data_experimental.html | 126 +++++ ...st_training_quantization_experimental.html | 135 ++++++ .../methods/pytorch_pruning_experimental.html | 158 ++++++ ..._quantization_aware_training_finalize.html | 127 +++++ ...orch_quantization_aware_training_init.html | 152 ++++++ .../api/api_docs/methods/set_logger_path.html | 25 +- docs/api/api_docs/modules/core_config.html | 113 +++++ docs/api/api_docs/modules/debug_config.html | 113 +++++ docs/api/api_docs/modules/exporter.html | 455 ++++++++++++++++++ docs/api/api_docs/modules/layer_filters.html | 33 +- .../mixed_precision_quantization_config.html | 27 +- docs/api/api_docs/modules/network_editor.html | 124 ++--- docs/api/api_docs/modules/qat_config.html | 131 +++++ .../api_docs/modules/quantization_config.html | 48 +- .../api/api_docs/modules/target_platform.html | 374 +++++++------- .../modules/trainable_infrastructure.html | 216 +++++++++ docs/api/api_docs/notes/tpc_note.html | 27 +- docs/genindex.html | 184 ++++--- docs/guidelines/quickstart_pytorch.html | 8 +- docs/guidelines/visualization.html | 4 +- docs/index.html | 28 +- docs/objects.inv | Bin 5533 -> 5385 bytes docs/searchindex.js | 2 +- 85 files changed, 5732 insertions(+), 612 deletions(-) create mode 100644 docs/_sources/api/api_docs/classes/DefaultDict.rst.txt create mode 100644 docs/_sources/api/api_docs/classes/FolderImageLoader.rst.txt create mode 100644 docs/_sources/api/api_docs/classes/FrameworkInfo.rst.txt create mode 100644 docs/_sources/api/api_docs/classes/GradientPTQConfig.rst.txt create mode 100644 docs/_sources/api/api_docs/classes/PruningConfig.rst.txt create mode 100644 docs/_sources/api/api_docs/classes/PruningInfo.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/get_keras_data_generation_config.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/get_keras_gptq_config.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/get_pytorch_data_generation_config.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/get_pytroch_gptq_config.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/get_target_platform_capabilities.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/keras_data_generation_experimental.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/keras_gradient_post_training_quantization_experimental.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/keras_kpi_data_experimental.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/keras_load_quantizad_model.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/keras_post_training_quantization_experimental.rst.txt create mode 100644 
docs/_sources/api/api_docs/methods/keras_pruning_experimental.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/keras_quantization_aware_training_finalize.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/keras_quantization_aware_training_init.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/pytorch_data_generation_experimental.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/pytorch_gradient_post_training_quantization_experimental.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/pytorch_kpi_data_experimental.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/pytorch_post_training_quantization_experimental.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/pytorch_pruning_experimental.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/pytorch_quantization_aware_training_finalize.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/pytorch_quantization_aware_training_init.rst.txt create mode 100644 docs/_sources/api/api_docs/methods/set_logger_path.rst.txt create mode 100644 docs/_sources/api/api_docs/modules/core_config.rst.txt create mode 100644 docs/_sources/api/api_docs/modules/debug_config.rst.txt create mode 100644 docs/_sources/api/api_docs/modules/exporter.rst.txt create mode 100644 docs/_sources/api/api_docs/modules/layer_filters.rst.txt create mode 100644 docs/_sources/api/api_docs/modules/network_editor.rst.txt create mode 100644 docs/_sources/api/api_docs/modules/qat_config.rst.txt create mode 100644 docs/_sources/api/api_docs/modules/quantization_config.rst.txt create mode 100644 docs/_sources/api/api_docs/modules/target_platform.rst.txt create mode 100644 docs/_sources/api/api_docs/modules/trainable_infrastructure.rst.txt create mode 100644 docs/_sources/api/api_docs/notes/tpc_note.rst.txt create mode 100644 docs/api/api_docs/classes/PruningConfig.html create mode 100644 docs/api/api_docs/classes/PruningInfo.html create mode 100644 docs/api/api_docs/methods/get_keras_data_generation_config.html create mode 100644 docs/api/api_docs/methods/get_pytorch_data_generation_config.html create mode 100644 docs/api/api_docs/methods/get_pytroch_gptq_config.html create mode 100644 docs/api/api_docs/methods/keras_data_generation_experimental.html create mode 100644 docs/api/api_docs/methods/keras_gradient_post_training_quantization_experimental.html create mode 100644 docs/api/api_docs/methods/keras_kpi_data_experimental.html create mode 100644 docs/api/api_docs/methods/keras_load_quantizad_model.html create mode 100644 docs/api/api_docs/methods/keras_post_training_quantization_experimental.html create mode 100644 docs/api/api_docs/methods/keras_pruning_experimental.html create mode 100644 docs/api/api_docs/methods/keras_quantization_aware_training_finalize.html create mode 100644 docs/api/api_docs/methods/keras_quantization_aware_training_init.html create mode 100644 docs/api/api_docs/methods/pytorch_data_generation_experimental.html create mode 100644 docs/api/api_docs/methods/pytorch_gradient_post_training_quantization_experimental.html create mode 100644 docs/api/api_docs/methods/pytorch_kpi_data_experimental.html create mode 100644 docs/api/api_docs/methods/pytorch_post_training_quantization_experimental.html create mode 100644 docs/api/api_docs/methods/pytorch_pruning_experimental.html create mode 100644 docs/api/api_docs/methods/pytorch_quantization_aware_training_finalize.html create mode 100644 docs/api/api_docs/methods/pytorch_quantization_aware_training_init.html create mode 
100644 docs/api/api_docs/modules/core_config.html create mode 100644 docs/api/api_docs/modules/debug_config.html create mode 100644 docs/api/api_docs/modules/exporter.html create mode 100644 docs/api/api_docs/modules/qat_config.html create mode 100644 docs/api/api_docs/modules/trainable_infrastructure.html diff --git a/docs/_sources/api/api_docs/classes/DefaultDict.rst.txt b/docs/_sources/api/api_docs/classes/DefaultDict.rst.txt new file mode 100644 index 000000000..3d62995b3 --- /dev/null +++ b/docs/_sources/api/api_docs/classes/DefaultDict.rst.txt @@ -0,0 +1,11 @@ +:orphan: + +.. _ug-DefaultDict: + + +================================= +DefaultDict Class +================================= + +.. autoclass:: model_compression_toolkit.DefaultDict + :members: diff --git a/docs/_sources/api/api_docs/classes/FolderImageLoader.rst.txt b/docs/_sources/api/api_docs/classes/FolderImageLoader.rst.txt new file mode 100644 index 000000000..6897e353f --- /dev/null +++ b/docs/_sources/api/api_docs/classes/FolderImageLoader.rst.txt @@ -0,0 +1,20 @@ +:orphan: + +.. _ug-FolderImageLoader: + +=============================== +Folder Image Loader API +=============================== + +**The following API can be used to load a folder of images to create a representative dataset for PTQ calibration** + +.. autoclass:: model_compression_toolkit.core.FolderImageLoader + :members: + + +================================= +Default file types to scan +================================= + +.. autodata:: model_compression_toolkit.core.common.data_loader.FILETYPES + diff --git a/docs/_sources/api/api_docs/classes/FrameworkInfo.rst.txt b/docs/_sources/api/api_docs/classes/FrameworkInfo.rst.txt new file mode 100644 index 000000000..2338a7dd4 --- /dev/null +++ b/docs/_sources/api/api_docs/classes/FrameworkInfo.rst.txt @@ -0,0 +1,23 @@ +:orphan: + +.. _ug-FrameworkInfo: + + +================================= +FrameworkInfo Class +================================= + +**The following API can be used to pass MCT framework-related information to use when optimizing the network** + +.. autoclass:: model_compression_toolkit.core.FrameworkInfo + + +| + + +ChannelAxis +========================== +**Enum to select the output channels format in the model:** + +.. autoclass:: model_compression_toolkit.core.ChannelAxis + diff --git a/docs/_sources/api/api_docs/classes/GradientPTQConfig.rst.txt b/docs/_sources/api/api_docs/classes/GradientPTQConfig.rst.txt new file mode 100644 index 000000000..11a79e1c8 --- /dev/null +++ b/docs/_sources/api/api_docs/classes/GradientPTQConfig.rst.txt @@ -0,0 +1,24 @@ +:orphan: + +.. _ug-GradientPTQConfig: + + +================================= +GradientPTQConfig Class +================================= + + +**The following API can be used to create a GradientPTQConfig instance which can be used for post training quantization using knowledge distillation from a teacher (float Keras model) to a student (the quantized Keras model)** + +.. autoclass:: model_compression_toolkit.gptq.GradientPTQConfig + :members: + +================================= +GPTQHessianScoresConfig Class +================================= + + +**The following API can be used to create a GPTQHessianScoresConfig instance which can be used to define necessary parameters for computing Hessian scores for the GPTQ loss function.** + +.. 
autoclass:: model_compression_toolkit.gptq.GPTQHessianScoresConfig + :members: diff --git a/docs/_sources/api/api_docs/classes/PruningConfig.rst.txt b/docs/_sources/api/api_docs/classes/PruningConfig.rst.txt new file mode 100644 index 000000000..0b57b743a --- /dev/null +++ b/docs/_sources/api/api_docs/classes/PruningConfig.rst.txt @@ -0,0 +1,9 @@ +:orphan: + +.. _ug-PruningConfig: + +================================================ +Pruning Configuration +================================================ + +.. autofunction:: model_compression_toolkit.pruning.PruningConfig \ No newline at end of file diff --git a/docs/_sources/api/api_docs/classes/PruningInfo.rst.txt b/docs/_sources/api/api_docs/classes/PruningInfo.rst.txt new file mode 100644 index 000000000..7bd02336c --- /dev/null +++ b/docs/_sources/api/api_docs/classes/PruningInfo.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-PruningInfo: + +================================================ +Pruning Information +================================================ + +.. autofunction:: model_compression_toolkit.pruning.PruningInfo + diff --git a/docs/_sources/api/api_docs/index.rst.txt b/docs/_sources/api/api_docs/index.rst.txt index 28f078466..3b8eec621 100644 --- a/docs/_sources/api/api_docs/index.rst.txt +++ b/docs/_sources/api/api_docs/index.rst.txt @@ -7,8 +7,6 @@ API Docs ========= -.. note:: This API will be removed in future releases. Please switch to the :ref:`new API` - **Init module for MCT API.** .. code-block:: python @@ -17,30 +15,56 @@ API Docs | + Functions ========= -- :ref:`pytorch_post_training_quantization`: Function to use for post training quantization of Pytorch models. -- :ref:`pytorch_post_training_quantization_mixed_precision`: Function to use for mixed-precision post training quantization of Pytorch models (experimental). -- :ref:`keras_post_training_quantization`: Function to use for post training quantization of Keras models. -- :ref:`keras_post_training_quantization_mixed_precision`: Function to use for mixed-precision post training quantization of Keras models (experimental). -- :ref:`get_keras_gptq_config`: Function to create a GradientPTQConfig instance to use for Keras models when using GPTQ (experimental). -- :ref:`get_target_platform_capabilities`: Function to get a target platform model for Tensorflow and Pytorch. -- :ref:`keras_kpi_data`: Function to compute KPI data that can be used to calculate the desired target KPI for mixed-precision quantization of Keras models. -- :ref:`pytorch_kpi_data`: Function to compute KPI data that can be used to calculate the desired target KPI for mixed-precision quantization of PyTorch models. +- :ref:`pytorch_post_training_quantization`: A function to use for post training quantization of PyTorch models. +- :ref:`keras_post_training_quantization`: A function to use for post training quantization of Keras models. + +- :ref:`keras_gradient_post_training_quantization`: A function to use for gradient-based post training quantization of Keras models. +- :ref:`get_keras_gptq_config`: A function to create a GradientPTQConfig instance to use for Keras models when using GPTQ. + +- :ref:`pytorch_gradient_post_training_quantization`: A function to use for gradient-based post training quantization of Pytorch models. +- :ref:`get_pytorch_gptq_config`: A function to create a GradientPTQConfig instance to use for Pytorch models when using GPTQ. 
+ +- :ref:`keras_quantization_aware_training_init`: A function to use for preparing a model for Quantization Aware Training (Experimental) +- :ref:`keras_quantization_aware_training_finalize`: A function to finalize a model after Quantization Aware Training to a model without QuantizeWrappers (Experimental) + +- :ref:`keras_data_generation_experimental`: A function to generate data for a Keras model (experimental). +- :ref:`get_keras_data_generation_config`: A function to generate a DataGenerationConfig for Tensorflow data generation(experimental). + +- :ref:`pytorch_data_generation_experimental`: A function to generate data for a Pytorch model (experimental). +- :ref:`get_pytorch_data_generation_config`: A function to load a DataGenerationConfig for Pytorch data generation (experimental). + +- :ref:`keras_pruning_experimental`: A function to apply structured pruning for Keras models (experimental). +- :ref:`pytorch_pruning_experimental`: A function to apply structured pruning for Pytorch models (experimental). + +- :ref:`keras_kpi_data`: A function to compute KPI data that can be used to calculate the desired target KPI for mixed-precision quantization of Keras models. +- :ref:`pytorch_kpi_data`: A function to compute KPI data that can be used to calculate the desired target KPI for mixed-precision quantization of PyTorch models. + +- :ref:`get_target_platform_capabilities`: A function to get a target platform model for Tensorflow and Pytorch. +- :ref:`keras_load_quantized_model`: A function to load a quantized keras model. Modules ========= +- :ref:`core_config`: Module to contain configurations of the optimization process. - :ref:`quantization_config`: Module to configure the quantization process. -- :ref:`mixed_precision_quantization_config`: Module to configure the quantization process when using mixed-precision PTQ. -- :ref:`network_editor`: Module to edit your model during the quantization process. +- :ref:`mixed_precision_quantization_config`: Module to configure the quantization process when using mixed-precision PTQ. +- :ref:`debug_config`: Module to configure options for debugging the optimization process. - :ref:`target_platform`: Module to create and model hardware-related settings to optimize the model according to, by the hardware the optimized model will use during inference. +- :ref:`qat_config`: Module to create quantization configuration for Quantization-aware Training. +- :ref:`exporter`: Module that enables to export a quantized model in different serialization formats. +- :ref:`trainable_infrastructure`: Module that contains quantization abstraction and quantizers for hardware-oriented model optimization tools. Classes ========= -- :ref:`GradientPTQConfig`: Class to configure GradientPTQC options for gradient based post training quantization. +- :ref:`GradientPTQConfig`: Class to configure GradientPTQ options for gradient based post training quantization. - :ref:`FolderImageLoader`: Class to use an images directory as a representative dataset. - :ref:`FrameworkInfo`: Class to wrap framework information to be used by MCT when optimizing models. 
+- :ref:`PruningConfig`: PruningConfig +- :ref:`PruningInfo`: PruningInfo + Indices and tables ================== diff --git a/docs/_sources/api/api_docs/methods/get_keras_data_generation_config.rst.txt b/docs/_sources/api/api_docs/methods/get_keras_data_generation_config.rst.txt new file mode 100644 index 000000000..33efd7cb7 --- /dev/null +++ b/docs/_sources/api/api_docs/methods/get_keras_data_generation_config.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-get_keras_data_generation_config: + + +=========================================== +Get DataGenerationConfig for Keras Models +=========================================== + +.. autofunction:: model_compression_toolkit.data_generation.get_keras_data_generation_config diff --git a/docs/_sources/api/api_docs/methods/get_keras_gptq_config.rst.txt b/docs/_sources/api/api_docs/methods/get_keras_gptq_config.rst.txt new file mode 100644 index 000000000..3f64adea5 --- /dev/null +++ b/docs/_sources/api/api_docs/methods/get_keras_gptq_config.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-get_keras_gptq_config: + + +======================================= +Get GradientPTQConfig for Keras Models +======================================= + +.. autofunction:: model_compression_toolkit.gptq.get_keras_gptq_config diff --git a/docs/_sources/api/api_docs/methods/get_pytorch_data_generation_config.rst.txt b/docs/_sources/api/api_docs/methods/get_pytorch_data_generation_config.rst.txt new file mode 100644 index 000000000..100e669dc --- /dev/null +++ b/docs/_sources/api/api_docs/methods/get_pytorch_data_generation_config.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-get_pytorch_data_generation_config: + + +=========================================== +Get DataGenerationConfig for Pytorch Models +=========================================== + +.. autofunction:: model_compression_toolkit.data_generation.get_pytorch_data_generation_config diff --git a/docs/_sources/api/api_docs/methods/get_pytroch_gptq_config.rst.txt b/docs/_sources/api/api_docs/methods/get_pytroch_gptq_config.rst.txt new file mode 100644 index 000000000..990c72e2c --- /dev/null +++ b/docs/_sources/api/api_docs/methods/get_pytroch_gptq_config.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-get_pytorch_gptq_config: + + +============================================ +Get GradientPTQConfig for Pytorch Models +============================================ + +.. autofunction:: model_compression_toolkit.gptq.get_pytorch_gptq_config diff --git a/docs/_sources/api/api_docs/methods/get_target_platform_capabilities.rst.txt b/docs/_sources/api/api_docs/methods/get_target_platform_capabilities.rst.txt new file mode 100644 index 000000000..cc623b66a --- /dev/null +++ b/docs/_sources/api/api_docs/methods/get_target_platform_capabilities.rst.txt @@ -0,0 +1,13 @@ +:orphan: + +.. _ug-get_target_platform_capabilities: + + +======================================= +Get TargetPlatformCapabilities +======================================= + +.. autofunction:: model_compression_toolkit.get_target_platform_capabilities + + +.. include:: ../notes/tpc_note.rst \ No newline at end of file diff --git a/docs/_sources/api/api_docs/methods/keras_data_generation_experimental.rst.txt b/docs/_sources/api/api_docs/methods/keras_data_generation_experimental.rst.txt new file mode 100644 index 000000000..66dfa8dcf --- /dev/null +++ b/docs/_sources/api/api_docs/methods/keras_data_generation_experimental.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. 
_ug-keras_data_generation_experimental: + + +===================================== +Keras Data Generation +===================================== + +.. autofunction:: model_compression_toolkit.data_generation.keras_data_generation_experimental diff --git a/docs/_sources/api/api_docs/methods/keras_gradient_post_training_quantization_experimental.rst.txt b/docs/_sources/api/api_docs/methods/keras_gradient_post_training_quantization_experimental.rst.txt new file mode 100644 index 000000000..afd2eabf6 --- /dev/null +++ b/docs/_sources/api/api_docs/methods/keras_gradient_post_training_quantization_experimental.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-keras_gradient_post_training_quantization: + + +================================================ +Keras Gradient Based Post Training Quantization +================================================ + +.. autofunction:: model_compression_toolkit.gptq.keras_gradient_post_training_quantization diff --git a/docs/_sources/api/api_docs/methods/keras_kpi_data_experimental.rst.txt b/docs/_sources/api/api_docs/methods/keras_kpi_data_experimental.rst.txt new file mode 100644 index 000000000..a0205814f --- /dev/null +++ b/docs/_sources/api/api_docs/methods/keras_kpi_data_experimental.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-keras_kpi_data: + + +======================================= +Get KPI information for Keras Models +======================================= + +.. autofunction:: model_compression_toolkit.core.keras_kpi_data diff --git a/docs/_sources/api/api_docs/methods/keras_load_quantizad_model.rst.txt b/docs/_sources/api/api_docs/methods/keras_load_quantizad_model.rst.txt new file mode 100644 index 000000000..d3d5d89b0 --- /dev/null +++ b/docs/_sources/api/api_docs/methods/keras_load_quantizad_model.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-keras_load_quantized_model: + + +======================================= +Load Quantized Keras Model +======================================= + +.. autofunction:: model_compression_toolkit.keras_load_quantized_model diff --git a/docs/_sources/api/api_docs/methods/keras_post_training_quantization_experimental.rst.txt b/docs/_sources/api/api_docs/methods/keras_post_training_quantization_experimental.rst.txt new file mode 100644 index 000000000..82a351716 --- /dev/null +++ b/docs/_sources/api/api_docs/methods/keras_post_training_quantization_experimental.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-keras_post_training_quantization: + + +================================= +Keras Post Training Quantization +================================= + +.. autofunction:: model_compression_toolkit.ptq.keras_post_training_quantization diff --git a/docs/_sources/api/api_docs/methods/keras_pruning_experimental.rst.txt b/docs/_sources/api/api_docs/methods/keras_pruning_experimental.rst.txt new file mode 100644 index 000000000..508a11e47 --- /dev/null +++ b/docs/_sources/api/api_docs/methods/keras_pruning_experimental.rst.txt @@ -0,0 +1,12 @@ +:orphan: + +.. _ug-keras_pruning_experimental: + + +================================================ +Keras Structured Pruning +================================================ + +.. 
autofunction:: model_compression_toolkit.pruning.keras_pruning_experimental + + diff --git a/docs/_sources/api/api_docs/methods/keras_quantization_aware_training_finalize.rst.txt b/docs/_sources/api/api_docs/methods/keras_quantization_aware_training_finalize.rst.txt new file mode 100644 index 000000000..54ff74a3f --- /dev/null +++ b/docs/_sources/api/api_docs/methods/keras_quantization_aware_training_finalize.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-keras_quantization_aware_training_finalize_experimental: + + +================================================ +Keras Quantization Aware Training Model Finalize +================================================ + +.. autofunction:: model_compression_toolkit.qat.keras_quantization_aware_training_finalize_experimental diff --git a/docs/_sources/api/api_docs/methods/keras_quantization_aware_training_init.rst.txt b/docs/_sources/api/api_docs/methods/keras_quantization_aware_training_init.rst.txt new file mode 100644 index 000000000..b89c3367e --- /dev/null +++ b/docs/_sources/api/api_docs/methods/keras_quantization_aware_training_init.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-keras_quantization_aware_training_init_experimental: + + +================================================ +Keras Quantization Aware Training Model Init +================================================ + +.. autofunction:: model_compression_toolkit.qat.keras_quantization_aware_training_init_experimental diff --git a/docs/_sources/api/api_docs/methods/pytorch_data_generation_experimental.rst.txt b/docs/_sources/api/api_docs/methods/pytorch_data_generation_experimental.rst.txt new file mode 100644 index 000000000..0679417ec --- /dev/null +++ b/docs/_sources/api/api_docs/methods/pytorch_data_generation_experimental.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-pytorch_data_generation_experimental: + + +===================================== +Pytorch Data Generation +===================================== + +.. autofunction:: model_compression_toolkit.data_generation.pytorch_data_generation_experimental diff --git a/docs/_sources/api/api_docs/methods/pytorch_gradient_post_training_quantization_experimental.rst.txt b/docs/_sources/api/api_docs/methods/pytorch_gradient_post_training_quantization_experimental.rst.txt new file mode 100644 index 000000000..95dcf10f0 --- /dev/null +++ b/docs/_sources/api/api_docs/methods/pytorch_gradient_post_training_quantization_experimental.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-pytorch_gradient_post_training_quantization: + + +==================================================== +Pytorch Gradient Based Post Training Quantization +==================================================== + +.. autofunction:: model_compression_toolkit.gptq.pytorch_gradient_post_training_quantization diff --git a/docs/_sources/api/api_docs/methods/pytorch_kpi_data_experimental.rst.txt b/docs/_sources/api/api_docs/methods/pytorch_kpi_data_experimental.rst.txt new file mode 100644 index 000000000..86f512eae --- /dev/null +++ b/docs/_sources/api/api_docs/methods/pytorch_kpi_data_experimental.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-pytorch_kpi_data: + + +======================================= +Get KPI information for PyTorch Models +======================================= + +.. 
autofunction:: model_compression_toolkit.core.pytorch_kpi_data diff --git a/docs/_sources/api/api_docs/methods/pytorch_post_training_quantization_experimental.rst.txt b/docs/_sources/api/api_docs/methods/pytorch_post_training_quantization_experimental.rst.txt new file mode 100644 index 000000000..46feca7ba --- /dev/null +++ b/docs/_sources/api/api_docs/methods/pytorch_post_training_quantization_experimental.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-pytorch_post_training_quantization: + + +===================================== +Pytorch Post Training Quantization +===================================== + +.. autofunction:: model_compression_toolkit.ptq.pytorch_post_training_quantization diff --git a/docs/_sources/api/api_docs/methods/pytorch_pruning_experimental.rst.txt b/docs/_sources/api/api_docs/methods/pytorch_pruning_experimental.rst.txt new file mode 100644 index 000000000..4f050cfe4 --- /dev/null +++ b/docs/_sources/api/api_docs/methods/pytorch_pruning_experimental.rst.txt @@ -0,0 +1,15 @@ +:orphan: + +.. _ug-pytorch_pruning_experimental: + + +================================================ +Pytorch Structured Pruning +================================================ + +.. autofunction:: model_compression_toolkit.pruning.pytorch_pruning_experimental + + + + + diff --git a/docs/_sources/api/api_docs/methods/pytorch_quantization_aware_training_finalize.rst.txt b/docs/_sources/api/api_docs/methods/pytorch_quantization_aware_training_finalize.rst.txt new file mode 100644 index 000000000..e391be8d7 --- /dev/null +++ b/docs/_sources/api/api_docs/methods/pytorch_quantization_aware_training_finalize.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-pytorch_quantization_aware_training_finalize_experimental: + + +=================================================== +PyTorch Quantization Aware Training Model Finalize +=================================================== + +.. autofunction:: model_compression_toolkit.qat.pytorch_quantization_aware_training_finalize_experimental diff --git a/docs/_sources/api/api_docs/methods/pytorch_quantization_aware_training_init.rst.txt b/docs/_sources/api/api_docs/methods/pytorch_quantization_aware_training_init.rst.txt new file mode 100644 index 000000000..4e14c7478 --- /dev/null +++ b/docs/_sources/api/api_docs/methods/pytorch_quantization_aware_training_init.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-pytorch_quantization_aware_training_init_experimental: + + +================================================ +PyTorch Quantization Aware Training Model Init +================================================ + +.. autofunction:: model_compression_toolkit.qat.pytorch_quantization_aware_training_init_experimental diff --git a/docs/_sources/api/api_docs/methods/set_logger_path.rst.txt b/docs/_sources/api/api_docs/methods/set_logger_path.rst.txt new file mode 100644 index 000000000..d449869aa --- /dev/null +++ b/docs/_sources/api/api_docs/methods/set_logger_path.rst.txt @@ -0,0 +1,10 @@ +:orphan: + +.. _ug-set_logger_path: + +================================= +Enable a Logger +================================= + +.. autofunction:: model_compression_toolkit.set_log_folder + diff --git a/docs/_sources/api/api_docs/modules/core_config.rst.txt b/docs/_sources/api/api_docs/modules/core_config.rst.txt new file mode 100644 index 000000000..5601ffabd --- /dev/null +++ b/docs/_sources/api/api_docs/modules/core_config.rst.txt @@ -0,0 +1,16 @@ +:orphan: + +.. 
_ug-core_config: + + +================================= +core_config Module +================================= + + +CoreConfig +========================== +**Class to configure the optimization process of the model:** + +.. autoclass:: model_compression_toolkit.core.CoreConfig + diff --git a/docs/_sources/api/api_docs/modules/debug_config.rst.txt b/docs/_sources/api/api_docs/modules/debug_config.rst.txt new file mode 100644 index 000000000..16654f433 --- /dev/null +++ b/docs/_sources/api/api_docs/modules/debug_config.rst.txt @@ -0,0 +1,17 @@ +:orphan: + +.. _ug-debug_config: + + +================================= +debug_config Module +================================= + + +DebugConfig +========================== +**Class to configure params for debugging purposes:** + +.. autoclass:: model_compression_toolkit.core.DebugConfig + + diff --git a/docs/_sources/api/api_docs/modules/exporter.rst.txt b/docs/_sources/api/api_docs/modules/exporter.rst.txt new file mode 100644 index 000000000..e441eee22 --- /dev/null +++ b/docs/_sources/api/api_docs/modules/exporter.rst.txt @@ -0,0 +1,353 @@ +:orphan: + +.. _ug-exporter: + + +================================= +exporter Module +================================= + +Allows to export a quantized model in different serialization formats and quantization formats. +For more details about the export formats and options, please refer to the project's GitHub `README file `_. +If you have any questions or issues, please open an issue in this GitHub repository. + + +QuantizationFormat +========================== + +.. autoclass:: model_compression_toolkit.exporter.QuantizationFormat + + +KerasExportSerializationFormat +================================ +Select the serialization format for exporting a quantized Keras model. + +.. autoclass:: model_compression_toolkit.exporter.KerasExportSerializationFormat + + +keras_export_model +========================== +Allows to export a Keras model that was quantized via MCT. + +.. autoclass:: model_compression_toolkit.exporter.keras_export_model + + +Keras Tutorial +========================== +To export a TensorFlow model as a quantized model, it is necessary to first apply quantization +to the model using MCT: + +.. code-block:: shell + + ! pip install -q mct-nightly + +.. code-block:: python + + import numpy as np + from keras.applications import ResNet50 + import model_compression_toolkit as mct + + # Create a model + float_model = ResNet50() + # Quantize the model. + # Notice that here the representative dataset is random for demonstration only. + quantized_exportable_model, _ = mct.ptq.keras_post_training_quantization(float_model, + representative_data_gen=lambda: [np.random.random((1, 224, 224, 3))]) + + + +++++++++++++++++++++++++++++ +keras serialization format +++++++++++++++++++++++++++++ +The model will be exported as a tensorflow `.keras` model where weights and activations are quantized but represented using a float32 dtype. +Two optional quantization formats are available: MCTQ and FAKELY_QUANT. + +++++ +MCTQ +++++ + +By default, `mct.exporter.keras_export_model` will export the quantized Keras model to +a .keras model with custom quantizers from mct_quantizers module. + +.. code-block:: python + + import tempfile + + # Path of exported model + _, keras_file_path = tempfile.mkstemp('.keras') + + # Export a keras model with mctq custom quantizers. 
+ mct.exporter.keras_export_model(model=quantized_exportable_model, + save_model_path=keras_file_path) + +Notice that the model has the same size as the quantized exportable model as weights data types are float. + ++++++++++++++++++++++++++++ +Fakely-Quantized in Keras ++++++++++++++++++++++++++++ + +.. code-block:: python + + # Path of exported model + _, keras_file_path = tempfile.mkstemp('.keras') + + # Use mode KerasExportSerializationFormat.KERAS for a .keras model + # and QuantizationFormat.FAKELY_QUANT for fakely-quantized weights + # and activations. + mct.exporter.keras_export_model(model=quantized_exportable_model, + save_model_path=keras_file_path, + quantization_format=mct.exporter.QuantizationFormat.FAKELY_QUANT) + +Notice that the fakely-quantized model has the same size as the quantized exportable model as weights data types are +float. + +++++++ +TFLite +++++++ + +The tflite serialization format export in two qauntization formats: INT8 and FAKELY_QUANT. + ++++++++++++ +INT8 TFLite ++++++++++++ + +The model will be exported as a tflite model where weights and activations are represented as 8bit integers. + +.. code-block:: python + + import tempfile + + # Path of exported model + _, tflite_file_path = tempfile.mkstemp('.tflite') + + # Use mode KerasExportSerializationFormat.TFLITE for tflite model and quantization_format.INT8. + mct.exporter.keras_export_model(model=quantized_exportable_model, + save_model_path=tflite_file_path, + serialization_format=mct.exporter.KerasExportSerializationFormat.TFLITE, + quantization_format=mct.exporter.QuantizationFormat.INT8) + +Compare size of float and quantized model: + + +.. code-block:: python + + import os + + # Save float model to measure its size + _, float_file_path = tempfile.mkstemp('.keras') + float_model.save(float_file_path) + + print("Float model in Mb:", os.path.getsize(float_file_path) / float(2 ** 20)) + print("Quantized model in Mb:", os.path.getsize(tflite_file_path) / float(2 ** 20)) + print(f'Compression ratio: {os.path.getsize(float_file_path) / os.path.getsize(tflite_file_path)}') + + ++++++++++++++++++++++++ +Fakely-Quantized TFLite ++++++++++++++++++++++++ + +The model will be exported as a tflite model where weights and activations are quantized but represented with a float data type. + ++++++++++++++ +Usage Example ++++++++++++++ + + + +.. code-block:: python + + # Path of exported model + _, tflite_file_path = tempfile.mkstemp('.tflite') + + # Use mode KerasExportSerializationFormat.TFLITE for tflite model and QuantizationFormat.FAKELY_QUANT for fakely-quantized weights + # and activations. + mct.exporter.keras_export_model(model=quantized_exportable_model, + save_model_path=tflite_file_path, + serialization_format=mct.exporter.KerasExportSerializationFormat.TFLITE, + quantization_format=mct.exporter.QuantizationFormat.FAKELY_QUANT) + + + + + +Notice that the fakely-quantized model has the same size as the quantized exportable model as weights data types are +float. + + + + + + +PytorchExportSerializationFormat +================================== +Select the serialization format for exporting a quantized Pytorch model. + +.. autoclass:: model_compression_toolkit.exporter.PytorchExportSerializationFormat + + + + + +pytorch_export_model +========================== +Allows to export a Pytorch model that was quantized via MCT. + +.. 
autoclass:: model_compression_toolkit.exporter.pytorch_export_model + + + +Pytorch Tutorial +========================== + +To export a Pytorch model as a quantized model, it is necessary to first apply quantization +to the model using MCT: + +.. code-block:: shell + + ! pip install -q mct-nightly + +In order to export your quantized model to ONNX format, and use it for inference, some additional packages are needed. Notice, this is needed only for models exported to ONNX format, so this part can be skipped if this is not planned: + +.. code-block:: shell + + ! pip install -q onnx onnxruntime onnxruntime-extensions + +Now, let's start the export demonstration by quantizing the model using MCT: + +.. code-block:: python + + import model_compression_toolkit as mct + import numpy as np + import torch + from torchvision.models.mobilenetv2 import mobilenet_v2 + + # Create a model + float_model = mobilenet_v2() + + + # Notice that here the representative dataset is random for demonstration only. + def representative_data_gen(): + yield [np.random.random((1, 3, 224, 224))] + + + quantized_exportable_model, _ = mct.ptq.pytorch_post_training_quantization(float_model, representative_data_gen=representative_data_gen) + + + ++++++++++ +ONNX ++++++++++ + +The model will be exported in ONNX format where weights and activations are represented as float. Notice that `onnx` should be installed in order to export the model to an ONNX model. + +There are two optional formats to choose: MCTQ or FAKELY_QUANT. + ++++++++++++++++++++++++++++ +MCTQ Quantization Format ++++++++++++++++++++++++++++ + +By default, `mct.exporter.pytorch_export_model` will export the quantized pytorch model to +an ONNX model with custom quantizers from mct_quantizers module. + + + +.. code-block:: python + + # Path of exported model + onnx_file_path = 'model_format_onnx_mctq.onnx' + + # Export ONNX model with mctq quantizers. + mct.exporter.pytorch_export_model(model=quantized_exportable_model, + save_model_path=onnx_file_path, + repr_dataset=representative_data_gen) + +Notice that the model has the same size as the quantized exportable model as weights data types are float. + ++++++++++++++++++++++++++++ +ONNX opset version ++++++++++++++++++++++++++++ + +By default, the used ONNX opset version is 15, but this can be changed using `onnx_opset_version`: + +.. code-block:: python + + # Export ONNX model with mctq quantizers. + mct.exporter.pytorch_export_model(model=quantized_exportable_model, + save_model_path=onnx_file_path, + repr_dataset=representative_data_gen, + onnx_opset_version=16) + +| + +++++++++++++++++++++++++++++++++++++ +Use exported model for inference +++++++++++++++++++++++++++++++++++++ + +To load and infer using the exported model, which was exported to an ONNX file in MCTQ format, we will use `mct_quantizers` method `get_ort_session_options` during onnxruntime session creation. **Notice**, inference on models that are exported in this format are slowly and suffers from longer latency. However, inference of these models on IMX500 will not suffer from this issue. + +.. 
code-block:: python + + import mct_quantizers as mctq + import onnxruntime as ort + + sess = ort.InferenceSession(onnx_file_path, + mctq.get_ort_session_options(), + providers=['CUDAExecutionProvider', 'CPUExecutionProvider']) + + _input_data = next(representative_data_gen())[0].astype(np.float32) + _model_output_name = sess.get_outputs()[0].name + _model_input_name = sess.get_inputs()[0].name + + # Run inference + predictions = sess.run([_model_output_name], {_model_input_name: _input_data}) + +| + ++++++++++++++++++++++++++++++ +Fakely-Quantized in Pytorch ++++++++++++++++++++++++++++++ + +To export a fakely-quantized model, use QuantizationFormat.FAKELY_QUANT: + +.. code-block:: python + + import tempfile + + # Path of exported model + _, onnx_file_path = tempfile.mkstemp('.onnx') + + # Use QuantizationFormat.FAKELY_QUANT for fakely-quantized weights and activations. + mct.exporter.pytorch_export_model(model=quantized_exportable_model, + save_model_path=onnx_file_path, + repr_dataset=representative_data_gen, + quantization_format=mct.exporter.QuantizationFormat.FAKELY_QUANT) + + +Notice that the fakely-quantized model has the same size as the quantized +exportable model as weights data types are float. + +++++++++++++++++++ +TorchScript +++++++++++++++++++ + +The model will be exported in TorchScript format where weights and activations are +quantized but represented as float (fakely quant). + +.. code-block:: python + + # Path of exported model + _, torchscript_file_path = tempfile.mkstemp('.pt') + + + # Use mode PytorchExportSerializationFormat.TORCHSCRIPT a torchscript model + # and QuantizationFormat.FAKELY_QUANT for fakely-quantized weights and activations. + mct.exporter.pytorch_export_model(model=quantized_exportable_model, + save_model_path=torchscript_file_path, + repr_dataset=representative_data_gen, + serialization_format=mct.exporter.PytorchExportSerializationFormat.TORCHSCRIPT, + quantization_format=mct.exporter.QuantizationFormat.FAKELY_QUANT) + +Notice that the fakely-quantized model has the same size as the quantized exportable model as weights data types are +float. + + diff --git a/docs/_sources/api/api_docs/modules/layer_filters.rst.txt b/docs/_sources/api/api_docs/modules/layer_filters.rst.txt new file mode 100644 index 000000000..fb6af858b --- /dev/null +++ b/docs/_sources/api/api_docs/modules/layer_filters.rst.txt @@ -0,0 +1,40 @@ +:orphan: + +.. _ug-layer_filters: + + +================================= +Layer Attributes Filters +================================= + +In order to create LayerFilterParams which needed to filter layers by their attributes, +one may use the next filters to check if a layer configuration holds the created LayerFilterParams: + + + +Attribute Filters +================== + +.. autoclass:: model_compression_toolkit.target_platform.Eq + +| + +.. autoclass:: model_compression_toolkit.target_platform.NotEq + +| + +.. autoclass:: model_compression_toolkit.target_platform.Greater + +| + + +.. autoclass:: model_compression_toolkit.target_platform.GreaterEq + +| + + +.. autoclass:: model_compression_toolkit.target_platform.Smaller + +| + +.. 
autoclass:: model_compression_toolkit.target_platform.SmallerEq diff --git a/docs/_sources/api/api_docs/modules/mixed_precision_quantization_config.rst.txt b/docs/_sources/api/api_docs/modules/mixed_precision_quantization_config.rst.txt index e48b66381..f3d6aba8c 100644 --- a/docs/_sources/api/api_docs/modules/mixed_precision_quantization_config.rst.txt +++ b/docs/_sources/api/api_docs/modules/mixed_precision_quantization_config.rst.txt @@ -1,27 +1,26 @@ :orphan: -.. _ug-mixed_precision_quantization_config: +.. _ug-mixed_precision_quantization_config_v2: -=========================================== +=========================================================== mixed_precision_quantization_config Module -=========================================== +=========================================================== KPI ================================ **Object to configure resources to use when searching for a mixed-precision configuration for a model:** -.. autoclass:: model_compression_toolkit.KPI - :noindex: +.. autoclass:: model_compression_toolkit.core.KPI | -MixedPrecisionQuantizationConfig -================================= +MixedPrecisionQuantizationConfigV2 +=================================== **Class to configure the quantization process of the model when quantizing in mixed-precision:** -.. autoclass:: model_compression_toolkit.MixedPrecisionQuantizationConfig +.. autoclass:: model_compression_toolkit.core.MixedPrecisionQuantizationConfig diff --git a/docs/_sources/api/api_docs/modules/network_editor.rst.txt b/docs/_sources/api/api_docs/modules/network_editor.rst.txt new file mode 100644 index 000000000..8df62a390 --- /dev/null +++ b/docs/_sources/api/api_docs/modules/network_editor.rst.txt @@ -0,0 +1,62 @@ +:orphan: + +.. _ug-network_editor: + + +================================= +network_editor Module +================================= + +**The model can be edited by a list of EditRules to apply on nodes in a graph that represents the model during the model quantization. Each EditRule is a tuple of a filter and an action, where we apply the action on each node the filter matches** + +EditRule +========== +.. autoclass:: model_compression_toolkit.core.network_editor.EditRule + +Filters +========== + +.. autoclass:: model_compression_toolkit.core.network_editor.NodeTypeFilter + +| + +.. autoclass:: model_compression_toolkit.core.network_editor.NodeNameFilter + +| + +.. autoclass:: model_compression_toolkit.core.network_editor.NodeNameScopeFilter + + +Actions +========== + +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeFinalWeightsQuantConfigAttr + +| + +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeCandidatesWeightsQuantConfigAttr + +| + +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeFinalActivationQuantConfigAttr + +| + +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeCandidatesActivationQuantConfigAttr + +| + +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeQuantizationParamFunction + +| + +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeFinalWeightsQuantizationMethod + +| + +.. autoclass:: model_compression_toolkit.core.network_editor.ChangeCandidatesWeightsQuantizationMethod + +| + +.. 
autoclass:: model_compression_toolkit.core.network_editor.ChangeCandidatesActivationQuantizationMethod + diff --git a/docs/_sources/api/api_docs/modules/qat_config.rst.txt b/docs/_sources/api/api_docs/modules/qat_config.rst.txt new file mode 100644 index 000000000..9583aee88 --- /dev/null +++ b/docs/_sources/api/api_docs/modules/qat_config.rst.txt @@ -0,0 +1,26 @@ +:orphan: + +.. _ug-qat_config: + + +=========================================================== +qat_config Module +=========================================================== + + +TrainingMethod +================================ +**Select a QAT training method:** + +.. autoclass:: model_compression_toolkit.qat.TrainingMethod + + +| + + +QATConfig +=================================== +**Class to configure the quantization process of the model when quantizing using Quantization-aware Training (QAT):** + +.. autoclass:: model_compression_toolkit.qat.QATConfig + diff --git a/docs/_sources/api/api_docs/modules/quantization_config.rst.txt b/docs/_sources/api/api_docs/modules/quantization_config.rst.txt new file mode 100644 index 000000000..7997f6f1b --- /dev/null +++ b/docs/_sources/api/api_docs/modules/quantization_config.rst.txt @@ -0,0 +1,25 @@ +:orphan: + +.. _ug-quantization_config: + + +================================= +quantization_config Module +================================= + +QuantizationErrorMethod +========================== +**Enum to select a method for quantization parameters' selection:** + +.. autoclass:: model_compression_toolkit.core.QuantizationErrorMethod + + +| + + +QuantizationConfig +========================== +**Class to configure the quantization process of the model:** + +.. autoclass:: model_compression_toolkit.core.QuantizationConfig + diff --git a/docs/_sources/api/api_docs/modules/target_platform.rst.txt b/docs/_sources/api/api_docs/modules/target_platform.rst.txt new file mode 100644 index 000000000..a4e4831f5 --- /dev/null +++ b/docs/_sources/api/api_docs/modules/target_platform.rst.txt @@ -0,0 +1,357 @@ +:orphan: + +.. _ug-target_platform: + + +================================= +target_platform Module +================================= + +MCT can be configured to quantize and optimize models for different hardware settings. +For example, when using qnnpack backend for Pytorch model inference, Pytorch `quantization +configuration `_ +uses `per-tensor weights quantization `_ +for Conv2d, while when using tflite modeling, Tensorflow uses `per-channel weights quantization for +Conv2D `_. + +This can be addressed in MCT by using the target_platform module, that can configure different +parameters that are hardware-related, and the optimization process will use this to optimize the model accordingly. +Models for IMX500, TFLite and qnnpack can be observed `here `_, and can be used using :ref:`get_target_platform_capabilities function`. + +| + +.. include:: ../notes/tpc_note.rst + +| + +The object MCT should get called TargetPlatformCapabilities (or shortly TPC). +This diagram demonstrates the main components: + +.. image:: ../../../../images/tpc.jpg + :scale: 80% + +Now, we will explain about each component with examples. + +The first part is configuring the quantization method for both wights and activations of an operator. +Several methods can be used using QuantizationMethod API: + + +QuantizationMethod +========================== +Select a method to use during quantization: + +.. 
autoclass:: model_compression_toolkit.target_platform.QuantizationMethod
+
+
+|
+
+
+Using a quantization method (or methods, if the weights and activations of an operator are quantized differently),
+a quantization configuration for different operators can be created using OpQuantizationConfig:
+
+
+OpQuantizationConfig
+======================
+.. autoclass:: model_compression_toolkit.target_platform.OpQuantizationConfig
+
+|
+
+If, for example, we would like to quantize an operator's weights with 8 bits (and per-channel), its activations
+with 8 bits, and the quantization thresholds (for both weights and activations) must be power-of-two,
+we can create the OpQuantizationConfig:
+
+.. code-block:: python
+
+    op_qc_8bit = OpQuantizationConfig(
+        activation_quantization_method=QuantizationMethod.POWER_OF_TWO,
+        weights_quantization_method=QuantizationMethod.POWER_OF_TWO,
+        activation_n_bits=8,
+        weights_n_bits=8,
+        weights_per_channel_threshold=True,
+        enable_weights_quantization=True,
+        enable_activation_quantization=True
+    )
+
+|
+
+We will demonstrate later how to attach this OpQuantizationConfig to a specific operator.
+
+If an operator can be quantized in different ways (the simplest example is mixed-precision quantization),
+one can create a QuantizationConfigOptions instance to represent a set of possible quantization
+configuration options for an operator:
+
+
+QuantizationConfigOptions
+============================
+.. autoclass:: model_compression_toolkit.target_platform.QuantizationConfigOptions
+
+If a QuantizationConfigOptions is created with more than
+one OpQuantizationConfig option, a base_config must be passed to the QuantizationConfigOptions
+in order to support the model when MCT optimizes it without mixed precision.
+
+For example, suppose we would like to quantize an operator's weights with either 2, 4 or 8 bits (and, when
+using MCT's non-mixed-precision functions, quantize the operator with 8 bits). For this we can create new
+OpQuantizationConfigs based on the previously created OpQuantizationConfig,
+and gather them under a single QuantizationConfigOptions instance:
+
+.. code-block:: python
+
+    # To quantize a model using mixed-precision, create a QuantizationConfigOptions with more
+    # than one QuantizationConfig.
+    # In this example, we aim to quantize some operations' weights using 2, 4 or 8 bits.
+    op_qc_4bit = op_qc_8bit.clone_and_edit(weights_n_bits=4)
+    op_qc_2bit = op_qc_8bit.clone_and_edit(weights_n_bits=2)
+    mixed_precision_configuration_options = QuantizationConfigOptions([op_qc_8bit,
+                                                                       op_qc_4bit,
+                                                                       op_qc_2bit],
+                                                                      base_config=op_qc_8bit)
+
+|
+
+
+
+The main class for defining the hardware-related properties is called TargetPlatformModel. Using a TargetPlatformModel
+object we can create operator sets, configure how these operator sets will be quantized,
+group operators by common properties, and configure patterns of operators to fuse:
+
+
+TargetPlatformModel
+=======================
+.. autoclass:: model_compression_toolkit.target_platform.TargetPlatformModel
+
+
+A default QuantizationConfigOptions (containing a single OpQuantizationConfig) must be passed
+when instantiating a TargetPlatformModel object. It comes into use when MCT needs to optimize
+an operator that is not defined explicitly in the TargetPlatformModel. In this case, the OpQuantizationConfig
+in the default QuantizationConfigOptions guides MCT on how this operator should be optimized. For example:
+
+.. 
code-block:: python + + # Create a QuantizationConfigOptions with a single OpQuantizationConfig to use as + # a default configuration options. + default_configuration_options = QuantizationConfigOptions([op_qc_8bit]) + + # Create a TargetPlatformModel and set its default quantization config. + # This default configuration will be used for all operations + # unless specified otherwise: + my_model = TargetPlatformModel(default_configuration_options, name='my_model') + +| + +Then, we can start defining the model by creating OperatorsSets: + +OperatorsSet +================ +.. autoclass:: model_compression_toolkit.target_platform.OperatorsSet + +An OperatorsSet gathers group of operators that are labeled by a unique name and can be attached to a +QuantizationConfigOptions (so MCT will use these options to optimize operators from this set). +For example, if FullyConnected can be quantized using 2, 4, or 8 bits, we can create the next +OperatorsSet using the previously created mixed_precision_configuration_options: + +.. code-block:: python + + # Define operators set named "FullyConnected" and attach + # mixed_precision_configuration_options as its QuantizationConfigOptions: + fc_opset = OperatorsSet("FullyConnected", mixed_precision_configuration_options) + +| + +The QuantizationConfigOptions is optional. An OperatorsSet can be also created +without any attached QuantizationConfigOptions. Operators in this kind of OperatorsSets +are attached implicitly to the default QuantizationConfigOptions of the TargetPlatformModel +they are part of: + +.. code-block:: python + + # Define operators set named "Relu" and do not attach + # it any QuantizationConfigOptions: + relu_opset = OperatorsSet("Relu") + +| + +Another component of a TargetPlatformModel is Fusing. Fusing defines a list +of operators that should be combined and treated as a single operator, hence no +quantization is applied between them when they appear in a model: + + +Fusing +============== +.. autoclass:: model_compression_toolkit.target_platform.Fusing + +For example, to fuse the previously created two OperatorsSets fc_opset and +relu_opset we can create the next Fusing: + +.. code-block:: python + + # Combine multiple operators into a single operator to avoid quantization between + # them. To do this we define fusing patterns using the OperatorsSets that were created. + Fusing([fc_opset, relu_opset]) + +| + +Notice that the list of opsets must contain at least two OperatorSets. +Also notice that sublist of the OperatorsSet list that is passed to the Fusing, +will not be fused, unless another Fusing is created for that. For example, +if a model is defined to fuse three sequenced operators [FullyConnected, Relu, Add]: + +.. code-block:: python + + # In addition to the OperatorsSets we created, create new OperatorsSets for "add" ops: + add_opset = OperatorsSet("Add") + + # Fuse sequences of operators: + Fusing([fc_opset, relu_opset, add_opset]) + +| + +and the pre-trained model that MCT optimizes has a sequence of [fc_opset, relu_opset] +where the next operator is not an add_opset, the two operators [fc_opset, relu_opset] +will not be fused as the only defined fusing pattern is of the three OperatorsSets +[fc_opset, relu_opset, add_opset]. In order to fuse sequences of [fc_opset, relu_opset] +as well, a new Fusing should be defined: + +.. 
code-block:: python
+
+    # Fuse sequences of the three listed operators:
+    Fusing([fc_opset, relu_opset, add_opset])
+
+    # In addition, fuse sequences of the two listed operators:
+    Fusing([fc_opset, relu_opset])
+
+Now, if MCT encounters a sequence of [fc_opset, relu_opset], they will be fused regardless of the following operator.
+Sequences of [fc_opset, relu_opset, add_opset] will be fused as well, and
+the new Fusing of [fc_opset, relu_opset] will not affect them (but will affect patterns
+of [fc_opset, relu_opset], of course).
+
+When multiple operators should be fused in a similar way, an OperatorSetConcat can be used:
+
+OperatorSetConcat
+====================
+.. autoclass:: model_compression_toolkit.target_platform.OperatorSetConcat
+
+
+OperatorSetConcat gathers multiple OperatorsSet objects and can be specified in a fusing operators list.
+If, for example, we want to fuse the patterns [fc_opset, add_opset] and [fc_opset, relu_opset],
+we can either create two separate Fusing objects as demonstrated above, or an OperatorSetConcat
+can be used as follows:
+
+.. code-block:: python
+
+    # Concatenate two OperatorsSet objects to be treated similarly when fused:
+    activations_after_fc_to_fuse = OperatorSetConcat(relu_opset, add_opset)
+
+    # Create a fusing pattern using OperatorSetConcat. This is equivalent to defining two
+    # separate fusing patterns of: [fc_opset, relu_opset], [fc_opset, add_opset]
+    Fusing([fc_opset, activations_after_fc_to_fuse])
+
+|
+
+
+TargetPlatformModel Code Example
+===================================
+
+.. literalinclude:: ../../../../../model_compression_toolkit/target_platform_capabilities/tpc_models/imx500_tpc/v1/tp_model.py
+    :language: python
+    :lines: 15-156
+
+|
+
+After modeling the hardware that MCT should optimize for, this hardware model needs to be
+attached to specific framework information in order to associate the operators defined in the
+hardware model with layers in the framework's different representations.
+For example, if we created an OperatorsSet for the "Add" operator, in Tensorflow this operator
+can be used by two different layers: keras.layers.Add and tf.add.
+To attach a list of a framework's layers to an OperatorsSet that is defined in the TargetPlatformModel,
+an OperationsSetToLayers can be used:
+
+OperationsSetToLayers
+=========================
+.. autoclass:: model_compression_toolkit.target_platform.OperationsSetToLayers
+
+Using OperationsSetToLayers we can associate an OperatorsSet label with a list of the framework's layers:
+
+.. code-block:: python
+
+    import tensorflow as tf
+    from keras.layers import Add
+    OperationsSetToLayers("Add", [tf.add, Add])
+
+|
+
+This way, when MCT quantizes one of the layers tf.add or keras.layers.Add, it uses the QuantizationConfigOptions
+that is associated with the OperatorsSet that was labeled "Add" to optimize the layer.
+
+There are cases where an operator can be represented using a layer, but only when the layer has a specific configuration.
+
+For example, if the optimization should differ for bounded ReLU and unbounded ReLU, two OperatorsSets
+can be created, and the layers that will be attached to each OperatorsSet have to be filtered.
+For that, LayerFilterParams can be used:
+
+LayerFilterParams
+=========================
+.. autoclass:: model_compression_toolkit.target_platform.LayerFilterParams
+
+
+LayerFilterParams wraps a layer type together with conditions and key-value pairs,
+and can check whether a given layer matches the wrapped layer type, conditions and key-value pairs.
+If, for example, a distinction needs to be made between bounded-ReLU and unbounded-ReLU in Tensorflow,
+the following LayerFilterParams can be created:
+
+.. code-block:: python
+
+    from keras.layers import ReLU
+
+    # Create a LayerFilterParams that matches ReLU layers whose 'max_value'
+    # attribute is None
+    unbounded_relu_filter = LayerFilterParams(ReLU, max_value=None)
+
+    # Create a LayerFilterParams that matches ReLU layers whose 'max_value'
+    # attribute is not None
+    bounded_relu_filter = LayerFilterParams(ReLU, NotEq('max_value', None))
+
+|
+
+In this example, we used NotEq, which filters layers whose attribute has
+a value different from the value that was passed (in this case - None). More filters can be created
+and passed to the LayerFilterParams in order to create a more detailed filter.
+More filters and usage examples are detailed :ref:`here`.
+
+These LayerFilterParams instances can now be attached to OperatorsSets in the TargetPlatformModel
+using OperationsSetToLayers just like any other layer:
+
+.. code-block:: python
+
+    import tensorflow as tf
+    from keras.layers import ReLU, Activation
+
+    OperationsSetToLayers("ReLU", [tf.nn.relu,
+                                   tf.nn.relu6,
+                                   LayerFilterParams(ReLU, negative_slope=0.0),
+                                   LayerFilterParams(Activation, activation="relu")])
+
+|
+
+The mappings from OperatorsSets to lists of layers are part of a class called TargetPlatformCapabilities,
+which attaches the layer representations to OperatorsSets in a TargetPlatformModel instance:
+
+TargetPlatformCapabilities
+=============================
+.. autoclass:: model_compression_toolkit.target_platform.TargetPlatformCapabilities
+
+
+To create a TargetPlatformCapabilities, a TargetPlatformModel instance should be passed at
+TargetPlatformCapabilities initialization. Then, OperationsSetToLayers can be created and attached
+to the TargetPlatformCapabilities as in the following example:
+
+
+TargetPlatformCapabilities Code Example
+===========================================
+
+.. literalinclude:: ../../../../../model_compression_toolkit/target_platform_capabilities/tpc_models/imx500_tpc/v1/tp_model.py
+    :language: python
+    :lines: 15-86
+
+
+
+
diff --git a/docs/_sources/api/api_docs/modules/trainable_infrastructure.rst.txt b/docs/_sources/api/api_docs/modules/trainable_infrastructure.rst.txt
new file mode 100644
index 000000000..c514a3307
--- /dev/null
+++ b/docs/_sources/api/api_docs/modules/trainable_infrastructure.rst.txt
@@ -0,0 +1,83 @@
+:orphan:
+
+.. _ug-trainable_infrastructure:
+
+
+=================================
+trainable_infrastructure Module
+=================================
+
+The trainable infrastructure is a module containing quantization abstraction and quantizers for hardware-oriented model optimization tools.
+It provides the required abstraction for trainable quantization methods such as quantization-aware training.
+It utilizes the Inferable Quantizers Infrastructure provided by the `MCT Quantizers `_ package, which offers the required abstraction for emulating inference-time quantization.
+
+When using a trainable quantizer, each layer with quantized weights is wrapped with a "Quantization Wrapper" object,
+and each activation quantizer is stored in an "Activation Quantization Holder" object.
+Both components are provided by the MCT Quantizers package.
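For orientation, here is a minimal sketch (not part of the original patch) of how these wrapped components can be inspected on a quantized Keras model. It assumes a `quantized_exportable_model` produced as in the PTQ examples earlier in this patch, and that the `mct_quantizers` package exposes the `KerasQuantizationWrapper` and `KerasActivationQuantizationHolder` classes:

.. code-block:: python

    from mct_quantizers import KerasQuantizationWrapper, KerasActivationQuantizationHolder

    # List which layers of the quantized model wrap quantized weights
    # and which hold an activation quantizer.
    for layer in quantized_exportable_model.layers:
        if isinstance(layer, KerasQuantizationWrapper):
            print(f'{layer.name}: wraps a layer with quantized weights')
        elif isinstance(layer, KerasActivationQuantizationHolder):
            print(f'{layer.name}: holds an activation quantizer')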
+
+The quantizers in this module are built upon the "Inferable Quantizer" abstraction (from MCT Quantizers),
+and define the "Trainable Quantizer" framework,
+which contains learnable quantization parameters that can be optimized during training.
+
+Now, we will explain how a trainable quantizer is built and used.
+We start by explaining the basic building block of a trainable quantizer, and then explain how to initialize it using a configuration object.
+
+BaseKerasTrainableQuantizer
+==============================
+This class is a base class for trainable Keras quantizers. It validates the provided quantization config and defines an abstract function that any quantizer needs to implement.
+It adds get_config and from_config functions to the base quantizer to enable loading and saving the Keras model.
+
+.. autoclass:: model_compression_toolkit.trainable_infrastructure.BaseKerasTrainableQuantizer
+
+BasePytorchTrainableQuantizer
+==============================
+This class is a base class for trainable Pytorch quantizers. It validates the provided quantization config and defines an abstract function that any quantizer needs to implement.
+It adds get_config and from_config functions to the base quantizer to enable loading and saving the model.
+
+.. autoclass:: model_compression_toolkit.trainable_infrastructure.BasePytorchTrainableQuantizer
+
+TrainableQuantizerWeightsConfig
+=================================
+This configuration object contains the necessary attributes for configuring a weights trainable quantizer.
+
+.. autoclass:: model_compression_toolkit.trainable_infrastructure.TrainableQuantizerWeightsConfig
+
+For example, we can set a trainable weights quantizer with the following configuration:
+
+.. code-block:: python
+
+    from model_compression_toolkit.target_platform_capabilities.target_platform import QuantizationMethod
+    from model_compression_toolkit.constants import THRESHOLD, MIN_THRESHOLD
+
+    TrainableQuantizerWeightsConfig(weights_quantization_method=QuantizationMethod.SYMMETRIC,
+                                    weights_n_bits=8,
+                                    weights_quantization_params={THRESHOLD: 2.0},
+                                    enable_weights_quantization=True,
+                                    weights_channels_axis=3,
+                                    weights_per_channel_threshold=True,
+                                    min_threshold=MIN_THRESHOLD)
+
+
+|
+
+TrainableQuantizerActivationConfig
+====================================
+This configuration object contains the necessary attributes for configuring an activation trainable quantizer.
+
+.. autoclass:: model_compression_toolkit.trainable_infrastructure.TrainableQuantizerActivationConfig
+
+For example, we can set a trainable activation quantizer with the following configuration:
+
+.. code-block:: python
+
+    from model_compression_toolkit.target_platform_capabilities.target_platform import QuantizationMethod
+    from model_compression_toolkit.constants import THRESHOLD, MIN_THRESHOLD
+
+    TrainableQuantizerActivationConfig(activation_quantization_method=QuantizationMethod.UNIFORM,
+                                       activation_n_bits=8,
+                                       activation_quantization_params={THRESHOLD: 2.0},
+                                       enable_activation_quantization=True,
+                                       min_threshold=MIN_THRESHOLD)
+
+
+|
diff --git a/docs/_sources/api/api_docs/notes/tpc_note.rst.txt b/docs/_sources/api/api_docs/notes/tpc_note.rst.txt
new file mode 100644
index 000000000..c7352b8cb
--- /dev/null
+++ b/docs/_sources/api/api_docs/notes/tpc_note.rst.txt
@@ -0,0 +1,8 @@
+
+.. 
note:: + For now, some fields of :class:`~model_compression_toolkit.target_platform.OpQuantizationConfig` are ignored during + the optimization process (currently, the quantizer type, number of bits, and quantization enable/disable information + are in use). + + - MCT will use more information from :class:`~model_compression_toolkit.target_platform.OpQuantizationConfig`, in the future. + diff --git a/docs/_sources/index.rst.txt b/docs/_sources/index.rst.txt index bd91fe81f..2c4713162 100644 --- a/docs/_sources/index.rst.txt +++ b/docs/_sources/index.rst.txt @@ -41,7 +41,7 @@ A nightly version is also available (unstable): For using with Tensorflow please install the packages: `tensorflow `_ -`tensorflow-model-optimization `_ + For using with Pytorch please install the package: `torch `_ @@ -52,21 +52,21 @@ Supported Features Keras: -* :ref:`Post Training Quantization` [1] -* :ref:`Gradient based post training using knowledge distillation` -* :ref:`Mixed-precision post training quantization` -* :ref:`Init model for Quantization Aware Training` (Experimental) -* :ref:`Finalize model after Quantization Aware Training` (Experimental) -* :ref:`Structured Pruning` (Experimental) +* :ref:`Post Training Quantization` [1] +* :ref:`Gradient based post training using knowledge distillation` +* :ref:`Init model for Quantization Aware Training` (Experimental) +* :ref:`Finalize model after Quantization Aware Training` (Experimental) +* :ref:`Structured pruning` (Experimental) +* :ref:`Data generation` (Experimental) Pytorch: -* :ref:`Post Training Quantization` [1] -* :ref:`Gradient based post training using knowledge distillation` -* :ref:`Mixed-precision post training quantization` -* :ref:`Init model for Quantization Aware Training` (Experimental) -* :ref:`Finalize model after Quantization Aware Training` (Experimental) - +* :ref:`Post Training Quantization` [1] +* :ref:`Gradient based post training using knowledge distillation` +* :ref:`Init model for Quantization Aware Training` (Experimental) +* :ref:`Finalize model after Quantization Aware Training` (Experimental) +* :ref:`Structured pruning` (Experimental) +* :ref:`Data generation` (Experimental) Visualization: @@ -101,7 +101,7 @@ Please visit the MCT API documentation here :titlesonly: :maxdepth: 1 - API Documentation<../api/experimental_api_docs/index> + API Documentation<../api/api_docs/index> Technical Constraints ========================= diff --git a/docs/api/api_docs/classes/DefaultDict.html b/docs/api/api_docs/classes/DefaultDict.html index d99a59dbb..602dea4e2 100644 --- a/docs/api/api_docs/classes/DefaultDict.html +++ b/docs/api/api_docs/classes/DefaultDict.html @@ -2,12 +2,12 @@ - + - + - DefaultDict Class — MCT Documentation: ver 1.4.0 + DefaultDict Class — MCT Documentation: ver 1.11.0 @@ -15,6 +15,7 @@ + @@ -30,7 +31,7 @@

Navigation

  • index
  • - + @@ -41,18 +42,18 @@

    Navigation

    -

    DefaultDict Class

    +

    DefaultDict Class

    -class model_compression_toolkit.DefaultDict(known_dict, default_factory=None)
    +class model_compression_toolkit.DefaultDict(known_dict=None, default_value=None)

    Default dictionary. It wraps a dictionary given at initialization and return its values when requested. If the requested key is not presented at initial dictionary, -it returns the returned value a default factory (that is passed at initialization) generates.

+it returns the default value that was passed at initialization.

    -
    Parameters
    +
    Parameters:
      -
    • known_dict (Dict[Any, Any]) – Dictionary to wrap.

    • -
    • default_factory (Callable) – Callable to get default values when requested key is not in known_dict.

    • +
    • known_dict – Dictionary to wrap. If None is provided, initializes an empty dictionary.

    • +
    • default_value – default value when requested key is not in known_dict.

    @@ -62,19 +63,26 @@

    Navigation

    Get the value of the inner dictionary by the given key, If key is not in dictionary, it uses the default_factory to return a default value.

    -
    Parameters
    -

    key (Any) – Key to use in inner dictionary.

    +
    Parameters:
    +

    key – Key to use in inner dictionary.

    -
    Returns
    +
    Returns:

    Value of the inner dictionary by the given key, or a default value if not exist. If default_factory was not passed at initialization, it returns None.

    -
    Return type
    +
    Return type:

    Any

    +
    +
    +keys()
    +

    Get keys of known_dict +Returns: keys of known_dict
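For reference, a small usage sketch based only on the signature and methods documented above (known_dict, default_value, get() and keys()):

.. code-block:: python

    from model_compression_toolkit import DefaultDict

    # Wrap a known mapping; unknown keys fall back to the default value.
    kernel_axis = DefaultDict({'Conv2D': 3, 'Dense': 1}, default_value=-1)

    kernel_axis.get('Conv2D')   # 3
    kernel_axis.get('Unknown')  # -1 (the default value)
    kernel_axis.keys()          # keys of the wrapped dictionary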

    +
    +
    @@ -95,7 +103,7 @@

    Quick search

    - +
    @@ -106,13 +114,13 @@

    Navigation

  • index
  • - + \ No newline at end of file diff --git a/docs/api/api_docs/classes/FolderImageLoader.html b/docs/api/api_docs/classes/FolderImageLoader.html index 50ff1aac2..4da36875d 100644 --- a/docs/api/api_docs/classes/FolderImageLoader.html +++ b/docs/api/api_docs/classes/FolderImageLoader.html @@ -2,12 +2,12 @@ - + - + - Folder Image Loader API — MCT Documentation: ver 1.4.0 + Folder Image Loader API — MCT Documentation: ver 1.11.0 @@ -15,6 +15,7 @@ + @@ -30,7 +31,7 @@

    Navigation

  • index
  • - + @@ -41,21 +42,21 @@

    Navigation

    -

    Folder Image Loader API

    +

    Folder Image Loader API

    The following API can be used to load a folder of images to create a representative dataset for PTQ calibration

    -
    -class model_compression_toolkit.FolderImageLoader(folder, preprocessing, batch_size, file_types=FILETYPES)
    +
    +class model_compression_toolkit.core.FolderImageLoader(folder, preprocessing, batch_size, file_types=FILETYPES)

    Class for images loading, processing and retrieving.

    Initialize a FolderImageLoader object.

    -
    Parameters
    +
    Parameters:
      -
    • folder (str) – Path of folder with images to load. The path has to exist, and has to contain at

    • +
    • folder – Path of folder with images to load. The path has to exist, and has to contain at

    • image. (least one) –

    • -
    • preprocessing (List[Callable]) – List of functions to use when processing the images before retrieving them.

    • -
    • batch_size (int) – Number of images to retrieve each sample.

    • -
    • file_types (List[str]) – Files types to scan in the folder. Default list is FILETYPES

    • +
    • preprocessing – List of functions to use when processing the images before retrieving them.

    • +
    • batch_size – Number of images to retrieve each sample.

    • +
    • file_types – Files types to scan in the folder. Default list is FILETYPES

    @@ -74,8 +75,8 @@

    Navigation

    -
    -sample()
    +
    +sample()

    Returns: A sample of batch_size images from the folder the FolderImageLoader scanned.

    @@ -83,10 +84,10 @@

    Navigation

    -

    Default file types to scan

    +

    Default file types to scan

    -
    -model_compression_toolkit.common.data_loader.FILETYPES = ['jpeg', 'jpg', 'bmp', 'png']
    +
    +model_compression_toolkit.core.common.data_loader.FILETYPES = ['jpeg', 'jpg', 'bmp', 'png']
    @@ -115,7 +116,7 @@

    Quick search

    - +
    @@ -126,13 +127,13 @@

    Navigation

  • index
  • - + \ No newline at end of file diff --git a/docs/api/api_docs/classes/FrameworkInfo.html b/docs/api/api_docs/classes/FrameworkInfo.html index fc5e39ec1..1f4524d44 100644 --- a/docs/api/api_docs/classes/FrameworkInfo.html +++ b/docs/api/api_docs/classes/FrameworkInfo.html @@ -2,12 +2,12 @@ - + - + - FrameworkInfo Class — MCT Documentation: ver 1.4.0 + FrameworkInfo Class — MCT Documentation: ver 1.11.0 @@ -15,6 +15,7 @@ + @@ -30,7 +31,7 @@

    Navigation

  • index
  • - + @@ -41,11 +42,11 @@

    Navigation

    -

    FrameworkInfo Class

    +

    FrameworkInfo Class

    The following API can be used to pass MCT framework-related information to use when optimizing the network

    -
    -class model_compression_toolkit.FrameworkInfo(activation_quantizer_mapping, weights_quantizer_mapping, kernel_channels_mapping, activation_min_max_mapping, layer_min_max_mapping, kernel_ops_attributes_mapping, output_channel_index)
    +
    +class model_compression_toolkit.core.FrameworkInfo(activation_quantizer_mapping, kernel_channels_mapping, activation_min_max_mapping, layer_min_max_mapping, kernel_ops_attributes_mapping, out_channel_axis_mapping)

    A class to wrap all information about a specific framework the library needs to quantize a model. Specifically, FrameworkInfo holds lists of layers by how they should be quantized, and multiple mappings such as layer to it kernel channels indices, and a layer to its min/max values, etc. @@ -54,15 +55,14 @@

    Navigation

    activation_ops: Layers that their outputs should get quantized (e.g., Add, ReLU, etc.) no_quantization_ops:Layers that should not get quantized (e.g., Reshape, Transpose, etc.)

    -
    Parameters
    +
    Parameters:
    • activation_quantizer_mapping (Dict[QuantizationMethod, Callable]) – A dictionary mapping from QuantizationMethod to a quantization function.

    • -
    • weights_quantizer_mapping (Dict[QuantizationMethod, Callable]) – A dictionary mapping from QuantizationMethod to a quantization function.

    • kernel_channels_mapping (DefaultDict) – Dictionary from a layer to a tuple of its kernel in/out channels indices.

    • activation_min_max_mapping (Dict[str, tuple]) – Dictionary from an activation function to its min/max output values.

    • layer_min_max_mapping (Dict[Any, tuple]) – Dictionary from a layer to its min/max output values.

    • kernel_ops_attributes_mapping (DefaultDict) – Dictionary from a framework operator to a list of its weights attirbutes to quantize.

    • -
    • output_channel_index (ChannelAxis) – Index of output channels of the model’s layers (for computing statistics per-channel).

    • +
    • out_channel_axis_mapping (DefaultDict) – Dictionary of output channels of the model’s layers (for computing statistics per-channel).

    @@ -94,11 +94,11 @@

    Navigation


    -

    ChannelAxis

    +

    ChannelAxis

    Enum to select the output channels format in the model:

    -
    -class model_compression_toolkit.ChannelAxis(value)
    +
    +class model_compression_toolkit.core.ChannelAxis(value)

    Index of output channels axis:

    NHWC - Output channels index is last.

    NCHW - Output channels index is 1.

    @@ -133,7 +133,7 @@

    Quick search

    - +
    @@ -144,13 +144,13 @@

    Navigation

  • index
  • - + \ No newline at end of file diff --git a/docs/api/api_docs/classes/GradientPTQConfig.html b/docs/api/api_docs/classes/GradientPTQConfig.html index 37909e9f3..8c13eb544 100644 --- a/docs/api/api_docs/classes/GradientPTQConfig.html +++ b/docs/api/api_docs/classes/GradientPTQConfig.html @@ -2,12 +2,12 @@ - + - + - GradientPTQConfig Class — MCT Documentation: ver 1.4.0 + GradientPTQConfig Class — MCT Documentation: ver 1.11.0 @@ -15,6 +15,7 @@ + @@ -30,7 +31,7 @@

    Navigation

  • index
  • - + @@ -41,24 +42,52 @@

    Navigation

    -

    GradientPTQConfig Class

    +

    GradientPTQConfig Class

    The following API can be used to create a GradientPTQConfig instance which can be used for post training quantization using knowledge distillation from a teacher (float Keras model) to a student (the quantized Keras model)

    -
    -class model_compression_toolkit.GradientPTQConfig(n_iter, optimizer, loss=None, log_function=None, train_bias=True, lsb_change_per_bit_width=DefaultDict(MAX_LSBS_CHANGE_MAP, lambda : ...))
    -

    Configuration to use for quantization with GradientPTQ (experimental).

    +
    +class model_compression_toolkit.gptq.GradientPTQConfig(n_epochs, optimizer, optimizer_rest=None, loss=None, log_function=None, train_bias=True, rounding_type=RoundingType.SoftQuantizer, use_hessian_based_weights=True, optimizer_quantization_parameter=None, optimizer_bias=None, regularization_factor=REG_DEFAULT, hessian_weights_config=GPTQHessianScoresConfig(), gptq_quantizer_params_override=None)
    +

    Configuration to use for quantization with GradientPTQ.

    Initialize a GradientPTQConfig.

    -
    Parameters
    +
    Parameters:
      -
    • n_iter (int) – Number of iterations to train.

    • +
    • n_epochs (int) – Number of representative dataset epochs to train.

    • optimizer (Any) – Optimizer to use.

    • +
    • optimizer_rest (Any) – Optimizer to use for bias and quantizer parameters.

    • loss (Callable) – The loss to use. should accept 6 lists of tensors. 1st list of quantized tensors, the 2nd list is the float tensors, the 3rd is a list of quantized weights, the 4th is a list of float weights, the 5th and 6th lists are the mean and std of the tensors accordingly. see example in multiple_tensors_mse_loss

    • log_function (Callable) – Function to log information about the GPTQ process.

    • train_bias (bool) – Whether to update the bias during the training or not.

    • -
    • lsb_change_per_bit_width (dict) – Whether to update the bias during the training or not.

    • +
    • rounding_type (RoundingType) – An enum that defines the rounding type.

    • +
    • use_hessian_based_weights (bool) – Whether to use Hessian-based weights for weighted average loss.

    • +
    • optimizer_quantization_parameter (Any) – Optimizer to override the rest optimizer for quantizer parameters.

    • +
    • optimizer_bias (Any) – Optimizer to override the rest optimizer for bias.

    • +
    • regularization_factor (float) – A floating point number that defines the regularization factor.

    • +
    • hessian_weights_config (GPTQHessianScoresConfig) – A configuration that include all necessary arguments to run a computation of Hessian scores for the GPTQ loss.

    • +
    • gptq_quantizer_params_override (dict) – A dictionary of parameters to override in GPTQ quantizer instantiation. Defaults to None (no parameters).

    • +
    +
    +
    +
    + +
    +
    +

    GPTQHessianScoresConfig Class

    +

    The following API can be used to create a GPTQHessianScoresConfig instance which can be used to define necessary parameters for computing Hessian scores for the GPTQ loss function.

    +
    +
    +class model_compression_toolkit.gptq.GPTQHessianScoresConfig(hessians_num_samples=16, norm_scores=True, log_norm=True, scale_log_norm=False)
    +

    Configuration to use for computing the Hessian-based scores for GPTQ loss metric.

    +

    Initialize a GPTQHessianWeightsConfig.

    +
    +
    Parameters:
    +
      +
    • hessians_num_samples (int) – Number of samples to use for computing the Hessian-based scores.

    • +
    • norm_scores (bool) – Whether to normalize the returned scores of the weighted loss function (to get values between 0 and 1).

    • +
    • log_norm (bool) – Whether to use log normalization for the GPTQ Hessian-based scores.

    • +
    • scale_log_norm (bool) – Whether to scale the final vector of the Hessian-based scores.

    @@ -73,6 +102,14 @@

    Navigation

    @@ -93,13 +130,13 @@

    Navigation

  • index
  • - + \ No newline at end of file diff --git a/docs/api/api_docs/classes/PruningConfig.html b/docs/api/api_docs/classes/PruningConfig.html new file mode 100644 index 000000000..ead79c479 --- /dev/null +++ b/docs/api/api_docs/classes/PruningConfig.html @@ -0,0 +1,124 @@ + + + + + + + + + + Pruning Configuration — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Pruning Configuration

    +
    +
    +model_compression_toolkit.pruning.PruningConfig(num_score_approximations=32, importance_metric=ImportanceMetric.LFH, channels_filtering_strategy=ChannelsFilteringStrategy.GREEDY)
    +

    Configuration class for specifying how a neural network should be pruned.

    +
    +
    +model_compression_toolkit.pruning.num_score_approximations
    +

    The number of score approximations to perform +when calculating channel importance.

    +
    +
    Type:
    +

    int

    +
    +
    +
    + +
    +
    +model_compression_toolkit.pruning.importance_metric
    +

    The metric used to calculate channel importance.

    +
    +
    Type:
    +

    ImportanceMetric

    +
    +
    +
    + +
    +
    +model_compression_toolkit.pruning.channels_filtering_strategy
    +

    The strategy used to filter out channels.

    +
    +
    Type:
    +

    ChannelsFilteringStrategy
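A hedged usage sketch of this configuration follows; the keras_pruning_experimental call and its target_kpi / representative_data_gen keywords are assumptions based on the pruning pages added earlier in this patch:

.. code-block:: python

    import numpy as np
    import model_compression_toolkit as mct
    from keras.applications import ResNet50

    float_model = ResNet50()

    # Keep roughly half of the original float32 weights memory (in bytes).
    target_kpi = mct.core.KPI(weights_memory=float_model.count_params() * 4 * 0.5)

    pruning_config = mct.pruning.PruningConfig(num_score_approximations=32)

    pruned_model, pruning_info = mct.pruning.keras_pruning_experimental(
        model=float_model,
        target_kpi=target_kpi,
        representative_data_gen=lambda: [np.random.random((1, 224, 224, 3))],
        pruning_config=pruning_config)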

    +
    +
    +
    + +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/classes/PruningInfo.html b/docs/api/api_docs/classes/PruningInfo.html new file mode 100644 index 000000000..8564f1c77 --- /dev/null +++ b/docs/api/api_docs/classes/PruningInfo.html @@ -0,0 +1,117 @@ + + + + + + + + + + Pruning Information — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Pruning Information

    +
    +
    +model_compression_toolkit.pruning.PruningInfo(pruning_masks, importance_scores)
    +

    PruningInfo stores information about a pruned model, including the pruning masks +and importance scores for each layer. This class acts as a container for accessing +pruning-related metadata.

    +
    +
    +model_compression_toolkit.pruning.pruning_masks
    +

    Stores the pruning masks for each layer. +A pruning mask is an array where each element indicates whether the corresponding +channel or neuron has been pruned (0) or kept (1).

    +
    +
    Type:
    +

    Dict[BaseNode, np.ndarray]

    +
    +
    +
    + +
    +
    +model_compression_toolkit.pruning.importance_scores
    +

    Stores the importance scores for each layer. +Importance scores quantify the significance of each channel in the layer.

    +
    +
    Type:
    +

    Dict[BaseNode, np.ndarray]

    +
    +
    +
    + +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/index.html b/docs/api/api_docs/index.html index 5fda3e16d..93bc332e2 100644 --- a/docs/api/api_docs/index.html +++ b/docs/api/api_docs/index.html @@ -20,6 +20,7 @@ + + + + +
    +
    +
    +
    + +
    +

    Get DataGenerationConfig for Keras Models

    +
    +
    +model_compression_toolkit.data_generation.get_keras_data_generation_config(n_iter=DEFAULT_N_ITER, optimizer=Adam, data_gen_batch_size=DEFAULT_DATA_GEN_BS, initial_lr=DEFAULT_KERAS_INITIAL_LR, output_loss_multiplier=DEFAULT_KERAS_OUTPUT_LOSS_MULTIPLIER, scheduler_type=SchedulerType.REDUCE_ON_PLATEAU, bn_alignment_loss_type=BatchNormAlignemntLossType.L2_SQUARE, output_loss_type=OutputLossType.REGULARIZED_MIN_MAX_DIFF, data_init_type=DataInitType.Gaussian, layer_weighting_type=BNLayerWeightingType.AVERAGE, image_granularity=ImageGranularity.BatchWise, image_pipeline_type=ImagePipelineType.RANDOM_CROP_FLIP, image_normalization_type=ImageNormalizationType.KERAS_APPLICATIONS, extra_pixels=0, bn_layer_types=[BatchNormalization], clip_images=True, reflection=True)
    +

    Function to create a DataGenerationConfig object with the specified configuration parameters.

    +
    +
    Parameters:
    +
      +
    • n_iter (int) – Number of iterations for the data generation process.

    • +
    • optimizer (Optimizer) – The optimizer to use for the data generation process.

    • +
    • data_gen_batch_size (int) – Batch size for data generation.

    • +
    • initial_lr (float) – Initial learning rate for the optimizer.

    • +
    • output_loss_multiplier (float) – Multiplier for the output loss during optimization.

    • +
    • scheduler_type (SchedulerType) – The type of scheduler to use.

    • +
    • bn_alignment_loss_type (BatchNormAlignemntLossType) – The type of BatchNorm alignment loss to use.

    • +
    • output_loss_type (OutputLossType) – The type of output loss to use.

    • +
    • data_init_type (DataInitType) – The type of data initialization to use.

    • +
    • layer_weighting_type (BNLayerWeightingType) – The type of layer weighting to use.

    • +
    • image_granularity (ImageGranularity) – The granularity of the images for optimization.

    • +
    • image_pipeline_type (ImagePipelineType) – The type of image pipeline to use.

    • +
    • image_normalization_type (ImageNormalizationType) – The type of image normalization to use.

    • +
    • extra_pixels (int) – Extra pixels to add to the input image size. Defaults to 0.

    • +
    • bn_layer_types (List) – List of BatchNorm layer types to be considered for data generation.

    • +
    • clip_images (bool) – Whether to clip images during optimization.

    • +
    • reflection (bool) – Whether to use reflection during optimization.

    • +
    +
    +
    Returns:
    +

    Data generation configuration object.

    +
    +
    Return type:
    +

    DataGenerationConfig

    +
    +

    +
    +
    +
    + +
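Examples

For instance, a minimal usage sketch (the argument values below are illustrative assumptions; any parameter that is not passed keeps its default):

>>> import model_compression_toolkit as mct
>>> config = mct.data_generation.get_keras_data_generation_config(n_iter=500, data_gen_batch_size=32)

The resulting configuration object can then be passed to keras_data_generation_experimental.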
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/get_keras_gptq_config.html b/docs/api/api_docs/methods/get_keras_gptq_config.html index d40ae3122..8993aac0d 100644 --- a/docs/api/api_docs/methods/get_keras_gptq_config.html +++ b/docs/api/api_docs/methods/get_keras_gptq_config.html @@ -2,12 +2,12 @@ - + - + - Get GradientPTQConfig for Keras Models — MCT Documentation: ver 1.4.0 + Get GradientPTQConfig for Keras Models — MCT Documentation: ver 1.11.0 @@ -15,6 +15,7 @@ + @@ -30,7 +31,7 @@

    Navigation

  • index
  • - + @@ -41,39 +42,47 @@

    Navigation

    -

    Get GradientPTQConfig for Keras Models

    +

    Get GradientPTQConfig for Keras Models

    -
    -model_compression_toolkit.get_keras_gptq_config(n_iter, optimizer=tf.keras.optimizers.Adam(), loss=multiple_tensors_mse_loss, log_function=None, train_bias=True)
    -

    Create a GradientPTQConfig instance for Keras models.

    +
    +model_compression_toolkit.gptq.get_keras_gptq_config(n_epochs, optimizer=tf.keras.optimizers.Adam(learning_rate=LR_DEFAULT), optimizer_rest=tf.keras.optimizers.Adam(learning_rate=LR_REST_DEFAULT), loss=GPTQMultipleTensorsLoss(), log_function=None, use_hessian_based_weights=True, regularization_factor=REG_DEFAULT)
    +

    Create a GradientPTQConfigV2 instance for Keras models.

    -
    Parameters
    +
    Parameters:
      -
    • n_iter (int) – Number of iterations to fine-tune.

    • -
    • optimizer (OptimizerV2) – Keras optimizer to use for fine-tuning.

    • +
    • n_epochs (int) – Number of epochs for running the representative dataset for fine-tuning.

    • +
• optimizer (OptimizerV2) – Keras optimizer to use for fine-tuning of the auxiliary variable, with a default learning rate set to 0.2.

    • +
    • optimizer_rest (OptimizerV2) – Keras optimizer to use for fine-tuning of the bias variable.

• loss (Callable) – Loss to use during fine-tuning. It should accept 4 lists of tensors: the 1st is the quantized tensors, the 2nd is the float tensors, the 3rd is the quantized weights and the 4th is the float weights (see the sketch at the end of the examples below).

    • log_function (Callable) – Function to log information about the gptq process.

    • -
    • train_bias (bool) – Whether to update the bias during the the fine-tuning or not.

    • +
    • use_hessian_based_weights (bool) – Whether to use Hessian-based weights for weighted average loss.

    • +
    • regularization_factor (float) – A floating point number that defines the regularization factor.

    -
    Returns
    -

    a GradientPTQConfig object to use when fine-tuning the quantized model using gptq.

    +
    Returns:
    +

    a GradientPTQConfigV2 object to use when fine-tuning the quantized model using gptq.

    Examples

    -

    Create a GradientPTQConfig to run for 5 iteration:

    -
    >>> gptq_conf = get_keras_gptq_config(n_iter=5)
    +

    Import MCT and TensorFlow:

    +
    >>> import model_compression_toolkit as mct
    +>>> import tensorflow as tf
     
    -

    To disable the biases training, one may set train_bias to false (enabled by default):

    -
    >>> gptq_conf = get_keras_gptq_config(n_iter=5, train_bias=false)
    +

    Create a GradientPTQConfigV2 to run for 5 epochs:

    +
    >>> gptq_conf = mct.gptq.get_keras_gptq_config(n_epochs=5)
     

    Other Tensorflow optimizers can be passed:

    -
    >>> gptq_conf = get_keras_gptq_config(n_iter=3, optimizer=tf.keras.optimizers.Nadam())
    +
    >>> gptq_conf = mct.gptq.get_keras_gptq_config(n_epochs=3, optimizer=tf.keras.optimizers.Nadam())
     
    -

    The configuration can be passed to keras_post_training_quantization() in order to quantize a keras model using gptq.

    +

    The configuration can be passed to keras_post_training_quantization() in order to quantize a keras model using gptq.
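A custom loss callable can also be supplied. The following is only a sketch, assuming the 4-lists signature described in the loss parameter above (average MSE over the compared output tensors):

>>> def custom_gptq_loss(quant_outputs, float_outputs, quant_weights, float_weights):
>>>     # Hypothetical example: mean squared error averaged over the compared output tensors.
>>>     per_tensor_mse = [tf.reduce_mean(tf.square(q - f)) for q, f in zip(quant_outputs, float_outputs)]
>>>     return tf.add_n(per_tensor_mse) / len(per_tensor_mse)
>>> gptq_conf = mct.gptq.get_keras_gptq_config(n_epochs=5, loss=custom_gptq_loss)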

    +
    +
    Return type:
    +

    GradientPTQConfig

    +
    +
    @@ -94,7 +103,7 @@

    Quick search

    - +
    @@ -105,13 +114,13 @@

    Navigation

  • index
  • - + \ No newline at end of file diff --git a/docs/api/api_docs/methods/get_pytorch_data_generation_config.html b/docs/api/api_docs/methods/get_pytorch_data_generation_config.html new file mode 100644 index 000000000..2852b8509 --- /dev/null +++ b/docs/api/api_docs/methods/get_pytorch_data_generation_config.html @@ -0,0 +1,123 @@ + + + + + + + + + + Get DataGenerationConfig for Pytorch Models — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Get DataGenerationConfig for Pytorch Models

    +
    +
    +model_compression_toolkit.data_generation.get_pytorch_data_generation_config(n_iter=DEFAULT_N_ITER, optimizer=RAdam, data_gen_batch_size=DEFAULT_DATA_GEN_BS, initial_lr=DEFAULT_PYTORCH_INITIAL_LR, output_loss_multiplier=DEFAULT_PYTORCH_OUTPUT_LOSS_MULTIPLIER, scheduler_type=SchedulerType.REDUCE_ON_PLATEAU, bn_alignment_loss_type=BatchNormAlignemntLossType.L2_SQUARE, output_loss_type=OutputLossType.REGULARIZED_MIN_MAX_DIFF, data_init_type=DataInitType.Diverse, layer_weighting_type=BNLayerWeightingType.AVERAGE, image_granularity=ImageGranularity.AllImages, image_pipeline_type=ImagePipelineType.RANDOM_CROP, image_normalization_type=ImageNormalizationType.TORCHVISION, extra_pixels=0, bn_layer_types=DEFAULT_PYTORCH_BN_LAYER_TYPES, last_layer_types=DEFAULT_PYTORCH_LAST_LAYER_TYPES, clip_images=True, reflection=True)
    +

    Function to create a DataGenerationConfig object with the specified configuration parameters.

    +
    +
    Parameters:
    +
      +
    • n_iter (int) – Number of iterations for the data generation process.

    • +
    • optimizer (Optimizer) – The optimizer to use for the data generation process.

    • +
    • data_gen_batch_size (int) – Batch size for data generation.

    • +
    • initial_lr (float) – Initial learning rate for the optimizer.

    • +
    • output_loss_multiplier (float) – Multiplier for the output loss during optimization.

    • +
    • scheduler_type (SchedulerType) – The type of scheduler to use.

    • +
    • bn_alignment_loss_type (BatchNormAlignemntLossType) – The type of BatchNorm alignment loss to use.

    • +
    • output_loss_type (OutputLossType) – The type of output loss to use.

    • +
    • data_init_type (DataInitType) – The type of data initialization to use.

    • +
    • layer_weighting_type (BNLayerWeightingType) – The type of layer weighting to use.

    • +
    • image_granularity (ImageGranularity) – The granularity of the images for optimization.

    • +
    • image_pipeline_type (ImagePipelineType) – The type of image pipeline to use.

    • +
    • image_normalization_type (ImageNormalizationType) – The type of image normalization to use.

    • +
    • extra_pixels (int) – Extra pixels to add to the input image size. Defaults to 0.

    • +
    • bn_layer_types (List) – List of BatchNorm layer types to be considered for data generation.

    • +
    • last_layer_types (List) – List of layer types to be considered for the output loss.

    • +
    • clip_images (bool) – Whether to clip images during optimization.

    • +
    • reflection (bool) – Whether to use reflection during optimization.

    • +
    +
    +
    Returns:
    +

    Data generation configuration object.

    +
    +
    Return type:
    +

    DataGenerationConfig

    +
    +

    +
    +
    +
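Examples

For instance, a minimal usage sketch (the argument values below are illustrative assumptions; any parameter that is not passed keeps its default):

>>> import model_compression_toolkit as mct
>>> config = mct.data_generation.get_pytorch_data_generation_config(n_iter=500, data_gen_batch_size=32)

The resulting configuration object can then be passed to pytorch_data_generation_experimental.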
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/get_pytroch_gptq_config.html b/docs/api/api_docs/methods/get_pytroch_gptq_config.html new file mode 100644 index 000000000..5a8c0370a --- /dev/null +++ b/docs/api/api_docs/methods/get_pytroch_gptq_config.html @@ -0,0 +1,123 @@ + + + + + + + + + + Get GradientPTQConfig for Pytorch Models — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Get GradientPTQConfig for Pytorch Models

    +
    +
    +model_compression_toolkit.gptq.get_pytorch_gptq_config(n_epochs, optimizer=Adam([torch.Tensor([])], lr=LR_DEFAULT), optimizer_rest=Adam([torch.Tensor([])], lr=LR_REST_DEFAULT), loss=multiple_tensors_mse_loss, log_function=None, use_hessian_based_weights=True, regularization_factor=REG_DEFAULT)
    +

    Create a GradientPTQConfigV2 instance for Pytorch models.

    +
    +
    Parameters:
    +
      +
    • n_epochs (int) – Number of epochs for running the representative dataset for fine-tuning.

    • +
• optimizer (Optimizer) – Pytorch optimizer to use for fine-tuning of the auxiliary variable.

    • +
    • optimizer_rest (Optimizer) – Pytorch optimizer to use for fine-tuning of the bias variable.

    • +
• loss (Callable) – Loss to use during fine-tuning. It should accept 4 lists of tensors: the 1st is the quantized tensors, the 2nd is the float tensors, the 3rd is the quantized weights and the 4th is the float weights (see the sketch at the end of the examples below).

    • +
    • log_function (Callable) – Function to log information about the gptq process.

    • +
    • use_hessian_based_weights (bool) – Whether to use Hessian-based weights for weighted average loss.

    • +
    • regularization_factor (float) – A floating point number that defines the regularization factor.

    • +
    +
    +
    Returns:
    +

    a GradientPTQConfigV2 object to use when fine-tuning the quantized model using gptq.

    +
    +
    +

    Examples

    +

Import MCT and create a GradientPTQConfigV2 to run for 5 epochs:

    +
    >>> import model_compression_toolkit as mct
    +>>> gptq_conf = mct.gptq.get_pytorch_gptq_config(n_epochs=5)
    +
    +
    +

    Other PyTorch optimizers can be passed with dummy params:

    +
    >>> import torch
    +>>> gptq_conf = mct.gptq.get_pytorch_gptq_config(n_epochs=3, optimizer=torch.optim.Adam([torch.Tensor(1)]))
    +
    +
    +

    The configuration can be passed to pytorch_post_training_quantization() in order to quantize a pytorch model using gptq.
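A custom loss callable can also be supplied. The following is only a sketch, assuming the 4-lists signature described in the loss parameter above (average MSE over the compared output tensors):

>>> def custom_gptq_loss(quant_outputs, float_outputs, quant_weights, float_weights):
>>>     # Hypothetical example: mean squared error averaged over the compared output tensors.
>>>     return torch.stack([torch.mean((q - f) ** 2) for q, f in zip(quant_outputs, float_outputs)]).mean()
>>> gptq_conf = mct.gptq.get_pytorch_gptq_config(n_epochs=3, loss=custom_gptq_loss)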

    +
    +
    Return type:
    +

    GradientPTQConfig

    +
    +
    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/get_target_platform_capabilities.html b/docs/api/api_docs/methods/get_target_platform_capabilities.html index b6e0f7c69..f486b41f8 100644 --- a/docs/api/api_docs/methods/get_target_platform_capabilities.html +++ b/docs/api/api_docs/methods/get_target_platform_capabilities.html @@ -2,12 +2,12 @@ - + - + - Get TargetPlatformCapabilities — MCT Documentation: ver 1.4.0 + Get TargetPlatformCapabilities — MCT Documentation: ver 1.11.0 @@ -15,6 +15,7 @@ + @@ -30,7 +31,7 @@

    Navigation

  • index
  • - + @@ -41,39 +42,38 @@

    Navigation

    -

    Get TargetPlatformCapabilities

    +

    Get TargetPlatformCapabilities

    -model_compression_toolkit.get_target_platform_capabilities(fw_name, target_platform_name)
    +model_compression_toolkit.get_target_platform_capabilities(fw_name, target_platform_name, target_platform_version=None)

    Get a TargetPlatformCapabilities by the target platform model name and the framework name. For now, it supports frameworks ‘tensorflow’ and ‘pytorch’. For both of them -the target platform model can be ‘default’,’tflite’, or ‘qnnpack’.

    +the target platform model can be ‘default’, ‘imx500’, ‘tflite’, or ‘qnnpack’.

    -
    Parameters
    +
    Parameters:
      -
    • fw_name (str) – Framework name of the TargetPlatformCapabilities.

    • -
    • target_platform_name (str) – Target platform model name the model will use for inference.

    • +
    • fw_name – Framework name of the TargetPlatformCapabilities.

    • +
    • target_platform_name – Target platform model name the model will use for inference.

    • +
    • target_platform_version – Target platform capabilities version.

    -
    Returns
    +
    Returns:

    A TargetPlatformCapabilities object that models the hardware and attaches a framework information to it.

    -
    Return type
    -

    TargetPlatformCapabilities

    +
    Return type:
    +

    TargetPlatformCapabilities

    Note

    -

    For now, fusing operators information from TargetPlatformModel -is ignored during the optimization process (fusing still occurs but using an existing mechanism). -Also, parts of OpQuantizationConfig is ignored (currently, -the quantizer type, number of bits, and quantization enable/disable information is used during the -optimization process).

    +

    For now, some fields of OpQuantizationConfig are ignored during +the optimization process (currently, the quantizer type, number of bits, and quantization enable/disable information +are in use).
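Examples

A minimal usage sketch, fetching a TPC for each framework (target_platform_version is left as None, so the default version is used):

>>> import model_compression_toolkit as mct
>>> keras_tpc = mct.get_target_platform_capabilities('tensorflow', 'default')
>>> pytorch_tpc = mct.get_target_platform_capabilities('pytorch', 'imx500')

The returned object can be passed as target_platform_capabilities to the quantization and pruning APIs.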

    @@ -94,7 +94,7 @@

    Quick search

    - +
    @@ -105,13 +105,13 @@

    Navigation

  • index
  • - + \ No newline at end of file diff --git a/docs/api/api_docs/methods/keras_data_generation_experimental.html b/docs/api/api_docs/methods/keras_data_generation_experimental.html new file mode 100644 index 000000000..87ea353f0 --- /dev/null +++ b/docs/api/api_docs/methods/keras_data_generation_experimental.html @@ -0,0 +1,109 @@ + + + + + + + + + + Keras Data Generation — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Keras Data Generation

    +
    +
    +model_compression_toolkit.data_generation.keras_data_generation_experimental(model, n_images, output_image_size, data_generation_config)
    +

    Function to perform data generation using the provided Keras model and data generation configuration.

    +
    +
    Parameters:
    +
      +
    • model (Model) – Keras model to generate data for.

    • +
    • n_images (int) – Number of images to generate.

    • +
    • output_image_size (Tuple) – Size of the output images.

    • +
    • data_generation_config (DataGenerationConfig) – Configuration for data generation.

    • +
    +
    +
    Returns:
    +

    Finalized list containing generated images.

    +
    +
    Return type:
    +

    List[tf.Tensor]

    +
    +

    +
    +
    +
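Examples

A minimal usage sketch (the model choice, number of images and (224, 224) output size are illustrative assumptions):

>>> import model_compression_toolkit as mct
>>> from tensorflow.keras.applications.mobilenet_v2 import MobileNetV2
>>> model = MobileNetV2()
>>> config = mct.data_generation.get_keras_data_generation_config()
>>> images = mct.data_generation.keras_data_generation_experimental(model, n_images=32, output_image_size=(224, 224), data_generation_config=config)

The generated images can then be used, for example, as a representative dataset for post-training quantization.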
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/keras_gradient_post_training_quantization_experimental.html b/docs/api/api_docs/methods/keras_gradient_post_training_quantization_experimental.html new file mode 100644 index 000000000..1c7688ad3 --- /dev/null +++ b/docs/api/api_docs/methods/keras_gradient_post_training_quantization_experimental.html @@ -0,0 +1,165 @@ + + + + + + + + + + Keras Gradient Based Post Training Quantization — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Keras Gradient Based Post Training Quantization

    +
    +
    +model_compression_toolkit.gptq.keras_gradient_post_training_quantization(in_model, representative_data_gen, gptq_config, gptq_representative_data_gen=None, target_kpi=None, core_config=CoreConfig(), fw_info=DEFAULT_KERAS_INFO, target_platform_capabilities=DEFAULT_KERAS_TPC)
    +

Quantize a trained Keras model using post-training quantization. The model is quantized using +symmetric constraint quantization thresholds (power of two). +The model is first optimized using several transformations (e.g. BatchNormalization folding to +preceding layers). Then, using a given dataset, statistics (e.g. min/max, histogram, etc.) are +being collected for each layer’s output (and input, depending on the quantization configuration). +For each possible bit width (per layer) a threshold is then calculated using the collected +statistics. Then, if given a mixed precision config in the core_config, using an ILP solver we find +a mixed-precision configuration, and set a bit-width for each layer. The model is then quantized +(both coefficients and activations by default). +In order to limit the maximal model’s size, a target KPI needs to be passed after weights_memory +is set (in bytes). +Then, the quantized weights are optimized using gradient based post +training quantization by comparing points between the float and quantized models, and minimizing the observed +loss.

    +
    +
    Parameters:
    +
      +
    • in_model (Model) – Keras model to quantize.

    • +
    • representative_data_gen (Callable) – Dataset used for calibration.

    • +
    • gptq_config (GradientPTQConfig) – Configuration for using gptq (e.g. optimizer).

    • +
    • gptq_representative_data_gen (Callable) – Dataset used for GPTQ training. If None defaults to representative_data_gen

    • +
    • target_kpi (KPI) – KPI object to limit the search of the mixed-precision configuration as desired.

    • +
    • core_config (CoreConfig) – Configuration object containing parameters of how the model should be quantized, including mixed precision parameters.

    • +
    • fw_info (FrameworkInfo) – Information needed for quantization about the specific framework (e.g., kernel channels indices, groups of layers by how they should be quantized, etc.). Default Keras info

    • +
    • target_platform_capabilities (TargetPlatformCapabilities) – TargetPlatformCapabilities to optimize the Keras model according to.

    • +
    +
    +
    Returns:
    +

    A quantized model and information the user may need to handle the quantized model.

    +
    +
    +

    Examples

    +

    Import a Keras model:

    +
    >>> from tensorflow.keras.applications.mobilenet import MobileNet
    +>>> model = MobileNet()
    +
    +
    +

    Create a random dataset generator, for required number of calibration iterations (num_calibration_batches): +In this example a random dataset of 10 batches each containing 4 images is used.

    +
    >>> import numpy as np
    +>>> num_calibration_batches = 10
    +>>> def repr_datagen():
    +>>>     for _ in range(num_calibration_batches):
    +>>>         yield [np.random.random((4, 224, 224, 3))]
    +
    +
    +

    Create an MCT core config, containing the quantization configuration:

    +
    >>> config = mct.core.CoreConfig()
    +
    +
    +

    If mixed precision is desired, create an MCT core config with a mixed-precision configuration, to quantize a model +with different bitwidths for different layers. +The candidates bitwidth for quantization should be defined in the target platform model:

    +
    >>> config = mct.core.CoreConfig(mixed_precision_config=mct.core.MixedPrecisionQuantizationConfig(num_of_images=1))
    +
    +
    +

    For mixed-precision set a target KPI object: +Create a KPI object to limit our returned model’s size. Note that this value affects only coefficients +that should be quantized (for example, the kernel of Conv2D in Keras will be affected by this value, +while the bias will not):

    +
    >>> kpi = mct.core.KPI(model.count_params() * 0.75)  # About 0.75 of the model size when quantized with 8 bits.
    +
    +
    +

    Create GPTQ config:

    +
    >>> gptq_config = mct.gptq.get_keras_gptq_config(n_epochs=1)
    +
    +
    +

    Pass the model with the representative dataset generator to get a quantized model:

    +
    >>> quantized_model, quantization_info = mct.gptq.keras_gradient_post_training_quantization(model, repr_datagen, gptq_config, target_kpi=kpi, core_config=config)
    +
    +
    +
    +
    Return type:
    +

    Tuple[Model, UserInformation]

    +
    +
    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/keras_kpi_data_experimental.html b/docs/api/api_docs/methods/keras_kpi_data_experimental.html new file mode 100644 index 000000000..d136d94de --- /dev/null +++ b/docs/api/api_docs/methods/keras_kpi_data_experimental.html @@ -0,0 +1,126 @@ + + + + + + + + + + Get KPI information for Keras Models — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Get KPI information for Keras Models

    +
    +
    +model_compression_toolkit.core.keras_kpi_data(in_model, representative_data_gen, core_config=CoreConfig(mixed_precision_config=MixedPrecisionQuantizationConfig()), fw_info=DEFAULT_KERAS_INFO, target_platform_capabilities=KERAS_DEFAULT_TPC)
    +

Computes KPI data that can be used to calculate the desired target KPI for mixed-precision quantization. +Builds the computation graph from the given model and hardware modeling (target platform capabilities), and uses it to compute the KPI data.

    +
    +
    Parameters:
    +
      +
    • in_model (Model) – Keras model to quantize.

    • +
    • representative_data_gen (Callable) – Dataset used for calibration.

    • +
    • core_config (CoreConfig) – CoreConfig containing parameters for quantization and mixed precision of how the model should be quantized.

    • +
    • fw_info (FrameworkInfo) – Information needed for quantization about the specific framework (e.g., kernel channels indices, groups of layers by how they should be quantized, etc.). Default Keras info

    • +
    • target_platform_capabilities (TargetPlatformCapabilities) – TargetPlatformCapabilities to optimize the Keras model according to.

    • +
    +
    +
    Returns:
    +

    A KPI object with total weights parameters sum and max activation tensor.

    +
    +
    +

    Examples

    +

    Import a Keras model:

    +
    >>> from tensorflow.keras.applications.mobilenet import MobileNet
    +>>> model = MobileNet()
    +
    +
    +

    Create a random dataset generator:

    +
    >>> import numpy as np
    +>>> def repr_datagen(): yield [np.random.random((1, 224, 224, 3))]
    +
    +
    +

    Import MCT and call for KPI data calculation:

    +
    >>> import model_compression_toolkit as mct
    +>>> kpi_data = mct.core.keras_kpi_data(model, repr_datagen)
    +
    +
    +
    +
    Return type:
    +

    KPI

    +
    +
    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/keras_load_quantizad_model.html b/docs/api/api_docs/methods/keras_load_quantizad_model.html new file mode 100644 index 000000000..bf405bc93 --- /dev/null +++ b/docs/api/api_docs/methods/keras_load_quantizad_model.html @@ -0,0 +1,101 @@ + + + + + + + + + + Load Quantized Keras Model — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Load Quantized Keras Model

    +
    +
    +model_compression_toolkit.keras_load_quantized_model(filepath, custom_objects=None, compile=True, options=None)
    +

This function wraps the Keras model loading and adds the trainable quantizer classes to its custom objects.

    +
    +
    Parameters:
    +
      +
    • filepath – the model file path.

    • +
    • custom_objects – Additional custom objects

    • +
    • compile – Boolean, whether to compile the model after loading.

    • +
    • options – Optional tf.saved_model.LoadOptions object that specifies options for loading from SavedModel.

    • +
    +
    +
    +

    Returns: A keras Model

    +
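Examples

A minimal usage sketch (the file path is a hypothetical placeholder for a previously saved quantized model):

>>> import model_compression_toolkit as mct
>>> quantized_model = mct.keras_load_quantized_model('quantized_model.h5')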
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/keras_post_training_quantization_experimental.html b/docs/api/api_docs/methods/keras_post_training_quantization_experimental.html new file mode 100644 index 000000000..ce57934e9 --- /dev/null +++ b/docs/api/api_docs/methods/keras_post_training_quantization_experimental.html @@ -0,0 +1,156 @@ + + + + + + + + + + Keras Post Training Quantization — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Keras Post Training Quantization

    +
    +
    +model_compression_toolkit.ptq.keras_post_training_quantization(in_model, representative_data_gen, target_kpi=None, core_config=CoreConfig(), target_platform_capabilities=DEFAULT_KERAS_TPC)
    +

Quantize a trained Keras model using post-training quantization. The model is quantized using +symmetric constraint quantization thresholds (power of two). +The model is first optimized using several transformations (e.g. BatchNormalization folding to +preceding layers). Then, using a given dataset, statistics (e.g. min/max, histogram, etc.) are +being collected for each layer’s output (and input, depending on the quantization configuration). +For each possible bit width (per layer) a threshold is then calculated using the collected +statistics. Then, if given a mixed precision config in the core_config, using an ILP solver we find +a mixed-precision configuration, and set a bit-width for each layer. The model is then quantized +(both coefficients and activations by default). +In order to limit the maximal model’s size, a target KPI needs to be passed after weights_memory +is set (in bytes).

    +
    +
    Parameters:
    +
      +
    • in_model (Model) – Keras model to quantize.

    • +
    • representative_data_gen (Callable) – Dataset used for calibration.

    • +
    • target_kpi (KPI) – KPI object to limit the search of the mixed-precision configuration as desired.

    • +
    • core_config (CoreConfig) – Configuration object containing parameters of how the model should be quantized, including mixed precision parameters.

    • +
    • target_platform_capabilities (TargetPlatformCapabilities) – TargetPlatformCapabilities to optimize the Keras model according to.

    • +
    +
    +
    Returns:
    +

    A quantized model and information the user may need to handle the quantized model.

    +
    +
    +

    Examples

    +

    Import MCT:

    +
    >>> import model_compression_toolkit as mct
    +
    +
    +

    Import a Keras model:

    +
    >>> from tensorflow.keras.applications.mobilenet_v2 import MobileNetV2
    +>>> model = MobileNetV2()
    +
    +
    +

    Create a random dataset generator, for required number of calibration iterations (num_calibration_batches): +In this example a random dataset of 10 batches each containing 4 images is used.

    +
    >>> import numpy as np
    +>>> num_calibration_batches = 10
    +>>> def repr_datagen():
    +>>>     for _ in range(num_calibration_batches):
    +>>>         yield [np.random.random((4, 224, 224, 3))]
    +
    +
    +

    Create a MCT core config, containing the quantization configuration:

    +
    >>> config = mct.core.CoreConfig()
    +
    +
    +

    If mixed precision is desired, create a MCT core config with a mixed-precision configuration, to quantize a model with different bitwidths for different layers. +The candidates bitwidth for quantization should be defined in the target platform model. +In this example we use 1 image to search mixed-precision configuration:

    +
    >>> config = mct.core.CoreConfig(mixed_precision_config=mct.core.MixedPrecisionQuantizationConfig(num_of_images=1))
    +
    +
    +

    For mixed-precision set a target KPI object: +Create a KPI object to limit our returned model’s size. Note that this value affects only coefficients +that should be quantized (for example, the kernel of Conv2D in Keras will be affected by this value, +while the bias will not):

    +
    >>> kpi = mct.core.KPI(model.count_params() * 0.75)  # About 0.75 of the model size when quantized with 8 bits.
    +
    +
    +

    Pass the model, the representative dataset generator, the configuration and the target KPI to get a +quantized model:

    +
    >>> quantized_model, quantization_info = mct.ptq.keras_post_training_quantization(model, repr_datagen, kpi, core_config=config)
    +
    +
    +

    For more configuration options, please take a look at our API documentation.

    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/keras_pruning_experimental.html b/docs/api/api_docs/methods/keras_pruning_experimental.html new file mode 100644 index 000000000..828299501 --- /dev/null +++ b/docs/api/api_docs/methods/keras_pruning_experimental.html @@ -0,0 +1,154 @@ + + + + + + + + + + Keras Structured Pruning — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Keras Structured Pruning

    +
    +
    +model_compression_toolkit.pruning.keras_pruning_experimental(model, target_kpi, representative_data_gen, pruning_config=PruningConfig(), target_platform_capabilities=DEFAULT_KERAS_TPC)
    +

    Perform structured pruning on a Keras model to meet a specified target KPI. +This function prunes the provided model according to the target KPI by grouping and pruning +channels based on each layer’s SIMD configuration in the Target Platform Capabilities (TPC). +By default, the importance of each channel group is determined using the Label-Free Hessian +(LFH) method, assessing each channel’s sensitivity to the Hessian of the loss function. +This pruning strategy considers groups of channels together for a more hardware-friendly +architecture. The process involves analyzing the model with a representative dataset to +identify groups of channels that can be removed with minimal impact on performance.

    +

    Notice that the pruned model must be retrained to recover the compressed model’s performance.

    +
    +
    Parameters:
    +
      +
    • model (Model) – The original Keras model to be pruned.

    • +
    • target_kpi (KPI) – The target Key Performance Indicators to be achieved through pruning.

    • +
    • representative_data_gen (Callable) – A function to generate representative data for pruning analysis.

    • +
    • pruning_config (PruningConfig) – Configuration settings for the pruning process. Defaults to standard config.

    • +
    • target_platform_capabilities (TargetPlatformCapabilities) – Platform-specific constraints and capabilities. +Defaults to DEFAULT_KERAS_TPC.

    • +
    +
    +
    Returns:
    +

    A tuple containing the pruned Keras model and associated pruning information.

    +
    +
    Return type:
    +

    Tuple[Model, PruningInfo]

    +
    +
    +

    Examples

    +

    Import MCT:

    +
    >>> import model_compression_toolkit as mct
    +
    +
    +

    Import a Keras model:

    +
    >>> from tensorflow.keras.applications.resnet50 import ResNet50
    +>>> model = ResNet50()
    +
    +
    +

    Create a random dataset generator:

    +
    >>> import numpy as np
    +>>> def repr_datagen(): yield [np.random.random((1, 224, 224, 3))]
    +
    +
    +

    Define a target KPI for pruning. +Here, we aim to reduce the memory footprint of weights by 50%, assuming the model weights +are represented in float32 data type (thus, each parameter is represented using 4 bytes):

    +
    >>> dense_nparams = sum([l.count_params() for l in model.layers])
    +>>> target_kpi = mct.KPI(weights_memory=dense_nparams * 4 * 0.5)
    +
    +
    +

    Optionally, define a pruning configuration. num_score_approximations can be passed +to configure the number of importance scores that will be calculated for each channel. +A higher value for this parameter yields more precise score approximations but also +extends the duration of the pruning process:

    +
    >>> pruning_config = mct.pruning.PruningConfig(num_score_approximations=1)
    +
    +
    +

    Perform pruning:

    +
    >>> pruned_model, pruning_info = mct.pruning.keras_pruning_experimental(model=model, target_kpi=target_kpi, representative_data_gen=repr_datagen, pruning_config=pruning_config)
    +
    +
    +
    +
    Return type:
    +

    Tuple[Model, PruningInfo]

    +
    +
    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/keras_quantization_aware_training_finalize.html b/docs/api/api_docs/methods/keras_quantization_aware_training_finalize.html new file mode 100644 index 000000000..0d3fba485 --- /dev/null +++ b/docs/api/api_docs/methods/keras_quantization_aware_training_finalize.html @@ -0,0 +1,144 @@ + + + + + + + + + + Keras Quantization Aware Training Model Finalize — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Keras Quantization Aware Training Model Finalize

    +
    +
    +model_compression_toolkit.qat.keras_quantization_aware_training_finalize_experimental(in_model)
    +

    Convert a model fine-tuned by the user (Trainable quantizers) to a model with Inferable quantizers.

    +
    +
    Parameters:
    +

    in_model (Model) – Keras model to replace TrainableQuantizer with InferableQuantizer

    +
    +
    Returns:
    +

    A quantized model with Inferable quantizers

    +
    +
    +

    Examples

    +

    Import MCT:

    +
    >>> import model_compression_toolkit as mct
    +
    +
    +

    Import a Keras model:

    +
    >>> from tensorflow.keras.applications.mobilenet_v2 import MobileNetV2
    +>>> model = MobileNetV2()
    +
    +
    +

    Create a random dataset generator:

    +
    >>> import numpy as np
    +>>> def repr_datagen(): yield [np.random.random((1, 224, 224, 3))]
    +
    +
    +

    Create a MCT core config, containing the quantization configuration:

    +
    >>> config = mct.core.CoreConfig()
    +
    +
    +

    If mixed precision is desired, create a MCT core config with a mixed-precision configuration, to quantize a model with different bitwidths for different layers. +The candidates bitwidth for quantization should be defined in the target platform model:

    +
    >>> config = mct.core.CoreConfig(mixed_precision_config=MixedPrecisionQuantizationConfig())
    +
    +
    +

    For mixed-precision set a target KPI object: +Create a KPI object to limit our returned model’s size. Note that this value affects only coefficients +that should be quantized (for example, the kernel of Conv2D in Keras will be affected by this value, +while the bias will not):

    +
    >>> kpi = mct.core.KPI(model.count_params() * 0.75)  # About 0.75 of the model size when quantized with 8 bits.
    +
    +
    +

    Pass the model, the representative dataset generator, the configuration and the target KPI to get a +quantized model:

    +
    >>> quantized_model, quantization_info, custom_objects = mct.qat.keras_quantization_aware_training_init_experimental(model, repr_datagen, kpi, core_config=config)
    +
    +
    +

    Use the quantized model for fine-tuning. For loading the model from file, use the custom_objects dictionary:

    +
    >>> quantized_model = tf.keras.models.load_model(model_file, custom_objects=custom_objects)
    +>>> quantized_model = mct.qat.keras_quantization_aware_training_finalize_experimental(quantized_model)
    +
    +
    +
    +
    Return type:
    +

    Model

    +
    +
    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/keras_quantization_aware_training_init.html b/docs/api/api_docs/methods/keras_quantization_aware_training_init.html new file mode 100644 index 000000000..eb840041f --- /dev/null +++ b/docs/api/api_docs/methods/keras_quantization_aware_training_init.html @@ -0,0 +1,165 @@ + + + + + + + + + + Keras Quantization Aware Training Model Init — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Keras Quantization Aware Training Model Init

    +
    +
    +model_compression_toolkit.qat.keras_quantization_aware_training_init_experimental(in_model, representative_data_gen, target_kpi=None, core_config=CoreConfig(), qat_config=QATConfig(), fw_info=DEFAULT_KERAS_INFO, target_platform_capabilities=DEFAULT_KERAS_TPC)
    +

Prepare a trained Keras model for quantization aware training. First the model quantization is optimized +with post-training quantization, then the model layers are wrapped with QuantizeWrappers. The model is +quantized using symmetric quantization thresholds (power of two). +The model is first optimized using several transformations (e.g. BatchNormalization folding to +preceding layers). Then, using a given dataset, statistics (e.g. min/max, histogram, etc.) are +being collected for each layer’s output (and input, depending on the quantization configuration). +For each possible bit width (per layer) a threshold is then calculated using the collected +statistics. Then, if given a mixed precision config in the core_config, using an ILP solver we find +a mixed-precision configuration, and set a bit-width for each layer. The model is built with fake_quant +nodes for quantizing activation. Weights are kept as float and are quantized online while training by the +quantization wrapper’s weight quantizer. +In order to limit the maximal model’s size, a target KPI needs to be passed after weights_memory +is set (in bytes).

    +
    +
    Parameters:
    +
      +
    • in_model (Model) – Keras model to quantize.

    • +
    • representative_data_gen (Callable) – Dataset used for initial calibration.

    • +
    • target_kpi (KPI) – KPI object to limit the search of the mixed-precision configuration as desired.

    • +
    • core_config (CoreConfig) – Configuration object containing parameters of how the model should be quantized, including mixed precision parameters.

    • +
    • qat_config (QATConfig) – QAT configuration

    • +
    • fw_info (FrameworkInfo) – Information needed for quantization about the specific framework (e.g., kernel channels indices, groups of layers by how they should be quantized, etc.). Default Keras info

    • +
    • target_platform_capabilities (TargetPlatformCapabilities) – TargetPlatformCapabilities to optimize the Keras model according to.

    • +
    +
    +
    Returns:
    +

A quantized model. +User information that may be needed to handle the quantized model. +Custom-Objects dictionary for loading the saved Keras model.

    +
    +
    +

    Examples

    +

    Import MCT:

    +
    >>> import model_compression_toolkit as mct
    +
    +
    +

    Import a Keras model:

    +
    >>> from tensorflow.keras.applications.mobilenet_v2 import MobileNetV2
    +>>> model = MobileNetV2()
    +
    +
    +

    Create a random dataset generator, for required number of calibration iterations (num_calibration_batches): +In this example a random dataset of 10 batches each containing 4 images is used.

    +
    >>> import numpy as np
    +>>> num_calibration_batches = 10
    +>>> def repr_datagen():
    +>>>     for _ in range(num_calibration_batches):
    +>>>         yield [np.random.random((4, 224, 224, 3))]
    +
    +
    +

    Create a MCT core config, containing the quantization configuration:

    +
    >>> config = mct.core.CoreConfig()
    +
    +
    +

    If mixed precision is desired, create a MCT core config with a mixed-precision configuration, to quantize a model with different bitwidths for different layers. +The candidates bitwidth for quantization should be defined in the target platform model:

    +
    >>> config = mct.core.CoreConfig(mixed_precision_config=MixedPrecisionQuantizationConfig())
    +
    +
    +

    For mixed-precision set a target KPI object: +Create a KPI object to limit our returned model’s size. Note that this value affects only coefficients +that should be quantized (for example, the kernel of Conv2D in Keras will be affected by this value, +while the bias will not):

    +
    >>> kpi = mct.core.KPI(model.count_params() * 0.75)  # About 0.75 of the model size when quantized with 8 bits.
    +
    +
    +

    Pass the model, the representative dataset generator, the configuration and the target KPI to get a +quantized model:

    +
    >>> quantized_model, quantization_info, custom_objects = mct.qat.keras_quantization_aware_training_init_experimental(model, repr_datagen, kpi, core_config=config)
    +
    +
    +

    Use the quantized model for fine-tuning. For loading the model from file, use the custom_objects dictionary:

    +
    >>> quantized_model = tf.keras.models.load_model(model_file, custom_objects=custom_objects)
    +
    +
    +

    For more configuration options, please take a look at our API documentation.

    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/pytorch_data_generation_experimental.html b/docs/api/api_docs/methods/pytorch_data_generation_experimental.html new file mode 100644 index 000000000..36690dde9 --- /dev/null +++ b/docs/api/api_docs/methods/pytorch_data_generation_experimental.html @@ -0,0 +1,109 @@ + + + + + + + + + + Pytorch Data Generation — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Pytorch Data Generation

    +
    +
    +model_compression_toolkit.data_generation.pytorch_data_generation_experimental(model, n_images, output_image_size, data_generation_config)
    +

    Function to perform data generation using the provided model and data generation configuration.

    +
    +
    Parameters:
    +
      +
    • model (Module) – PyTorch model to generate data for.

    • +
    • n_images (int) – Number of images to generate.

    • +
    • output_image_size (Tuple) – Size of the output images.

    • +
    • data_generation_config (DataGenerationConfig) – Configuration for data generation.

    • +
    +
    +
    Returns:
    +

    Finalized list containing generated images.

    +
    +
    Return type:
    +

    List[Tensor]

    +
    +

    +
    +
    +
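Examples

A minimal usage sketch (the model choice, number of images and (224, 224) output size are illustrative assumptions):

>>> import model_compression_toolkit as mct
>>> from torchvision.models import mobilenet_v2
>>> model = mobilenet_v2(pretrained=True)
>>> config = mct.data_generation.get_pytorch_data_generation_config()
>>> images = mct.data_generation.pytorch_data_generation_experimental(model, n_images=32, output_image_size=(224, 224), data_generation_config=config)

The generated images can then be used, for example, as a representative dataset for post-training quantization.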
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/pytorch_gradient_post_training_quantization_experimental.html b/docs/api/api_docs/methods/pytorch_gradient_post_training_quantization_experimental.html new file mode 100644 index 000000000..e5f7c2020 --- /dev/null +++ b/docs/api/api_docs/methods/pytorch_gradient_post_training_quantization_experimental.html @@ -0,0 +1,146 @@ + + + + + + + + + + Pytorch Gradient Based Post Training Quantization — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Pytorch Gradient Based Post Training Quantization

    +
    +
    +model_compression_toolkit.gptq.pytorch_gradient_post_training_quantization(model, representative_data_gen, target_kpi=None, core_config=CoreConfig(), gptq_config=None, gptq_representative_data_gen=None, target_platform_capabilities=DEFAULT_PYTORCH_TPC)
    +

    Quantize a trained Pytorch module using post-training quantization. +By default, the module is quantized using a symmetric constraint quantization thresholds +(power of two) as defined in the default TargetPlatformCapabilities. +The module is first optimized using several transformations (e.g. BatchNormalization folding to +preceding layers). Then, using a given dataset, statistics (e.g. min/max, histogram, etc.) are +being collected for each layer’s output (and input, depends on the quantization configuration). +Thresholds are then being calculated using the collected statistics and the module is quantized +(both coefficients and activations by default). +If gptq_config is passed, the quantized weights are optimized using gradient based post +training quantization by comparing points between the float and quantized modules, and minimizing the +observed loss. +Then, the quantized weights are optimized using gradient based post +training quantization by comparing points between the float and quantized models, and minimizing the observed +loss.

    +
    +
    Parameters:
    +
      +
    • model (Module) – Pytorch model to quantize.

    • +
    • representative_data_gen (Callable) – Dataset used for calibration.

    • +
    • target_kpi (KPI) – KPI object to limit the search of the mixed-precision configuration as desired.

    • +
    • core_config (CoreConfig) – Configuration object containing parameters of how the model should be quantized, including mixed precision parameters.

    • +
    • gptq_config (GradientPTQConfig) – Configuration for using gptq (e.g. optimizer).

    • +
    • gptq_representative_data_gen (Callable) – Dataset used for GPTQ training. If None defaults to representative_data_gen

    • +
    • target_platform_capabilities (TargetPlatformCapabilities) – TargetPlatformCapabilities to optimize the PyTorch model according to.

    • +
    +
    +
    Returns:
    +

    A quantized module and information the user may need to handle the quantized module.

    +
    +
    +

    Examples

    +

    Import Model Compression Toolkit:

    +
    >>> import model_compression_toolkit as mct
    +
    +
    +

    Import a Pytorch module:

    +
    >>> from torchvision import models
    +>>> module = models.mobilenet_v2()
    +
    +
    +

    Create a random dataset generator, for required number of calibration iterations (num_calibration_batches): +In this example a random dataset of 10 batches each containing 4 images is used.

    +
    >>> import numpy as np
    +>>> num_calibration_batches = 10
    +>>> def repr_datagen():
    +>>>     for _ in range(num_calibration_batches):
    +>>>         yield [np.random.random((4, 3, 224, 224))]
    +
    +
    +

    Create MCT core configurations with number of calibration iterations set to 1:

    +
    >>> config = mct.core.CoreConfig()
    +
    +
    +

    Pass the module, the representative dataset generator and the configuration (optional) to get a quantized module

    +
    >>> quantized_module, quantization_info = mct.gptq.pytorch_gradient_post_training_quantization(module, repr_datagen, core_config=config, gptq_config=gptq_conf)
    +
    +
    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/pytorch_kpi_data_experimental.html b/docs/api/api_docs/methods/pytorch_kpi_data_experimental.html new file mode 100644 index 000000000..e1c6441d3 --- /dev/null +++ b/docs/api/api_docs/methods/pytorch_kpi_data_experimental.html @@ -0,0 +1,126 @@ + + + + + + + + + + Get KPI information for PyTorch Models — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Get KPI information for PyTorch Models

    +
    +
    +model_compression_toolkit.core.pytorch_kpi_data(in_model, representative_data_gen, core_config=CoreConfig(mixed_precision_config=MixedPrecisionQuantizationConfig()), fw_info=DEFAULT_PYTORCH_INFO, target_platform_capabilities=PYTORCH_DEFAULT_TPC)
    +

    Computes KPI data that can be used to calculate the desired target KPI for mixed-precision quantization. +Builds the computation graph from the given model and target platform capabilities, and uses it to compute the KPI data.

    +
    +
    Parameters:
    +
      +
    • in_model (Model) – PyTorch model to quantize.

    • +
    • representative_data_gen (Callable) – Dataset used for calibration.

    • +
    • core_config (CoreConfig) – CoreConfig containing parameters for quantization and mixed precision

    • +
    • fw_info (FrameworkInfo) – Information needed for quantization about the specific framework (e.g., kernel channels indices, groups of layers by how they should be quantized, etc.). Default PyTorch info

    • +
    • target_platform_capabilities (TargetPlatformCapabilities) – TargetPlatformCapabilities to optimize the PyTorch model according to.

    • +
    +
    +
    Returns:
    +

    A KPI object with total weights parameters sum and max activation tensor.

    +
    +
    +

    Examples

    +

    Import a Pytorch model:

    +
    >>> from torchvision import models
    +>>> module = models.mobilenet_v2()
    +
    +
    +

    Create a random dataset generator:

    +
    >>> import numpy as np
    +>>> def repr_datagen(): yield [np.random.random((1, 3, 224, 224))]
    +
    +
    +

    Import mct and call for KPI data calculation:

    +
    >>> import model_compression_toolkit as mct
    +>>> kpi_data = mct.core.pytorch_kpi_data(module, repr_datagen)
    +
    +
    +
    +
    Return type:
    +

    KPI

    +
    +
    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/pytorch_post_training_quantization_experimental.html b/docs/api/api_docs/methods/pytorch_post_training_quantization_experimental.html new file mode 100644 index 000000000..630598efb --- /dev/null +++ b/docs/api/api_docs/methods/pytorch_post_training_quantization_experimental.html @@ -0,0 +1,135 @@ + + + + + + + + + + Pytorch Post Training Quantization — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Pytorch Post Training Quantization

    +
    +
    +model_compression_toolkit.ptq.pytorch_post_training_quantization(in_module, representative_data_gen, target_kpi=None, core_config=CoreConfig(), target_platform_capabilities=DEFAULT_PYTORCH_TPC)
    +

Quantize a trained Pytorch module using post-training quantization. +By default, the module is quantized using symmetric constraint quantization thresholds +(power of two) as defined in the default TargetPlatformCapabilities. +The module is first optimized using several transformations (e.g. BatchNormalization folding to +preceding layers). Then, using a given dataset, statistics (e.g. min/max, histogram, etc.) are +being collected for each layer’s output (and input, depending on the quantization configuration). +Thresholds are then calculated using the collected statistics and the module is quantized +(both coefficients and activations by default). +If gptq_config is passed, the quantized weights are optimized using gradient based post +training quantization by comparing points between the float and quantized modules, and minimizing the +observed loss.

    +
    +
    Parameters:
    +
      +
    • in_module (Module) – Pytorch module to quantize.

    • +
    • representative_data_gen (Callable) – Dataset used for calibration.

    • +
    • target_kpi (KPI) – KPI object to limit the search of the mixed-precision configuration as desired.

    • +
    • core_config (CoreConfig) – Configuration object containing parameters of how the model should be quantized, including mixed precision parameters.

    • +
    • target_platform_capabilities (TargetPlatformCapabilities) – TargetPlatformCapabilities to optimize the PyTorch model according to.

    • +
    +
    +
    Returns:
    +

    A quantized module and information the user may need to handle the quantized module.

    +
    +
    +

    Examples

    +

    Import a Pytorch module:

    +
    >>> from torchvision import models
    +>>> module = models.mobilenet_v2()
    +
    +
    +

    Create a random dataset generator, for required number of calibration iterations (num_calibration_batches): +In this example a random dataset of 10 batches each containing 4 images is used.

    +
    >>> import numpy as np
    +>>> num_calibration_batches = 10
    +>>> def repr_datagen():
    +>>>     for _ in range(num_calibration_batches):
    +>>>         yield [np.random.random((4, 3, 224, 224))]
    +
    +
    +

Import MCT and pass the module with the representative dataset generator to get a quantized module. +Set the number of calibration iterations to 1:

    +
    >>> import model_compression_toolkit as mct
    +>>> quantized_module, quantization_info = mct.ptq.pytorch_post_training_quantization(module, repr_datagen)
    +
    +
    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/pytorch_pruning_experimental.html b/docs/api/api_docs/methods/pytorch_pruning_experimental.html new file mode 100644 index 000000000..d3efe563f --- /dev/null +++ b/docs/api/api_docs/methods/pytorch_pruning_experimental.html @@ -0,0 +1,158 @@ + + + + + + + + + + Pytorch Structured Pruning — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    Pytorch Structured Pruning

    +
    +
    +model_compression_toolkit.pruning.pytorch_pruning_experimental(model, target_kpi, representative_data_gen, pruning_config=PruningConfig(), target_platform_capabilities=DEFAULT_PYOTRCH_TPC)
    +

    Perform structured pruning on a Pytorch model to meet a specified target KPI. +This function prunes the provided model according to the target KPI by grouping and pruning +channels based on each layer’s SIMD configuration in the Target Platform Capabilities (TPC). +By default, the importance of each channel group is determined using the Label-Free Hessian +(LFH) method, assessing each channel’s sensitivity to the Hessian of the loss function. +This pruning strategy considers groups of channels together for a more hardware-friendly +architecture. The process involves analyzing the model with a representative dataset to +identify groups of channels that can be removed with minimal impact on performance.

    +

    Notice that the pruned model must be retrained to recover the compressed model’s performance.

    +
    +
    Parameters:
    +
      +
    • model (Module) – The PyTorch model to be pruned.

    • +
    • target_kpi (KPI) – Key Performance Indicators specifying the pruning targets.

    • +
    • representative_data_gen (Callable) – A function to generate representative data for pruning analysis.

    • +
    • pruning_config (PruningConfig) – Configuration settings for the pruning process. Defaults to standard config.

    • +
    • target_platform_capabilities (TargetPlatformCapabilities) – Platform-specific constraints and capabilities. +Defaults to DEFAULT_PYTORCH_TPC.

    • +
    +
    +
    Returns:
    +

    A tuple containing the pruned Pytorch model and associated pruning information.

    +
    +
    Return type:
    +

    Tuple[Model, PruningInfo]

    +
    +
    +
    +

    Note

    +

    The pruned model should be fine-tuned or retrained to recover or improve its performance post-pruning.

    +
    +

    Examples

    +

    Import MCT:

    +
    >>> import model_compression_toolkit as mct
    +
    +
    +

    Import a Pytorch model:

    +
    >>> from torchvision.models import resnet50, ResNet50_Weights
    +>>> model = resnet50(weights=ResNet50_Weights.IMAGENET1K_V1)
    +
    +
    +

    Create a random dataset generator:

    +
    >>> import numpy as np
    +>>> def repr_datagen(): yield [np.random.random((1, 3, 224, 224))]
    +
    +
    +

    Define a target KPI for pruning. +Here, we aim to reduce the memory footprint of weights by 50%, assuming the model weights +are represented in float32 data type (thus, each parameter is represented using 4 bytes):

    +
    >>> dense_nparams = sum(p.numel() for p in model.state_dict().values())
    +>>> target_kpi = mct.KPI(weights_memory=dense_nparams * 4 * 0.5)
    +
    +
    +

    Optionally, define a pruning configuration. num_score_approximations can be passed +to configure the number of importance scores that will be calculated for each channel. +A higher value for this parameter yields more precise score approximations but also +extends the duration of the pruning process:

    +
    >>> pruning_config = mct.pruning.PruningConfig(num_score_approximations=1)
    +
    +
    +

    Perform pruning:

    +
    >>> pruned_model, pruning_info = mct.pruning.pytorch_pruning_experimental(model=model, target_kpi=target_kpi, representative_data_gen=repr_datagen, pruning_config=pruning_config)
    +
    +
    +
    +
    Return type:
    +

    Tuple[Module, PruningInfo]

    +
    +
    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/pytorch_quantization_aware_training_finalize.html b/docs/api/api_docs/methods/pytorch_quantization_aware_training_finalize.html new file mode 100644 index 000000000..0dd0f11e3 --- /dev/null +++ b/docs/api/api_docs/methods/pytorch_quantization_aware_training_finalize.html @@ -0,0 +1,127 @@ + + + + + + + + + + PyTorch Quantization Aware Training Model Finalize — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    PyTorch Quantization Aware Training Model Finalize

    +
    +
    +model_compression_toolkit.qat.pytorch_quantization_aware_training_finalize_experimental(in_model)
    +

    Convert a model fine-tuned by the user to a network with QuantizeWrappers containing InferableQuantizers, which quantize both the layers’ weights and outputs.

    +
    +
    Parameters:
    +

    in_model (Model) – Pytorch model to remove QuantizeWrappers.

    +
    +
    Returns:
    +

    A quantized model with QuantizeWrappers and InferableQuantizers.

    +
    +
    +

    Examples

    +

    Import MCT:

    +
    >>> import model_compression_toolkit as mct
    +
    +
    +

    Import a Pytorch model:

    +
    >>> from torchvision.models import mobilenet_v2
    +>>> model = mobilenet_v2(pretrained=True)
    +
    +
    +

    Create a random dataset generator:

    +
    >>> import numpy as np
    +>>> def repr_datagen(): yield [np.random.random((1, 224, 224, 3))]
    +
    +
    +

    Create a MCT core config, containing the quantization configuration:

    +
    >>> config = mct.core.CoreConfig()
    +
    +
    +

    Pass the model, the representative dataset generator, the configuration and the target KPI to get a quantized model:

    +
    >>> quantized_model, quantization_info = mct.qat.pytorch_quantization_aware_training_init_experimental(model, repr_datagen, core_config=config)
    +
    +
    +

    Use the quantized model for fine-tuning. Finally, remove the quantizer wrappers and keep a quantized model ready for inference.

    +
    >>> quantized_model = mct.qat.pytorch_quantization_aware_training_finalize_experimental(quantized_model)
    +
    +
    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/pytorch_quantization_aware_training_init.html b/docs/api/api_docs/methods/pytorch_quantization_aware_training_init.html new file mode 100644 index 000000000..f915beca8 --- /dev/null +++ b/docs/api/api_docs/methods/pytorch_quantization_aware_training_init.html @@ -0,0 +1,152 @@ + + + + + + + + + + PyTorch Quantization Aware Training Model Init — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    PyTorch Quantization Aware Training Model Init

    +
    +
    +model_compression_toolkit.qat.pytorch_quantization_aware_training_init_experimental(in_model, representative_data_gen, target_kpi=None, core_config=CoreConfig(), qat_config=QATConfig(), fw_info=DEFAULT_PYTORCH_INFO, target_platform_capabilities=DEFAULT_PYTORCH_TPC)
    +

    Prepare a trained Pytorch model for quantization aware training. First the model quantization is optimized with post-training quantization, then the model layers are wrapped with QuantizeWrappers. The model is quantized using symmetric quantization thresholds (power of two). The model is first optimized using several transformations (e.g. BatchNormalization folding to preceding layers). Then, using a given dataset, statistics (e.g. min/max, histogram, etc.) are collected for each layer’s output (and input, depending on the quantization configuration). For each possible bit width (per layer) a threshold is then calculated using the collected statistics. Then, if a mixed-precision config is given in the core_config, an ILP solver is used to find a mixed-precision configuration and set a bit-width for each layer. The model is built with fake_quant nodes for quantizing activations. Weights are kept as float and are quantized online while training by the quantization wrapper’s weight quantizer. In order to limit the maximal model size, a target KPI needs to be passed with weights_memory set (in bytes).

    +
    +
    Parameters:
    +
      +
    • in_model (Model) – Pytorch model to quantize.

    • +
    • representative_data_gen (Callable) – Dataset used for initial calibration.

    • +
    • target_kpi (KPI) – KPI object to limit the search of the mixed-precision configuration as desired.

    • +
    • core_config (CoreConfig) – Configuration object containing parameters of how the model should be quantized, including mixed precision parameters.

    • +
    • qat_config (QATConfig) – QAT configuration

    • +
    • fw_info (FrameworkInfo) – Information needed for quantization about the specific framework (e.g., kernel channels indices, groups of layers by how they should be quantized, etc.). Default Pytorch info

    • +
    • target_platform_capabilities (TargetPlatformCapabilities) – TargetPlatformCapabilities to optimize the Pytorch model according to.

    • +
    +
    +
    Returns:
    +

    A quantized model. User information that may be needed to handle the quantized model.

    +
    +
    +

    Examples

    +

    Import MCT:

    +
    >>> import model_compression_toolkit as mct
    +
    +
    +

    Import a Pytorch model:

    +
    >>> from torchvision.models import mobilenet_v2
    +>>> model = mobilenet_v2(pretrained=True)
    +
    +
    +
    +

    Create a random dataset generator for the required number of calibration iterations (num_calibration_batches). In this example, a random dataset of 10 batches, each containing 4 images, is used:

    +
    >>> import numpy as np
    +>>> num_calibration_batches = 10
    +>>> def repr_datagen():
    +>>>     for _ in range(num_calibration_batches):
    +>>>         yield [np.random.random((4, 3, 224, 224))]
    +
    +
    +
    +

    Create a MCT core config, containing the quantization configuration:

    +
    >>> config = mct.core.CoreConfig()
    +
    +
    +

    Pass the model, the representative dataset generator, the configuration and the target KPI to get a quantized model. Now the model contains quantizer wrappers for fine-tuning the weights:

    +
    >>> quantized_model, quantization_info = mct.qat.pytorch_quantization_aware_training_init_experimental(model, repr_datagen, core_config=config)
    +
    +
    +

    For more configuration options, please take a look at our API documentation.

    +
    +
    +
    + +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/methods/set_logger_path.html b/docs/api/api_docs/methods/set_logger_path.html index af9c88cb0..8f6d40611 100644 --- a/docs/api/api_docs/methods/set_logger_path.html +++ b/docs/api/api_docs/methods/set_logger_path.html @@ -2,12 +2,12 @@ - + - + - Enable a Logger — MCT Documentation: ver 1.4.0 + Enable a Logger — MCT Documentation: ver 1.11.0 @@ -15,6 +15,7 @@ + @@ -30,7 +31,7 @@

    Navigation

  • index
  • - + @@ -41,16 +42,16 @@

    Navigation

    -

    Enable a Logger

    +

    Enable a Logger

    model_compression_toolkit.set_log_folder(folder, level=logging.INFO)

    Set a directory path for saving a log file.

    -
    Parameters
    +
    Parameters:
      -
    • folder (str) – Folder path to save the log file.

    • -
    • level (int) – Level of verbosity to set to the logger.

    • +
    • folder – Folder path to save the log file.

    • +
    • level – Level of verbosity to set to the logger.
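    For example, a minimal sketch (the folder path is illustrative):

    >>> import logging
    >>> import model_compression_toolkit as mct
    >>> mct.set_log_folder('./mct_logs', level=logging.INFO)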

    @@ -74,7 +75,7 @@

    Quick search

    - +
    @@ -85,13 +86,13 @@

    Navigation

  • index
  • - + \ No newline at end of file diff --git a/docs/api/api_docs/modules/core_config.html b/docs/api/api_docs/modules/core_config.html new file mode 100644 index 000000000..37ef02de7 --- /dev/null +++ b/docs/api/api_docs/modules/core_config.html @@ -0,0 +1,113 @@ + + + + + + + + + + core_config Module — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    core_config Module

    +
    +

    CoreConfig

    +

    Class to configure the optimization process of the model:

    +
    +
    +class model_compression_toolkit.core.CoreConfig(quantization_config=QuantizationConfig(), mixed_precision_config=None, debug_config=DebugConfig())
    +

    A class that holds the configuration classes of the MCT core.
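    For example, a minimal sketch of building a CoreConfig (the sub-configuration values shown are illustrative):

    >>> import model_compression_toolkit as mct
    >>> core_config = mct.core.CoreConfig(quantization_config=mct.core.QuantizationConfig(),
    >>>                                   mixed_precision_config=mct.core.MixedPrecisionQuantizationConfig(),
    >>>                                   debug_config=mct.core.DebugConfig())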

    +
    +
    Parameters:
    +
    +
    +
    +
    + +
    +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/modules/debug_config.html b/docs/api/api_docs/modules/debug_config.html new file mode 100644 index 000000000..40bfbdcc9 --- /dev/null +++ b/docs/api/api_docs/modules/debug_config.html @@ -0,0 +1,113 @@ + + + + + + + + + + debug_config Module — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    debug_config Module

    +
    +

    DebugConfig

    +

    Class to configure parameters for debugging purposes:

    +
    +
    +class model_compression_toolkit.core.DebugConfig(analyze_similarity=False, network_editor=[])
    +

    A class for MCT core debug information.

    +
    +
    Parameters:
    +
      +
    • analyze_similarity (bool) – Whether to plot similarity figures within TensorBoard (when logger is enabled) or not. Can be used to pinpoint problematic layers in the quantization process.

    • +
    • network_editor (List[EditRule]) – A list of rules and actions to edit the network for quantization.
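    For example, a minimal sketch of enabling similarity analysis for debugging (the flag values are illustrative):

    >>> import model_compression_toolkit as mct
    >>> debug_config = mct.core.DebugConfig(analyze_similarity=True)
    >>> core_config = mct.core.CoreConfig(debug_config=debug_config)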

    • +
    +
    +
    +
    + +
    +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/modules/exporter.html b/docs/api/api_docs/modules/exporter.html new file mode 100644 index 000000000..f7f1c37d5 --- /dev/null +++ b/docs/api/api_docs/modules/exporter.html @@ -0,0 +1,455 @@ + + + + + + + + + + exporter Module — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    exporter Module

    +

    Allows exporting a quantized model in different serialization formats and quantization formats. For more details about the export formats and options, please refer to the project’s GitHub README file. If you have any questions or issues, please open an issue in this GitHub repository.

    +
    +

    QuantizationFormat

    +
    +
    +class model_compression_toolkit.exporter.QuantizationFormat(value)
    +

    Specify which quantization format to use for exporting a quantized model.

    +

    FAKELY_QUANT - Weights and activations are quantized but represented using float data type.

    +

    INT8 - Weights and activations are represented using 8-bit integer data type.

    +

    MCTQ - Weights and activations are quantized using mct_quantizers custom quantizers.

    +
    + +
    +
    +

    KerasExportSerializationFormat

    +

    Select the serialization format for exporting a quantized Keras model.

    +
    +
    +class model_compression_toolkit.exporter.KerasExportSerializationFormat(value)
    +

    Specify which serialization format to use for exporting a quantized Keras model.

    +

    KERAS - .keras file format

    +

    TFLITE - .tflite file format

    +
    + +
    +
    +

    keras_export_model

    +

    Allows exporting a Keras model that was quantized via MCT.

    +
    +
    +class model_compression_toolkit.exporter.keras_export_model(model, save_model_path, is_layer_exportable_fn=is_keras_layer_exportable, serialization_format=KerasExportSerializationFormat.KERAS, quantization_format=QuantizationFormat.MCTQ)
    +

    Export a Keras quantized model to an h5 or tflite model. The model will be saved to the path in save_model_path. keras_export_model supports the combination of QuantizationFormat.FAKELY_QUANT (where weights and activations are float fakely-quantized values) and KerasExportSerializationFormat.KERAS_H5 (where the model will be saved to an h5 model), or the combination of KerasExportSerializationFormat.TFLITE (where the model will be saved to a tflite model) with QuantizationFormat.FAKELY_QUANT or QuantizationFormat.INT8 (where weights and activations are represented using 8-bit integers).

    +
    +
    Parameters:
    +
      +
    • model – Model to export.

    • +
    • save_model_path – Path to save the model.

    • +
    • is_layer_exportable_fn – Callable to check whether a layer can be exported or not.

    • +
    • serialization_format – Format to export the model according to (by default KerasExportSerializationFormat.KERAS_H5).

    • +
    • quantization_format – Format of how quantizers are exported (fakely-quant, int8, MCTQ quantizers).

    • +
    +
    +
    Returns:
    +

    Custom objects dictionary needed to load the model.

    +
    +
    Return type:
    +

    Dict[str, type]

    +
    +
    +
    + +
    +
    +

    Keras Tutorial

    +

    To export a TensorFlow model as a quantized model, it is necessary to first apply quantization to the model using MCT:

    +
    ! pip install -q mct-nightly
    +
    +
    +
    import numpy as np
    +from keras.applications import ResNet50
    +import model_compression_toolkit as mct
    +
    +# Create a model
    +float_model = ResNet50()
    +# Quantize the model.
    +# Notice that here the representative dataset is random for demonstration only.
    +quantized_exportable_model, _ = mct.ptq.keras_post_training_quantization(float_model,
    +                                                                         representative_data_gen=lambda: [np.random.random((1, 224, 224, 3))])
    +
    +
    +
    +

    keras serialization format

    +

    The model will be exported as a TensorFlow .keras model where weights and activations are quantized but represented using a float32 dtype. Two optional quantization formats are available: MCTQ and FAKELY_QUANT.

    +
    +
    +

    MCTQ

    +

    By default, mct.exporter.keras_export_model will export the quantized Keras model to a .keras model with custom quantizers from the mct_quantizers module.

    +
    import tempfile
    +
    +# Path of exported model
    +_, keras_file_path = tempfile.mkstemp('.keras')
    +
    +# Export a keras model with mctq custom quantizers.
    +mct.exporter.keras_export_model(model=quantized_exportable_model,
    +                                save_model_path=keras_file_path)
    +
    +
    +

    Notice that the model has the same size as the quantized exportable model as weights data types are float.

    +
    +
    +

    Fakely-Quantized in Keras

    +
    # Path of exported model
    +_, keras_file_path = tempfile.mkstemp('.keras')
    +
    +# Use mode KerasExportSerializationFormat.KERAS for a .keras model
    +# and QuantizationFormat.FAKELY_QUANT for fakely-quantized weights
    +# and activations.
    +mct.exporter.keras_export_model(model=quantized_exportable_model,
    +                                save_model_path=keras_file_path,
    +                                quantization_format=mct.exporter.QuantizationFormat.FAKELY_QUANT)
    +
    +
    +

    Notice that the fakely-quantized model has the same size as the quantized exportable model as weights data types are float.

    +
    +
    +

    TFLite

    +

    The tflite serialization format exports in two quantization formats: INT8 and FAKELY_QUANT.

    +
    +
    +

    INT8 TFLite

    +

    The model will be exported as a tflite model where weights and activations are represented as 8-bit integers.

    +
    import tempfile
    +
    +# Path of exported model
    +_, tflite_file_path = tempfile.mkstemp('.tflite')
    +
    +# Use mode KerasExportSerializationFormat.TFLITE for a tflite model and QuantizationFormat.INT8.
    +mct.exporter.keras_export_model(model=quantized_exportable_model,
    +                                save_model_path=tflite_file_path,
    +                                serialization_format=mct.exporter.KerasExportSerializationFormat.TFLITE,
    +                                quantization_format=mct.exporter.QuantizationFormat.INT8)
    +
    +
    +

    Compare size of float and quantized model:

    +
    import os
    +
    +# Save float model to measure its size
    +_, float_file_path = tempfile.mkstemp('.keras')
    +float_model.save(float_file_path)
    +
    +print("Float model in Mb:", os.path.getsize(float_file_path) / float(2 ** 20))
    +print("Quantized model in Mb:", os.path.getsize(tflite_file_path) / float(2 ** 20))
    +print(f'Compression ratio: {os.path.getsize(float_file_path) / os.path.getsize(tflite_file_path)}')
    +
    +
    +
    +
    +

    Fakely-Quantized TFLite

    +

    The model will be exported as a tflite model where weights and activations are quantized but represented with a float data type.

    +
    +
    +

    Usage Example

    +
    # Path of exported model
    +_, tflite_file_path = tempfile.mkstemp('.tflite')
    +
    +# Use mode KerasExportSerializationFormat.TFLITE for tflite model and QuantizationFormat.FAKELY_QUANT for fakely-quantized weights
    +# and activations.
    +mct.exporter.keras_export_model(model=quantized_exportable_model,
    +                                save_model_path=tflite_file_path,
    +                                serialization_format=mct.exporter.KerasExportSerializationFormat.TFLITE,
    +                                quantization_format=mct.exporter.QuantizationFormat.FAKELY_QUANT)
    +
    +
    +

    Notice that the fakely-quantized model has the same size as the quantized exportable model as weights data types are float.

    +
    +
    +
    +

    PytorchExportSerializationFormat

    +

    Select the serialization format for exporting a quantized Pytorch model.

    +
    +
    +class model_compression_toolkit.exporter.PytorchExportSerializationFormat(value)
    +

    Specify which serialization format to use for exporting a quantized Pytorch model.

    +

    TORCHSCRIPT - torchscript format

    +

    ONNX - onnx format

    +
    + +
    +
    +

    pytorch_export_model

    +

    Allows exporting a Pytorch model that was quantized via MCT.

    +
    +
    +class model_compression_toolkit.exporter.pytorch_export_model(model, save_model_path, repr_dataset, is_layer_exportable_fn=is_pytorch_layer_exportable, serialization_format=PytorchExportSerializationFormat.ONNX, quantization_format=QuantizationFormat.MCTQ, onnx_opset_version=DEFAULT_ONNX_OPSET_VERSION)
    +

    Export a PyTorch quantized model to a torchscript or onnx model. The model will be saved to the path in save_model_path. Currently, pytorch_export_model supports only QuantizationFormat.FAKELY_QUANT (where weights and activations are float fakely-quantized values) and PytorchExportSerializationFormat.TORCHSCRIPT (where the model will be saved to a TorchScript model) or PytorchExportSerializationFormat.ONNX (where the model will be saved to an ONNX model).

    +
    +
    Parameters:
    +
      +
    • model – Model to export.

    • +
    • save_model_path – Path to save the model.

    • +
    • repr_dataset – Representative dataset for tracing the pytorch model (mandatory for exporting it).

    • +
    • is_layer_exportable_fn – Callable to check whether a layer can be exported or not.

    • +
    • serialization_format – Format to export the model according to (by default PytorchExportSerializationFormat.ONNX).

    • +
    • quantization_format – Format of how quantizers are exported (fakely-quant, int8, MCTQ quantizers).

    • +
    • onnx_opset_version – ONNX opset version to use for exported ONNX model.

    • +
    +
    +
    Return type:
    +

    None

    +
    +
    +
    + +
    +
    +

    Pytorch Tutorial

    +

    To export a Pytorch model as a quantized model, it is necessary to first apply quantization to the model using MCT:

    +
    ! pip install -q mct-nightly
    +
    +
    +

    In order to export your quantized model to ONNX format and use it for inference, some additional packages are needed. Notice that this is needed only for models exported to ONNX format, so this part can be skipped if that is not planned:

    +
    ! pip install -q onnx onnxruntime onnxruntime-extensions
    +
    +
    +

    Now, let’s start the export demonstration by quantizing the model using MCT:

    +
    import model_compression_toolkit as mct
    +import numpy as np
    +import torch
    +from torchvision.models.mobilenetv2 import mobilenet_v2
    +
    +# Create a model
    +float_model = mobilenet_v2()
    +
    +
    +# Notice that here the representative dataset is random for demonstration only.
    +def representative_data_gen():
    +    yield [np.random.random((1, 3, 224, 224))]
    +
    +
    +quantized_exportable_model, _ = mct.ptq.pytorch_post_training_quantization(float_model, representative_data_gen=representative_data_gen)
    +
    +
    +
    +

    ONNX

    +

    The model will be exported in ONNX format where weights and activations are represented as float. Notice that onnx should be installed in order to export the model to ONNX.

    +

    There are two optional formats to choose: MCTQ or FAKELY_QUANT.

    +
    +
    +

    MCTQ Quantization Format

    +

    By default, mct.exporter.pytorch_export_model will export the quantized pytorch model to an ONNX model with custom quantizers from the mct_quantizers module.

    +
    # Path of exported model
    +onnx_file_path = 'model_format_onnx_mctq.onnx'
    +
    +# Export ONNX model with mctq quantizers.
    +mct.exporter.pytorch_export_model(model=quantized_exportable_model,
    +                                  save_model_path=onnx_file_path,
    +                                  repr_dataset=representative_data_gen)
    +
    +
    +

    Notice that the model has the same size as the quantized exportable model as weights data types are float.

    +
    +
    +

    ONNX opset version

    +

    By default, the ONNX opset version used is 15, but this can be changed using onnx_opset_version:

    +
    # Export ONNX model with mctq quantizers.
    +mct.exporter.pytorch_export_model(model=quantized_exportable_model,
    +                                  save_model_path=onnx_file_path,
    +                                  repr_dataset=representative_data_gen,
    +                                  onnx_opset_version=16)
    +
    +
    +
    +

    +
    +
    +
    +

    Use exported model for inference

    +

    To load and run inference with the exported model, which was exported to an ONNX file in MCTQ format, we will use the mct_quantizers method get_ort_session_options during onnxruntime session creation. Notice that inference on models exported in this format is slower and suffers from longer latency. However, inference of these models on IMX500 will not suffer from this issue.

    +
    import mct_quantizers as mctq
    +import onnxruntime as ort
    +
    +sess = ort.InferenceSession(onnx_file_path,
    +                            mctq.get_ort_session_options(),
    +                            providers=['CUDAExecutionProvider', 'CPUExecutionProvider'])
    +
    +_input_data = next(representative_data_gen())[0].astype(np.float32)
    +_model_output_name = sess.get_outputs()[0].name
    +_model_input_name = sess.get_inputs()[0].name
    +
    +# Run inference
    +predictions = sess.run([_model_output_name], {_model_input_name: _input_data})
    +
    +
    +
    +

    +
    +
    +
    +

    Fakely-Quantized in Pytorch

    +

    To export a fakely-quantized model, use QuantizationFormat.FAKELY_QUANT:

    +
    import tempfile
    +
    +# Path of exported model
    +_, onnx_file_path = tempfile.mkstemp('.onnx')
    +
    +# Use QuantizationFormat.FAKELY_QUANT for fakely-quantized weights and activations.
    +mct.exporter.pytorch_export_model(model=quantized_exportable_model,
    +                                  save_model_path=onnx_file_path,
    +                                  repr_dataset=representative_data_gen,
    +                                  quantization_format=mct.exporter.QuantizationFormat.FAKELY_QUANT)
    +
    +
    +

    Notice that the fakely-quantized model has the same size as the quantized exportable model as weights data types are float.

    +
    +
    +

    TorchScript

    +

    The model will be exported in TorchScript format where weights and activations are quantized but represented as float (fakely quant).

    +
    # Path of exported model
    +_, torchscript_file_path = tempfile.mkstemp('.pt')
    +
    +
    +# Use mode PytorchExportSerializationFormat.TORCHSCRIPT for a torchscript model
    +# and QuantizationFormat.FAKELY_QUANT for fakely-quantized weights and activations.
    +mct.exporter.pytorch_export_model(model=quantized_exportable_model,
    +                                  save_model_path=torchscript_file_path,
    +                                  repr_dataset=representative_data_gen,
    +                                  serialization_format=mct.exporter.PytorchExportSerializationFormat.TORCHSCRIPT,
    +                                  quantization_format=mct.exporter.QuantizationFormat.FAKELY_QUANT)
    +
    +
    +

    Notice that the fakely-quantized model has the same size as the quantized exportable model as weights data types are float.

    +
    +
    +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/modules/layer_filters.html b/docs/api/api_docs/modules/layer_filters.html index 704e6be88..3a94b765c 100644 --- a/docs/api/api_docs/modules/layer_filters.html +++ b/docs/api/api_docs/modules/layer_filters.html @@ -2,12 +2,12 @@ - + - + - Layer Attributes Filters — MCT Documentation: ver 1.4.0 + Layer Attributes Filters — MCT Documentation: ver 1.11.0 @@ -15,6 +15,7 @@ + @@ -30,7 +31,7 @@

    Navigation

  • index
  • - + @@ -41,17 +42,17 @@

    Navigation

    -

    Layer Attributes Filters

    +

    Layer Attributes Filters

    In order to create LayerFilterParams, which is needed to filter layers by their attributes, one may use the following filters to check whether a layer configuration matches the created LayerFilterParams:
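    For example, a minimal sketch, assuming Eq and LayerFilterParams are accessible through mct.target_platform as documented on this page (the layer and attribute values are illustrative):

    >>> import model_compression_toolkit as mct
    >>> from tensorflow.keras.layers import ReLU
    >>> # Match ReLU layers whose 'negative_slope' attribute equals 0.0
    >>> relu_filter = mct.target_platform.LayerFilterParams(ReLU, mct.target_platform.Eq('negative_slope', 0.0))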

    -

    Attribute Filters

    +

    Attribute Filters

    class model_compression_toolkit.target_platform.Eq(attr, value)

    Filter configurations such that it matches configurations that have an attribute with a value that equals the value that Eq holds.

    -
    Parameters
    +
    Parameters:
    - +
    @@ -193,13 +194,13 @@

    Navigation

  • index
  • - + \ No newline at end of file diff --git a/docs/api/api_docs/modules/mixed_precision_quantization_config.html b/docs/api/api_docs/modules/mixed_precision_quantization_config.html index 74980341c..e37d5079e 100644 --- a/docs/api/api_docs/modules/mixed_precision_quantization_config.html +++ b/docs/api/api_docs/modules/mixed_precision_quantization_config.html @@ -42,13 +42,13 @@

    Navigation

    -

    mixed_precision_quantization_config Module

    +

    mixed_precision_quantization_config Module

    KPI

    Object to configure resources to use when searching for a mixed-precision configuration for a model:

    -
    -class model_compression_toolkit.KPI(weights_memory=np.inf, activation_memory=np.inf, total_memory=np.inf, bops=np.inf)
    +
    +class model_compression_toolkit.core.KPI(weights_memory=np.inf, activation_memory=np.inf, total_memory=np.inf, bops=np.inf)

    Class to represent measurements of performance.

    Parameters:
    @@ -66,24 +66,25 @@

    KPI

    -
    -

    MixedPrecisionQuantizationConfig

    +
    +

    MixedPrecisionQuantizationConfigV2

    Class to configure the quantization process of the model when quantizing in mixed-precision:

    -
    -class model_compression_toolkit.MixedPrecisionQuantizationConfig(qc=DEFAULTCONFIG, compute_distance_fn=compute_mse, distance_weighting_method=get_average_weights, num_of_images=32, configuration_overwrite=None, num_interest_points_factor=1.0)
    -

    Class to wrap all different parameters the library quantize the input model according to. -Unlike QuantizationConfig, number of bits for quantization is a list of possible bit widths to -support mixed-precision model quantization.

    +
    +class model_compression_toolkit.core.MixedPrecisionQuantizationConfig(compute_distance_fn=None, distance_weighting_method=get_average_weights, num_of_images=32, configuration_overwrite=None, num_interest_points_factor=1.0, use_hessian_based_scores=True, norm_scores=True, refine_mp_solution=True, metric_normalization_threshold=1e10)
    +

    Class with mixed precision parameters to quantize the input model.

    Parameters:
      -
    • qc (QuantizationConfig) – QuantizationConfig object containing parameters of how the model should be quantized.

    • compute_distance_fn (Callable) – Function to compute a distance between two tensors.

    • distance_weighting_method (Callable) – Function to use when weighting the distances among different layers when computing the sensitivity metric.

    • num_of_images (int) – Number of images to use to evaluate the sensitivity of a mixed-precision model comparing to the float model.

    • configuration_overwrite (List[int]) – A list of integers that enables overwrite of mixed precision with a predefined one.

    • -
    • num_interest_points_factor – A multiplication factor between zero and one (represents percentage) to reduce the number of interest points used to calculate the distance metric.

    • +
    • num_interest_points_factor (float) – A multiplication factor between zero and one (represents percentage) to reduce the number of interest points used to calculate the distance metric.

    • +
    • use_hessian_based_scores (bool) – Whether to use Hessian-based scores for weighted average distance metric computation.

    • +
    • norm_scores (bool) – Whether to normalize the returned scores for the weighted distance metric (to get values between 0 and 1).

    • +
    • refine_mp_solution (bool) – Whether to try to improve the final mixed-precision configuration using a greedy algorithm that searches layers to increase their bit-width, or not.

    • +
    • metric_normalization_threshold (float) – A threshold for checking the mixed precision distance metric values. In case of values larger than this threshold, the metric will be scaled to prevent numerical issues.
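    For example, a minimal sketch of a mixed-precision setup (the number of images and the memory budget are illustrative):

    >>> import model_compression_toolkit as mct
    >>> mp_config = mct.core.MixedPrecisionQuantizationConfig(num_of_images=16)
    >>> core_config = mct.core.CoreConfig(mixed_precision_config=mp_config)
    >>> # A KPI can then bound the weights memory (in bytes) for the mixed-precision search
    >>> target_kpi = mct.core.KPI(weights_memory=10 * (2 ** 20))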

    @@ -104,7 +105,7 @@

    Table of Contents

    diff --git a/docs/api/api_docs/modules/network_editor.html b/docs/api/api_docs/modules/network_editor.html index 2b01b1349..f34dfba5f 100644 --- a/docs/api/api_docs/modules/network_editor.html +++ b/docs/api/api_docs/modules/network_editor.html @@ -2,12 +2,12 @@ - + - + - network_editor Module — MCT Documentation: ver 1.4.0 + network_editor Module — MCT Documentation: ver 1.11.0 @@ -15,6 +15,7 @@ + @@ -30,7 +31,7 @@

    Navigation

  • index
  • - + @@ -41,38 +42,38 @@

    Navigation

    -

    network_editor Module

    +

    network_editor Module

    The model can be edited by a list of EditRules to apply on nodes in a graph that represents the model during the model quantization. Each EditRule is a tuple of a filter and an action, where the action is applied to each node that the filter matches.

    -

    EditRule

    +

    EditRule

    -
    -class model_compression_toolkit.network_editor.EditRule(filter, action)
    +
    +class model_compression_toolkit.core.network_editor.EditRule(filter, action)

    A tuple of a node filter and an action. The filter matches nodes in the graph which represents the model, and the action is applied on these nodes during the quantization process.

    Examples

    -

    Create an EditRule to quantize all Conv2D wights using 9 bits:

    +

    Create an EditRule to quantize all Conv2D kernel attribute weights using 9 bits:

    >>> import model_compression_toolkit as mct
    +>>> from model_compression_toolkit.core.keras.constants import KERNEL
     >>> from tensorflow.keras.layers import Conv2D
    ->>> er_list = [EditRule(filter=mct.network_editor.NodeTypeFilter(Conv2D),
    ->>> action=mct.network_editor.ChangeCandidatesWeightsQuantConfigAttr(weights_n_bits=9))]
    +>>> er_list = [mct.network_editor.EditRule(filter=mct.network_editor.NodeTypeFilter(Conv2D), action=mct.network_editor.ChangeCandidatesWeightsQuantConfigAttr(attr_name=KERNEL, weights_n_bits=9))]
     
    -

    Then the rules list can be passed to keras_post_training_quantization() +

    Then the rules list can be passed to keras_post_training_quantization() to modify the network during the quantization process.

    Create new instance of EditRule(filter, action)

    -

    Filters

    +

    Filters

    -
    -class model_compression_toolkit.network_editor.NodeTypeFilter(node_type)
    +
    +class model_compression_toolkit.core.network_editor.NodeTypeFilter(node_type)

    Class NodeTypeFilter to check if a node is of a specific type.

    Init a NodeTypeFilter object.

    -
    Parameters
    +
    Parameters:

    node_type – Node type to check.

    @@ -82,12 +83,12 @@

    Filters

    -
    -class model_compression_toolkit.network_editor.NodeNameFilter(node_name)
    +
    +class model_compression_toolkit.core.network_editor.NodeNameFilter(node_name)

    Class NodeNameFilter to check if a node’s name has a specific value.

    Init a NodeNameFilter object.

    -
    Parameters
    +
    Parameters:

    node_name – Node name to check.

    @@ -97,12 +98,12 @@

    Filters
    -
    -class model_compression_toolkit.network_editor.NodeNameScopeFilter(node_name_scope)
    +
    +class model_compression_toolkit.core.network_editor.NodeNameScopeFilter(node_name_scope)

    Class NodeNameScopeFilter to check if a string is in a node’s name.

    Init a NodeNameScopeFilter object.

    -
    Parameters
    +
    Parameters:

    node_name_scope – String to check if exists in node name.

    @@ -110,14 +111,17 @@

    Filters -

    Actions

    +

    Actions

    -
    -class model_compression_toolkit.network_editor.ChangeFinalWeightsQuantConfigAttr(**kwargs)
    +
    +class model_compression_toolkit.core.network_editor.ChangeFinalWeightsQuantConfigAttr(attr_name=None, **kwargs)

    Change attributes in a layer’s final weights quantization config.

    -
    Parameters
    -

    kwargs – Dictionary of attr_name and attr_value to change layer’s final weights quantization config.

    +
    Parameters:
    +
      +
    • attr_name – The weights attribute’s name to set the weights quantization params function for.

    • +
    • kwargs – Dictionary of attr_name and attr_value to change layer’s final weights quantization config.

    • +
    @@ -126,12 +130,15 @@

    Actions
    -
    -class model_compression_toolkit.network_editor.ChangeCandidatesWeightsQuantConfigAttr(**kwargs)
    +
    +class model_compression_toolkit.core.network_editor.ChangeCandidatesWeightsQuantConfigAttr(attr_name=None, **kwargs)

    Change attributes in a layer’s weights quantization configuration candidates.

    -
    Parameters
    -

    kwargs – Dictionary of attr_name and attr_value to change layer’s weights quantization configuration candidates.

    +
    Parameters:
    +
      +
    • attr_name – The weights attribute’s name to set the weights quantization params function for.

    • +
    • kwargs – Dictionary of attr_name and attr_value to change layer’s weights quantization configuration candidates.

    • +
    @@ -140,11 +147,11 @@

    Actions
    -
    -class model_compression_toolkit.network_editor.ChangeFinalActivationQuantConfigAttr(**kwargs)
    +
    +class model_compression_toolkit.core.network_editor.ChangeFinalActivationQuantConfigAttr(**kwargs)

    Change attributes in a layer’s final activation quantization config.

    -
    Parameters
    +
    Parameters:

    kwargs – Dictionary of attr_name and attr_value to change layer’s final activation quantization config.

    @@ -154,11 +161,11 @@

    Actions
    -
    -class model_compression_toolkit.network_editor.ChangeCandidatesActivationQuantConfigAttr(**kwargs)
    +
    +class model_compression_toolkit.core.network_editor.ChangeCandidatesActivationQuantConfigAttr(**kwargs)

    Change attributes in a layer’s activation quantization configuration candidates.

    -
    Parameters
    +
    Parameters:

    kwargs – Dictionary of attr_name and attr_value to change in the layer’s activation quantization configuration candidates.

    @@ -168,13 +175,14 @@

    Actions
    -
    -class model_compression_toolkit.network_editor.ChangeQuantizationParamFunction(activation_quantization_params_fn=None, weights_quantization_params_fn=None)
    +
    +class model_compression_toolkit.core.network_editor.ChangeQuantizationParamFunction(attr_name=None, activation_quantization_params_fn=None, weights_quantization_params_fn=None)

    Class ChangeQuantizationParamFunction to change a node’s weights/activations quantization params function.

    Init a ChangeQuantizationParamFunction object.

    -
    Parameters
    +
    Parameters:
      +
    • attr_name – The weights attribute’s name to set the weights quantization params function for (if setting weights params).

    • activation_quantization_params_fn – a params function for a node’s activations.

    • weights_quantization_params_fn – a params function for a node’s weights.

    @@ -186,13 +194,16 @@

    Actions
    -
    -class model_compression_toolkit.network_editor.ChangeFinalWeightsQuantizationMethod(weights_quantization_method=None)
    +
    +class model_compression_toolkit.core.network_editor.ChangeFinalWeightsQuantizationMethod(attr_name, weights_quantization_method=None)

    Class ChangeFinalWeightsQuantizationMethod to change a node’s weights/activations quantizer function.

    Init a ChangeFinalWeightsQuantizationMethod object.

    -
    Parameters
    -

    weights_quantization_method – a quantization method for a node’s weights.

    +
    Parameters:
    +
      +
    • attr_name – The weights attribute’s name to set the weights quantization method for.

    • +
    • weights_quantization_method – a quantization method for a node’s weights.

    • +
    @@ -201,13 +212,16 @@

    Actions
    -
    -class model_compression_toolkit.network_editor.ChangeCandidatesWeightsQuantizationMethod(weights_quantization_method=None)
    +
    +class model_compression_toolkit.core.network_editor.ChangeCandidatesWeightsQuantizationMethod(attr_name, weights_quantization_method=None)

    Class ChangeCandidatesWeightsQuantizationMethod to change a node’s weights quantizer function.

    Init a ChangeCandidatesWeightsQuantizationMethod object.

    -
    Parameters
    -

    weights_quantization_method – a quantization method for a node’s weights.

    +
    Parameters:
    +
      +
    • weights_quantization_method – a quantization method for a node’s weights.

    • +
    • attr_name – The weights attribute’s name to set the weights quantization params function for.

    • +
    @@ -216,12 +230,12 @@

    Actions
    -
    -class model_compression_toolkit.network_editor.ChangeCandidatesActivationQuantizationMethod(activation_quantization_method=None)
    +
    +class model_compression_toolkit.core.network_editor.ChangeCandidatesActivationQuantizationMethod(activation_quantization_method=None)

    Class ChangeQuantizationMethod to change a node’s activations quantizer function.

    Init a ChangeCandidatesActivationQuantizationMethod object.

    -
    Parameters
    +
    Parameters:

    activation_quantization_method – a quantization method for a node’s activations.

    @@ -258,7 +272,7 @@

    Quick search

    - +
    @@ -269,13 +283,13 @@

    Navigation

  • index
  • - + \ No newline at end of file diff --git a/docs/api/api_docs/modules/qat_config.html b/docs/api/api_docs/modules/qat_config.html new file mode 100644 index 000000000..e062c191c --- /dev/null +++ b/docs/api/api_docs/modules/qat_config.html @@ -0,0 +1,131 @@ + + + + + + + + + + qat_config Module — MCT Documentation: ver 1.11.0 + + + + + + + + + + + + + + + + + +
    +
    +
    +
    + +
    +

    qat_config Module

    +
    +

    TrainingMethod

    +

    Select a QAT training method:

    +
    +
    +class model_compression_toolkit.qat.TrainingMethod(value)
    +

    An enum for selecting a QAT training method

    +

    STE - Standard straight-through estimator. Includes PowerOfTwo, symmetric & uniform quantizers

    +

    DQA - DNN Quantization with Attention. Includes a smooth quantization introduced by the DQA method

    +

    LSQ - Learned Step size Quantization. Includes PowerOfTwo, symmetric & uniform quantizers: https://arxiv.org/pdf/1902.08153.pdf

    +
    + +
    +

    +
    +
    +
    +

    QATConfig

    +

    Class to configure the quantization process of the model when quantizing using Quantization-aware Training (QAT):

    +
    +
    +class model_compression_toolkit.qat.QATConfig(weight_training_method=TrainingMethod.STE, activation_training_method=TrainingMethod.STE, weight_quantizer_params_override=None, activation_quantizer_params_override=None)
    +

    QAT configuration class.

    +
    +
    Parameters:
    +
      +
    • weight_training_method (TrainingMethod) – Training method for weight quantizers

    • +
    • activation_training_method (TrainingMethod) – Training method for activation quantizers:

    • +
    • weight_quantizer_params_override – A dictionary of parameters to override in weight quantization quantizer instantiation. Defaults to None (no parameters)

    • +
    • activation_quantizer_params_override – A dictionary of parameters to override in activation quantization quantizer instantiation. Defaults to None (no parameters)
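    For example, a minimal sketch of a QAT configuration; the training methods shown are the documented defaults, passed explicitly for illustration:

    >>> import model_compression_toolkit as mct
    >>> qat_config = mct.qat.QATConfig(weight_training_method=mct.qat.TrainingMethod.STE,
    >>>                                activation_training_method=mct.qat.TrainingMethod.STE)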

    • +
    +
    +
    +
    + +
    +
    + + +
    +
    +
    +
    + +
    +
    + + + + \ No newline at end of file diff --git a/docs/api/api_docs/modules/quantization_config.html b/docs/api/api_docs/modules/quantization_config.html index 2bd31e1fe..2639a8d4a 100644 --- a/docs/api/api_docs/modules/quantization_config.html +++ b/docs/api/api_docs/modules/quantization_config.html @@ -2,12 +2,12 @@ - + - + - quantization_config Module — MCT Documentation: ver 1.4.0 + quantization_config Module — MCT Documentation: ver 1.11.0 @@ -15,6 +15,7 @@ + @@ -30,7 +31,7 @@

    Navigation

  • index
  • - + @@ -41,13 +42,13 @@

    Navigation

    -

    quantization_config Module

    +

    quantization_config Module

    -

    QuantizationErrorMethod

    +

    QuantizationErrorMethod

    Enum to select a method for quantization parameters’ selection:

    -
    -class model_compression_toolkit.QuantizationErrorMethod(value)
    +
    +class model_compression_toolkit.core.QuantizationErrorMethod(value)

    Method for quantization threshold selection:

    NOCLIPPING - Use min/max values as thresholds.

    MSE - Use min square error for minimizing quantization noise.

    @@ -61,20 +62,20 @@

    QuantizationErrorMethod

    -

    QuantizationConfig

    +

    QuantizationConfig

    Class to configure the quantization process of the model:

    -
    -class model_compression_toolkit.QuantizationConfig(activation_error_method=QuantizationErrorMethod.MSE, weights_error_method=QuantizationErrorMethod.MSE, relu_bound_to_power_of_2=False, weights_bias_correction=True, weights_per_channel_threshold=True, input_scaling=False, softmax_shift=False, shift_negative_activation_correction=False, activation_channel_equalization=False, z_threshold=math.inf, min_threshold=MIN_THRESHOLD, l_p_value=2, shift_negative_ratio=0.05, shift_negative_threshold_recalculation=False)
    +
    +class model_compression_toolkit.core.QuantizationConfig(activation_error_method=QuantizationErrorMethod.MSE, weights_error_method=QuantizationErrorMethod.MSE, relu_bound_to_power_of_2=False, weights_bias_correction=True, weights_second_moment_correction=False, input_scaling=False, softmax_shift=False, shift_negative_activation_correction=False, activation_channel_equalization=False, z_threshold=math.inf, min_threshold=MIN_THRESHOLD, l_p_value=2, linear_collapsing=True, residual_collapsing=True, shift_negative_ratio=0.05, shift_negative_threshold_recalculation=False, shift_negative_params_search=False)

    Class to wrap all the different parameters the library uses to quantize the input model.
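    For example, a minimal sketch of a custom quantization configuration (the chosen error methods and flag are illustrative):

    >>> import model_compression_toolkit as mct
    >>> qc = mct.core.QuantizationConfig(activation_error_method=mct.core.QuantizationErrorMethod.NOCLIPPING,
    >>>                                  weights_error_method=mct.core.QuantizationErrorMethod.MSE,
    >>>                                  weights_bias_correction=True)
    >>> core_config = mct.core.CoreConfig(quantization_config=qc)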

    -
    Parameters
    +
    Parameters:
    @@ -130,7 +134,7 @@

    Quick search

    - +
    @@ -141,13 +145,13 @@

    Navigation

  • index
  • - + \ No newline at end of file diff --git a/docs/api/api_docs/modules/target_platform.html b/docs/api/api_docs/modules/target_platform.html index e3f421a7a..e57071ab8 100644 --- a/docs/api/api_docs/modules/target_platform.html +++ b/docs/api/api_docs/modules/target_platform.html @@ -2,12 +2,12 @@ - + - + - target_platform Module — MCT Documentation: ver 1.4.0 + target_platform Module — MCT Documentation: ver 1.11.0 @@ -15,6 +15,7 @@ + @@ -30,7 +31,7 @@

    Navigation

  • index
  • - + @@ -41,7 +42,7 @@

    Navigation

    -

    target_platform Module

    +

    target_platform Module

    MCT can be configured to quantize and optimize models for different hardware settings. For example, when using qnnpack backend for Pytorch model inference, Pytorch quantization configuration @@ -50,28 +51,30 @@

    Navigation

    Conv2D.

    This can be addressed in MCT by using the target_platform module, that can configure different parameters that are hardware-related, and the optimization process will use this to optimize the model accordingly. -Models for TFLite and qnnpack can be observed here, and can be used using get_target_platform_capabilities function.

    +Models for IMX500, TFLite and qnnpack can be observed here, and can be used using get_target_platform_capabilities function.


    Note

    -

    For now, fusing operators information from TargetPlatformModel -is ignored during the optimization process (fusing still occurs but using an existing mechanism). -Also, parts of OpQuantizationConfig is ignored (currently, -the quantizer type, number of bits, and quantization enable/disable information is used during the -optimization process).

    +

    For now, some fields of OpQuantizationConfig are ignored during the optimization process (currently, the quantizer type, number of bits, and quantization enable/disable information are in use).


    +

    The object MCT should get is called TargetPlatformCapabilities (or TPC for short). This diagram demonstrates the main components:

    +../../../images/tpc.jpg +

    Now, we will explain each component with examples.

    The first part is configuring the quantization method for both weights and activations of an operator. Several methods are available via the QuantizationMethod API:

    -

    QuantizationMethod

    +

    QuantizationMethod

    Select a method to use during quantization:

    @@ -79,9 +82,10 @@

    QuantizationMethod @@ -91,25 +95,23 @@

    QuantizationMethod -

    OpQuantizationConfig

    +

    OpQuantizationConfig

    -class model_compression_toolkit.target_platform.OpQuantizationConfig(activation_quantization_method, weights_quantization_method, activation_n_bits, weights_n_bits, weights_per_channel_threshold, enable_weights_quantization, enable_activation_quantization, quantization_preserving, fixed_scale, fixed_zero_point, weights_multiplier_nbits)
    +class model_compression_toolkit.target_platform.OpQuantizationConfig(default_weight_attr_config, attr_weights_configs_mapping, activation_quantization_method, activation_n_bits, enable_activation_quantization, quantization_preserving, fixed_scale, fixed_zero_point, simd_size)

    OpQuantizationConfig is a class to configure the quantization parameters of an operator.

    -
    Parameters
    +
    Parameters:
      +
    • default_weight_attr_config (AttributeQuantizationConfig) – A default attribute quantization configuration for the operation.

    • +
    • attr_weights_configs_mapping (dict) – A mapping between an op attribute name and its quantization configuration.

    • activation_quantization_method (QuantizationMethod) – Which method to use from QuantizationMethod for activation quantization.

    • -
    • weights_quantization_method (QuantizationMethod) – Which method to use from QuantizationMethod for weights quantization.

    • activation_n_bits (int) – Number of bits to quantize the activations.

    • -
    • weights_n_bits (int) – Number of bits to quantize the coefficients.

    • -
    • weights_per_channel_threshold (bool) – Whether to quantize the weights per-channel or not (per-tensor).

    • -
    • enable_weights_quantization (bool) – Whether to quantize the model weights or not.

    • enable_activation_quantization (bool) – Whether to quantize the model activations or not.

    • quantization_preserving (bool) – Whether quantization parameters should be the same for an operator’s input and output.

    • fixed_scale (float) – Scale to use for an operator quantization parameters.

    • fixed_zero_point (int) – Zero-point to use for an operator quantization parameters.

    • -
    • weights_multiplier_nbits (int) – Number of bits to use when quantizing in look-up-table.

    • +
    • simd_size (int) – Per op integer representing the Single Instruction, Multiple Data (SIMD) width of an operator. It indicates the number of data elements that can be fetched and processed simultaneously in a single instruction.

    @@ -141,14 +143,14 @@

    OpQuantizationConfig

    -

    QuantizationConfigOptions

    +

    QuantizationConfigOptions

    class model_compression_toolkit.target_platform.QuantizationConfigOptions(quantization_config_list, base_config=None)

    Wrap a set of quantization configurations to consider during the quantization of an operator.

    -
    Parameters
    +
    Parameters:
    -

    LayerFilterParams

    +

    LayerFilterParams

    class model_compression_toolkit.target_platform.LayerFilterParams(layer, *conditions, **kwargs)

    Wrap a layer with filters to filter framework’s layers by their attributes.

    -
    Parameters
    +
    Parameters:
    • layer – Layer to match when filtering.

    • *conditions (AttributeFilter) – List of conditions to satisfy.

    • @@ -591,16 +598,17 @@

      LayerFilterParams -

      TargetPlatformCapabilities

      +

      TargetPlatformCapabilities

      -class model_compression_toolkit.target_platform.TargetPlatformCapabilities(tp_model, name='base')
      +class model_compression_toolkit.target_platform.TargetPlatformCapabilities(tp_model, name='base', version=None)

      Attach framework information to a modeled hardware.

      -
      Parameters
      +
      Parameters:
      • tp_model (TargetPlatformModel) – Modeled hardware to attach framework information to.

      • name (str) – Name of the TargetPlatformCapabilities.

      • +
      • version (str) – TPC version.

      @@ -611,87 +619,79 @@

      TargetPlatformCapabilities -

      TargetPlatformCapabilities Code Example

      -
      
      -import tensorflow as tf
      +

      TargetPlatformCapabilities Code Example

      +
      from typing import List, Tuple
       
      -from model_compression_toolkit.common.target_platform import TargetPlatformModel
      +import model_compression_toolkit as mct
      +from model_compression_toolkit.constants import FLOAT_BITWIDTH
      +from model_compression_toolkit.target_platform_capabilities.constants import KERNEL_ATTR, BIAS_ATTR, WEIGHTS_N_BITS
      +from model_compression_toolkit.target_platform_capabilities.target_platform import OpQuantizationConfig, \
      +    TargetPlatformModel
      +from model_compression_toolkit.target_platform_capabilities.target_platform.op_quantization_config import \
      +    AttributeQuantizationConfig
       
      -if tf.__version__ < "2.6":
      -    from tensorflow.keras.layers import Conv2D, DepthwiseConv2D, Dense, Conv2DTranspose, Reshape, ZeroPadding2D, Dropout, \
      -        MaxPooling2D, Activation, ReLU, Add, PReLU, Flatten, Cropping2D
      -else:
      -    from keras.layers import Conv2D, DepthwiseConv2D, Dense, Conv2DTranspose, Reshape, ZeroPadding2D, \
      -    Dropout, MaxPooling2D, Activation, ReLU, Add, PReLU, Flatten, Cropping2D
      +tp = mct.target_platform
       
      -from model_compression_toolkit.tpc_models.default_tp_model import get_default_tp_model
       
      -import model_compression_toolkit as mct
      -tpc = mct.target_platform
      +def get_tp_model() -> TargetPlatformModel:
      +    """
      +    A method that generates a default target platform model, with base 8-bit quantization configuration and 8, 4, 2
      +    bits configuration list for mixed-precision quantization.
      +    NOTE: in order to generate a target platform model with different configurations but with the same Operators Sets
      +    (for tests, experiments, etc.), use this method implementation as a test-case, i.e., override the
      +    'get_op_quantization_configs' method and use its output to call 'generate_tp_model' with your configurations.
       
      +    Returns: A TargetPlatformModel object.
       
      -def get_default_keras_tpc():
      -    default_tp_model = get_default_tp_model()
      -    return generate_keras_default_tpc(name='default_keras_tpc',
      -                                      tp_model=default_tp_model)
      +    """
      +    base_config, mixed_precision_cfg_list, default_config = get_op_quantization_configs()
      +    return generate_tp_model(default_config=default_config,
      +                             base_config=base_config,
      +                             mixed_precision_cfg_list=mixed_precision_cfg_list,
      +                             name='imx500_tp_model')
       
       
      -def generate_keras_default_tpc(name: str, tp_model: TargetPlatformModel):
      -    """
      -    Generates a TargetPlatformCapabilities object with default operation sets to layers mapping.
      +def get_op_quantization_configs() -> Tuple[OpQuantizationConfig, List[OpQuantizationConfig], OpQuantizationConfig]:
      +    """
      +    Creates a default configuration object for 8-bit quantization, to be used to set a default TargetPlatformModel.
      +    In addition, creates a default configuration objects list (with 8, 4 and 2 bit quantization) to be used as
      +    default configuration for mixed-precision quantization.
       
      -    Args:
      -        name: Name of the TargetPlatformCapabilities.
      -        tp_model: TargetPlatformModel object.
      +    Returns: An OpQuantizationConfig config object and a list of OpQuantizationConfig objects.
       
      -    Returns: a TargetPlatformCapabilities object for the given TargetPlatformModel.
           """
       
      -    keras_tpc = tpc.TargetPlatformCapabilities(tp_model,
      -                                                name=name)
      -    with keras_tpc:
      -        tpc.OperationsSetToLayers("NoQuantization", [Reshape,
      -                                                     tf.reshape,
      -                                                     Flatten,
      -                                                     Cropping2D,
      -                                                     ZeroPadding2D,
      -                                                     Dropout,
      -                                                     MaxPooling2D,
      -                                                     tf.split,
      -                                                     tf.quantization.fake_quant_with_min_max_vars,
      -                                                     tf.math.argmax,
      -                                                     tf.shape,
      -                                                     tf.__operators__.getitem])
      -
      -        tpc.OperationsSetToLayers("Conv", [Conv2D,
      -                                           DepthwiseConv2D,
      -                                           tf.nn.conv2d,
      -                                           tf.nn.depthwise_conv2d])
      -
      -        tpc.OperationsSetToLayers("FullyConnected", [Dense])
      -
      -        tpc.OperationsSetToLayers("ConvTranspose", [Conv2DTranspose,
      -                                                    tf.nn.conv2d_transpose])
      -
      -        tpc.OperationsSetToLayers("AnyReLU", [tf.nn.relu,
      -                                              tf.nn.relu6,
      -                                              tpc.LayerFilterParams(ReLU, negative_slope=0.0),
      -                                              tpc.LayerFilterParams(Activation, activation="relu")])
      -
      -        tpc.OperationsSetToLayers("Add", [tf.add,
      -                                          Add])
      -
      -        tpc.OperationsSetToLayers("PReLU", [PReLU])
      -
      -        tpc.OperationsSetToLayers("Swish", [tf.nn.swish,
      -                                            tpc.LayerFilterParams(Activation, activation="swish")])
      -
      -        tpc.OperationsSetToLayers("Sigmoid", [tf.nn.sigmoid,
      -                                              tpc.LayerFilterParams(Activation, activation="sigmoid")])
      -
      -        tpc.OperationsSetToLayers("Tanh", [tf.nn.tanh,
      -                                           tpc.LayerFilterParams(Activation, activation="tanh")])
      -    return keras_tpc
      +    # TODO: currently, we don't want to quantize any attribute but the kernel by default,
      +    #  to preserve the current behavior of MCT, so quantization is disabled for all other attributes.
      +    #  Other quantization parameters are set to what we eventually want to quantize by default
      +    #  when we enable multi-attribute quantization - THIS NEEDS TO BE MODIFIED IN ALL TP MODELS!
      +
      +    # define a default quantization config for all non-specified weights attributes.
      +    default_weight_attr_config = AttributeQuantizationConfig(
      +        weights_quantization_method=tp.QuantizationMethod.POWER_OF_TWO,
      +        weights_n_bits=8,
      +        weights_per_channel_threshold=False,
      +        enable_weights_quantization=False,  # TODO: change to True once multi-attribute quantization is implemented
      +        lut_values_bitwidth=None)
      +
      +    # define a quantization config to quantize the kernel (for layers where there is a kernel attribute).
      +    kernel_base_config = AttributeQuantizationConfig(
      +        weights_quantization_method=tp.QuantizationMethod.SYMMETRIC,
      +        weights_n_bits=8,
      +        weights_per_channel_threshold=True,
      +        enable_weights_quantization=True,
      +        lut_values_bitwidth=None)
      +
      +    # define a quantization config to quantize the bias (for layers where there is a bias attribute).
      +    bias_config = AttributeQuantizationConfig(
      +        weights_quantization_method=tp.QuantizationMethod.POWER_OF_TWO,
      +        weights_n_bits=FLOAT_BITWIDTH,
      +        weights_per_channel_threshold=False,
      +        enable_weights_quantization=False,
      +        lut_values_bitwidth=None)
      +
      +    # Create a quantization config.
      +    # A quantization configuration defines how an operator
       

diff --git a/docs/api/api_docs/modules/trainable_infrastructure.html b/docs/api/api_docs/modules/trainable_infrastructure.html
new file mode 100644
index 000000000..db6e20290
--- /dev/null
+++ b/docs/api/api_docs/modules/trainable_infrastructure.html
@@ -0,0 +1,216 @@

trainable_infrastructure Module — MCT Documentation: ver 1.11.0

trainable_infrastructure Module

The trainable infrastructure is a module containing quantization abstraction and quantizers for hardware-oriented model optimization tools.
It provides the required abstraction for trainable quantization methods such as quantization-aware training.
It utilizes the Inferable Quantizers Infrastructure provided by the MCT Quantizers package, which offers the required abstraction for emulating inference-time quantization.

When using a trainable quantizer, each layer with quantized weights is wrapped with a “Quantization Wrapper” object,
and each activation quantizer is stored in an “Activation Quantization Holder” object.
Both components are provided by the MCT Quantizers package.
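As a rough illustration of the wrapping described above (an editorial sketch, not part of this page), a Keras layer and an activation quantizer might be attached to the MCT Quantizers components as shown below; the exact class and argument names are assumptions about the mct_quantizers API and should be checked against the installed package.

    import tensorflow as tf
    from mct_quantizers import KerasQuantizationWrapper, KerasActivationQuantizationHolder

    # 'weight_quantizer' and 'activation_quantizer' are hypothetical placeholders for
    # quantizer instances (trainable or inferable) created elsewhere.
    wrapped_conv = KerasQuantizationWrapper(tf.keras.layers.Conv2D(16, 3),
                                            weights_quantizers={'kernel': weight_quantizer})

    # The activation quantizer lives in its own layer, inserted after the wrapped op.
    activation_holder = KerasActivationQuantizationHolder(activation_quantizer)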

The quantizers in this module are built upon the “Inferable Quantizer” abstraction (from MCT Quantizers),
and define the “Trainable Quantizer” framework,
which contains learnable quantization parameters that can be optimized during training.

Next, we explain how a trainable quantizer is built and used.
We start with the basic building block of a trainable quantizer, and then explain how to initialize it using a configuration object.

BaseKerasTrainableQuantizer

This class is a base class for trainable Keras quantizers. It validates the provided quantization config and defines an abstract function which any quantizer needs to implement.
It adds get_config and from_config functions to the base quantizer, to enable loading and saving of the Keras model.

class model_compression_toolkit.trainable_infrastructure.BaseKerasTrainableQuantizer(quantization_config)

    This class is a base quantizer which validates the provided quantization config and defines an abstract function which any quantizer needs to implement.
    This class adds get_config and from_config functions to the base quantizer, to enable loading and saving of the Keras model.

    Parameters:
        quantization_config – a quantizer config class that contains all the information about the quantizer configuration.

BasePytorchTrainableQuantizer

This class is a base class for trainable Pytorch quantizers. It validates the provided quantization config and defines an abstract function which any quantizer needs to implement.
It adds get_config and from_config functions to the base quantizer, to enable loading and saving of the model.

class model_compression_toolkit.trainable_infrastructure.BasePytorchTrainableQuantizer(quantization_config)

    This class is a base Pytorch quantizer which validates the provided quantization config and defines an
    abstract function which any quantizer needs to implement.

    Parameters:
        quantization_config – a quantizer config class that contains all the information about the quantizer configuration.

TrainableQuantizerWeightsConfig

This configuration object contains the necessary attributes for configuring a weights trainable quantizer.

class model_compression_toolkit.trainable_infrastructure.TrainableQuantizerWeightsConfig(weights_quantization_method, weights_n_bits, weights_quantization_params, enable_weights_quantization, weights_channels_axis, weights_per_channel_threshold, min_threshold, weights_quantization_candidates=None)

    Attributes for configuring a weights trainable quantizer.

    Parameters:
        • weights_quantization_method (QuantizationMethod) – Which method to use from QuantizationMethod for weights quantization.
        • weights_n_bits (int) – Number of bits to quantize the coefficients.
        • weights_quantization_params (Dict) – Dictionary that contains weights quantization params.
        • enable_weights_quantization (bool) – Whether to quantize the layer’s weights or not.
        • weights_channels_axis (int) – Axis along which to quantize the node’s kernel when quantizing per-channel.
        • weights_per_channel_threshold (bool) – Whether to quantize the weights per-channel or not (per-tensor).
        • min_threshold (float) – Minimum threshold to use during threshold selection.

For example, we can set a trainable weights quantizer with the following configuration:

from model_compression_toolkit.target_platform_capabilities.target_platform import QuantizationMethod
from model_compression_toolkit.constants import THRESHOLD, MIN_THRESHOLD

TrainableQuantizerWeightsConfig(weights_quantization_method=QuantizationMethod.SYMMETRIC,
                                weights_n_bits=8,
                                weights_quantization_params={THRESHOLD: 2.0},
                                enable_weights_quantization=True,
                                weights_channels_axis=3,
                                weights_per_channel_threshold=True,
                                min_threshold=MIN_THRESHOLD)
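As a side note (added for orientation, not taken from this page): if weights_channels_axis=3 in the example above refers to a Keras Conv2D kernel, which is an assumption, then axis 3 is the kernel's output-channel axis, i.e. the axis along which per-channel thresholds would be computed.

    import tensorflow as tf

    conv = tf.keras.layers.Conv2D(filters=16, kernel_size=3)
    conv.build((None, 32, 32, 3))   # NHWC input with 3 channels
    print(conv.kernel.shape)        # (3, 3, 3, 16): axis 3 holds the 16 output channels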

TrainableQuantizerActivationConfig

This configuration object contains the necessary attributes for configuring an activation trainable quantizer.

class model_compression_toolkit.trainable_infrastructure.TrainableQuantizerActivationConfig(activation_quantization_method, activation_n_bits, activation_quantization_params, enable_activation_quantization, min_threshold, activation_quantization_candidates=None)

    Attributes for configuring an activation trainable quantizer.

    Parameters:
        • activation_quantization_method (QuantizationMethod) – Which method to use from QuantizationMethod for activation quantization.
        • activation_n_bits (int) – Number of bits to quantize the activations.
        • activation_quantization_params (Dict) – Dictionary that contains activation quantization params.
        • enable_activation_quantization (bool) – Whether to quantize the layer’s activations or not.
        • min_threshold (float) – Minimum threshold to use during threshold selection.

For example, we can set a trainable activation quantizer with the following configuration:

from model_compression_toolkit.target_platform_capabilities.target_platform import QuantizationMethod
from model_compression_toolkit.constants import THRESHOLD, MIN_THRESHOLD

TrainableQuantizerActivationConfig(activation_quantization_method=QuantizationMethod.UNIFORM,
                                   activation_n_bits=8,
                                   activation_quantization_params={THRESHOLD: 2.0},
                                   enable_activation_quantization=True,
                                   min_threshold=MIN_THRESHOLD)

diff --git a/docs/api/api_docs/notes/tpc_note.html b/docs/api/api_docs/notes/tpc_note.html
index 3d79c2ff9..79e6b0b0c 100644
--- a/docs/api/api_docs/notes/tpc_note.html
+++ b/docs/api/api_docs/notes/tpc_note.html
@@ -2,12 +2,12 @@
-<no title> — MCT Documentation: ver 1.4.0
+<no title> — MCT Documentation: ver 1.11.0
@@ -15,6 +15,7 @@
@@ -30,7 +31,7 @@

@@ -42,13 +43,11 @@
 Note

-For now, fusing operators information from TargetPlatformModel
-is ignored during the optimization process (fusing still occurs but using an existing mechanism).
-Also, parts of OpQuantizationConfig is ignored (currently,
-the quantizer type, number of bits, and quantization enable/disable information is used during the
-optimization process).
+For now, some fields of OpQuantizationConfig are ignored during
+the optimization process (currently, the quantizer type, number of bits, and quantization enable/disable information
+are in use).

diff --git a/docs/genindex.html b/docs/genindex.html
index 349de2131..9fb67ca01 100644
--- a/docs/genindex.html
+++ b/docs/genindex.html
(regenerated auto-generated index page; per-entry changes omitted)
diff --git a/docs/guidelines/quickstart_pytorch.html b/docs/guidelines/quickstart_pytorch.html
index ba3a9d422..ab11858b8 100644
--- a/docs/guidelines/quickstart_pytorch.html
+++ b/docs/guidelines/quickstart_pytorch.html
@@ -20,7 +20,7 @@