Skip to content

Commit af228db

Browse files
author
reuvenp
committed
Use the new TargetInclusionCriterion.AnyQuantizedNonFused mode during mixed precision (MP)
1 parent 4bf622d commit af228db

File tree

4 files changed

+9
-6
lines changed

4 files changed

+9
-6
lines changed

model_compression_toolkit/core/common/mixed_precision/mixed_precision_ru_helper.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -51,7 +51,7 @@ def compute_utilization(self, ru_targets: Set[RUTarget], mp_cfg: Dict[BaseNode,
51 51
"""
52 52
act_qcs, w_qcs = self.get_quantization_candidates(mp_cfg)
53 53

54-
ru, detailed_ru = self.ru_calculator.compute_resource_utilization(TargetInclusionCriterion.AnyQuantized,
54+
ru, detailed_ru = self.ru_calculator.compute_resource_utilization(TargetInclusionCriterion.AnyQuantizedNonFused,
55 55
BitwidthMode.QCustom,
56 56
act_qcs=act_qcs,
57 57
w_qcs=w_qcs,

model_compression_toolkit/core/common/mixed_precision/mixed_precision_search_manager.py

Lines changed: 6 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -295,9 +295,12 @@ def compute_resource_utilization_for_config(self, config: Dict[BaseNode, int]) -
295 295
296 296
"""
297 297
act_qcs, w_qcs = self.ru_helper.get_quantization_candidates(config)
298-
ru = self.ru_helper.ru_calculator.compute_resource_utilization(
299-
target_criterion=TargetInclusionCriterion.AnyQuantized, bitwidth_mode=BitwidthMode.QCustom, act_qcs=act_qcs,
300-
w_qcs=w_qcs, ru_targets=self.ru_targets, allow_unused_qcs=True)
298+
ru = self.ru_helper.ru_calculator.compute_resource_utilization(target_criterion=TargetInclusionCriterion.AnyQuantizedNonFused,
299+
bitwidth_mode=BitwidthMode.QCustom,
300+
act_qcs=act_qcs,
301+
w_qcs=w_qcs,
302+
ru_targets=self.ru_targets,
303+
allow_unused_qcs=True)
301 304
return ru
302 305

303 306
def _finalize_distance_metric(self, layer_to_metrics_mapping: Dict[BaseNode, List[float]]):

model_compression_toolkit/core/common/mixed_precision/resource_utilization_tools/resource_utilization_data.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -63,4 +63,4 @@ def compute_resource_utilization_data(in_model: Any,
63 63
running_gptq=False)
64 64

65 65
ru_calculator = ResourceUtilizationCalculator(transformed_graph, fw_impl, fw_info)
66-
return ru_calculator.compute_resource_utilization(TargetInclusionCriterion.AnyQuantized, BitwidthMode.QDefaultSP)
66+
return ru_calculator.compute_resource_utilization(TargetInclusionCriterion.AnyQuantizedNonFused, BitwidthMode.QDefaultSP)

model_compression_toolkit/core/runner.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -220,7 +220,7 @@ def _set_final_resource_utilization(graph: Graph,
220 220
ru_calculator = ResourceUtilizationCalculator(graph, fw_impl, fw_info)
221 221
w_qcs = {n.name: n.final_weights_quantization_cfg for n in graph.nodes}
222 222
a_qcs = {n.name: n.final_activation_quantization_cfg for n in graph.nodes}
223-
final_ru = ru_calculator.compute_resource_utilization(TargetInclusionCriterion.AnyQuantized,
223+
final_ru = ru_calculator.compute_resource_utilization(TargetInclusionCriterion.AnyQuantizedNonFused,
224 224
BitwidthMode.QCustom, act_qcs=a_qcs, w_qcs=w_qcs,
225 225
ru_targets=ru_targets, allow_unused_qcs=True)
226 226
summary = final_ru.get_summary_str(restricted=True)

0 commit comments

Comments
 (0)