Move autocast adjustment to separate method

jkosek · jkosek · commit 01ac364e1bd6 · 2024-11-14T14:36:52.000+01:00
diff --git a/model_navigator/runners/torch.py b/model_navigator/runners/torch.py
@@ -93,16 +93,7 @@ def activate_impl(self):
         self._input_module_device = get_module_device(self.model) or torch.device("cpu")
         self._loaded_model = self.model
         self._loaded_model.to(self.device).eval()
-
-        # TODO: Consider better handling for controlling autocast behavior
-        try:
-            if hasattr(self._loaded_model, "parameters") and self._autocast_dtype is None:
-                param_dtype = next(self._loaded_model.parameters()).dtype
-                if param_dtype in [torch.bfloat16, torch.int8, torch.uint8]:
-                    self._autocast = False
-                    LOGGER.warning(f"Model has {param_dtype} parameters. Disabling autocast.")
-        except StopIteration:
-            LOGGER.warning("Model has no parameters.")
+        self._adjust_autocast()
 
     def deactivate_impl(self):
         """Deactivation implementation."""
@@ -233,6 +224,17 @@ def _to_torch_tensor(self, value, dtype):
             raise ValueError(f"Unsupported type {type(value)}")
         return value
 
+    def _adjust_autocast(self):  # turns autocast off for bf16/int8/uint8 models; skipped if _autocast_dtype is set
+        # TODO: Consider better handling for controlling autocast behavior
+        try:
+            if hasattr(self._loaded_model, "parameters") and self._autocast_dtype is None:
+                param_dtype = next(self._loaded_model.parameters()).dtype  # only the first parameter is inspected
+                if param_dtype in [torch.bfloat16, torch.int8, torch.uint8]:
+                    self._autocast = False
+                    LOGGER.warning(f"Model has {param_dtype} parameters. Disabling autocast.")
+        except StopIteration:  # raised by next() when parameters() yields nothing
+            LOGGER.warning("Model has no parameters.")
+
 
 class _BaseTorchScriptRunner(_BaseTorchRunner):
     """Base runner for inference of TorchScript models."""
@@ -424,6 +426,7 @@ def activate_impl(self):
         exported_program = torch.export.load(str(self._model))
         self._loaded_model = exported_program.module()
         self._loaded_model.to(self.device)
+        self._adjust_autocast()
 
 
 class TorchExportedProgramCPURunner(_BaseTorchExportedProgramRunner):