1 parent 67c0b89 commit bfe8b06
examples/models/llama/model.py
@@ -289,15 +289,6 @@ def __init__(self, **kwargs):
     def get_eager_model(self) -> torch.nn.Module:
         return self.model_
 
-        if self.checkpoint_dtype:
-            # convert to the type of the provided checkpoint
-            # input and output are torch.long, so signature unchanged
-            return self.model_.to(self.checkpoint_dtype)
-        else:
-            # int8 quantization code has some bf16,
-            # switch all to FP32
-            return self.model_.to(torch.float32)
-
     def get_example_inputs(self):
         if self.use_kv_cache:
             return self.get_example_inputs_kvcache_sdpa()
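The deleted block was unreachable: it sat below the unconditional `return self.model_`, so neither dtype branch could ever execute. A minimal standalone sketch of that pattern (hypothetical names, not taken from the repo) shows the effect:

```python
import torch

def get_eager_model_before(model_: torch.nn.Module,
                           checkpoint_dtype=None) -> torch.nn.Module:
    # Mirrors the pre-commit shape of the method in the diff above.
    return model_
    # Everything below this return is dead code -- it corresponds to the
    # lines removed by this commit and can never run.
    if checkpoint_dtype:
        return model_.to(checkpoint_dtype)
    else:
        return model_.to(torch.float32)

# The requested bf16 cast never happens, because the .to() branch is
# unreachable; the model comes back in its default fp32 dtype.
m = get_eager_model_before(torch.nn.Linear(2, 2),
                           checkpoint_dtype=torch.bfloat16)
print(next(m.parameters()).dtype)  # torch.float32
```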