
Commit c74b0b7

Lunwen He authored and facebook-github-bot committed
Replace torch.empty with torch.zeros (pytorch#6478)
Summary:
X-link: pytorch/ao#1157

It turns out that it is unsafe to use `torch.empty` in an OSS environment, because `torch.empty` creates a tensor with uninitialized data: the buffer can hold arbitrary values depending on what was previously left in that memory, which leads to inconsistent behavior. This PR replaces `torch.empty` with `torch.zeros` so that the buffers are properly initialized and the behavior is consistent.

Reviewed By: msaroufim

Differential Revision: D64875312
1 parent e93ad5f commit c74b0b7
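
As a quick, standalone illustration of the issue described in the summary (not part of the commit itself), the snippet below shows why `torch.empty`-backed buffers can vary between runs while `torch.zeros` is deterministic:

import torch

# torch.empty only allocates memory; the contents are whatever bytes happen
# to be in that allocation, so values can differ between calls and runs.
a = torch.empty(4, dtype=torch.float32)
b = torch.empty(4, dtype=torch.float32)
print(a)  # arbitrary values
print(b)  # may differ from `a`, and from run to run

# torch.zeros allocates and initializes, so the result is always the same.
c = torch.zeros(4, dtype=torch.float32)
print(c)  # tensor([0., 0., 0., 0.])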

3 files changed: 11 additions, 7 deletions

examples/models/llama/source_transformation/lora.py

Lines changed: 2 additions & 0 deletions
@@ -70,6 +70,8 @@ def __init__(
             precision=precision,
             scales_precision=scales_precision,
         )
+        # TODO(lunwenh): Remove this once TorchAO's commit pin in ExecuTorch is updated to include this PR
+        super().zeros = torch.zeros_like(super().zeros)
         self.adaptor = LoRAAdaptorLinear(
             in_features,
             out_features,

examples/models/llama/source_transformation/pre_quantization.py

Lines changed: 2 additions & 0 deletions
@@ -46,6 +46,8 @@ def replacement_fn(child: torch.nn.Module) -> torch.nn.Module:
             precision=precision,
             scales_precision=scales_precision,
         )
+        # TODO(lunwenh): Remove this once TorchAO's commit pin in ExecuTorch is updated to include this PR
+        new_linear.zeros = torch.zeros_like(new_linear.zeros)
         return new_linear

     _replace_with_custom_fn_if_matches_filter(module, replacement_fn, filter_fn)
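
For readers unfamiliar with the swap pattern used in this file, here is a minimal, self-contained sketch of filter-and-replace module substitution. It is written generically and does not reproduce the helper imported by the ExecuTorch source; the name `replace_modules` below is illustrative only:

import torch.nn as nn
from typing import Callable

def replace_modules(
    module: nn.Module,
    replacement_fn: Callable[[nn.Module], nn.Module],
    filter_fn: Callable[[nn.Module], bool],
) -> None:
    # Recursively walk the module tree; children matching filter_fn are
    # swapped in place with whatever replacement_fn returns for them.
    for name, child in module.named_children():
        if filter_fn(child):
            setattr(module, name, replacement_fn(child))
        else:
            replace_modules(child, replacement_fn, filter_fn)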

examples/models/llama/source_transformation/quantize.py

Lines changed: 7 additions & 7 deletions
@@ -375,7 +375,7 @@ def __init__(
         self.in_features = in_features
         self.out_features = out_features
         self.register_buffer(
-            "weight", torch.empty((out_features, in_features), dtype=torch.int8)
+            "weight", torch.zeros((out_features, in_features), dtype=torch.int8)
         )
         self.register_buffer("scales", torch.ones(out_features, dtype=torch.bfloat16))

@@ -448,18 +448,18 @@ def __init__(
         # currently storing unpacked int8 weights
         self.register_buffer(
             "weight",
-            torch.empty((out_features, in_features), dtype=torch.int8),
+            torch.zeros((out_features, in_features), dtype=torch.int8),
         )
         self.register_buffer(
             "scales",
-            torch.empty(
+            torch.zeros(
                 (out_features),
                 dtype=torch.float32,
             ),
         )
         self.register_buffer(
             "zeros",
-            torch.empty(
+            torch.zeros(
                 (out_features),
                 dtype=torch.float32,
             ),
@@ -632,15 +632,15 @@ def __init__(
         if not packed:
             self.register_buffer(
                 "weight",
-                torch.empty(
+                torch.zeros(
                     (vocab_size, embedding_dim), dtype=torch.int8, device=device
                 ),
             )
         else:  # packed
             if bitwidth == 2:
                 self.register_buffer(
                     "weight",
-                    torch.empty(
+                    torch.zeros(
                         (vocab_size, embedding_dim // 4),
                         dtype=torch.uint8,
                         device=device,
@@ -649,7 +649,7 @@ def __init__(
             elif bitwidth == 4:
                 self.register_buffer(
                     "weight",
-                    torch.empty(
+                    torch.zeros(
                         (vocab_size, embedding_dim // 2),
                         dtype=torch.uint8,
                         device=device,
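
For context, here is a minimal sketch of the buffer-registration pattern touched throughout quantize.py (not the actual ExecuTorch classes; the class name and forward pass are illustrative). With `torch.zeros`, the placeholder buffers hold deterministic values until real quantized weights are loaded into them:

import torch
import torch.nn as nn

class Int8WeightOnlyLinearSketch(nn.Module):
    # Hypothetical stand-in for the quantized linear modules edited above.
    def __init__(self, in_features: int, out_features: int):
        super().__init__()
        self.in_features = in_features
        self.out_features = out_features
        # Zero-initialized placeholder; with torch.empty this buffer would
        # hold whatever bytes the allocator happened to return.
        self.register_buffer(
            "weight", torch.zeros((out_features, in_features), dtype=torch.int8)
        )
        self.register_buffer("scales", torch.ones(out_features, dtype=torch.bfloat16))

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        # Dequantize on the fly: scale each output channel of the int8 weight.
        w = self.weight.to(x.dtype) * self.scales.to(x.dtype).unsqueeze(-1)
        return torch.nn.functional.linear(x, w)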
