[RLHF] Fix torch.dtype not serializable in example (#22158)

22quinn · web-flow · commit 845420ac2c2b · 2025-08-04T02:43:33.000Z
Signed-off-by: 22quinn <33176974+22quinn@users.noreply.github.com>
diff --git a/examples/offline_inference/rlhf.py b/examples/offline_inference/rlhf.py
@@ -126,7 +126,10 @@ def __init__(self, *args, **kwargs):
 
 # Synchronize the updated weights to the inference engine.
 for name, p in train_model.named_parameters():
-    handle = llm.collective_rpc.remote("update_weight", args=(name, p.dtype, p.shape))
+    dtype_name = str(p.dtype).split(".")[-1]
+    handle = llm.collective_rpc.remote(
+        "update_weight", args=(name, dtype_name, p.shape)
+    )
     model_update_group.broadcast(p, src=0, stream=torch.cuda.current_stream())
     ray.get(handle)
 
diff --git a/examples/offline_inference/rlhf_utils.py b/examples/offline_inference/rlhf_utils.py
@@ -45,7 +45,8 @@ def init_weight_update_group(
             self.device,
         )
 
-    def update_weight(self, name, dtype, shape):
+    def update_weight(self, name, dtype_name, shape):
+        dtype = getattr(torch, dtype_name)
         weight = torch.empty(shape, dtype=dtype, device="cuda")
         self.model_update_group.broadcast(
             weight, src=0, stream=torch.cuda.current_stream()

Original file line number	Diff line number	Diff line change
`@@ -45,7 +45,8 @@ def init_weight_update_group(`
`45`	`45`	`self.device,`
`46`	`46`	`)`
`47`	`47`
`48`		`- def update_weight(self, name, dtype, shape):`
	`48`	`+ def update_weight(self, name, dtype_name, shape):`
	`49`	`+ dtype = getattr(torch, dtype_name)`
`49`	`50`	`weight = torch.empty(shape, dtype=dtype, device="cuda")`
`50`	`51`	`self.model_update_group.broadcast(`
`51`	`52`	`weight, src=0, stream=torch.cuda.current_stream()`