Move clip_text_model to CUDA

shell-nlp · shell-nlp · commit 37f98ae49c15 · 2025-06-09T16:22:37.000+08:00
diff --git a/gpt_server/model_worker/embedding.py b/gpt_server/model_worker/embedding.py
@@ -48,6 +48,11 @@ def __init__(
             self.client = AutoModel.from_pretrained(
                 model_path, trust_remote_code=True
             )  # You must set trust_remote_code=True
+            if device == "cuda":
+                self.client.to(
+                    torch.device("cuda" if torch.cuda.is_available() else "cpu")
+                )
+                logger.info(f"device: {self.client.device}")
             self.client.set_processor(model_path)
             self.client.eval()
         else: