Update handler.py
Browse files — handler.py +1 -2
handler.py
CHANGED
```diff
@@ -14,8 +14,7 @@ class EndpointHandler:
 trust_remote_code=True,
 attn_implementation='sdpa',
 torch_dtype=torch.bfloat16 if self.device.type == "cuda" else torch.float32,
-
-)
+).to(self.device)
 self.model.eval()
 
 # Load the tokenizer
```