fredaddy committed on
Commit
a1c2e19
1 Parent(s): db6f154

Update handler.py

Browse files
Files changed (1) hide show
  1. handler.py +1 -2
handler.py CHANGED
@@ -14,8 +14,7 @@ class EndpointHandler:
14
  trust_remote_code=True,
15
  attn_implementation='sdpa',
16
  torch_dtype=torch.bfloat16 if self.device.type == "cuda" else torch.float32,
17
- device_map="auto",
18
- )
19
  self.model.eval()
20
 
21
  # Load the tokenizer
 
14
  trust_remote_code=True,
15
  attn_implementation='sdpa',
16
  torch_dtype=torch.bfloat16 if self.device.type == "cuda" else torch.float32,
17
+ ).to(self.device)
 
18
  self.model.eval()
19
 
20
  # Load the tokenizer