hutlim
/

hutlim committed on
Commit
bb5fb45
·
verified ·
1 Parent(s): 2f3cbcd

Update handler.py

Browse files
Files changed (1) hide show
  1. handler.py +2 -4
handler.py CHANGED
@@ -39,20 +39,18 @@ class EndpointHandler:
39
  )
40
 
41
  self.device = "cuda" if torch.cuda.is_available() else "cpu"
42
- self.torch_dtype = torch.float16 if self.device == "cuda" else torch.float32
43
 
44
  self.tokenizer = AutoTokenizer.from_pretrained(
45
  str(model_dir),
46
  padding_side="left",
47
  trust_remote_code=True,
48
- local_files_only=True,
49
  )
50
 
51
  self.model = AutoModelForCausalLM.from_pretrained(
52
  str(model_dir),
53
- torch_dtype=self.torch_dtype,
54
  trust_remote_code=True,
55
- local_files_only=True,
56
  ).to(self.device).eval()
57
 
58
  # Safer token lookup for decoder LMs: include leading space variants if needed
 
39
  )
40
 
41
  self.device = "cuda" if torch.cuda.is_available() else "cpu"
42
+ self.dtype = torch.float16 if self.device == "cuda" else torch.float32
43
 
44
  self.tokenizer = AutoTokenizer.from_pretrained(
45
  str(model_dir),
46
  padding_side="left",
47
  trust_remote_code=True,
 
48
  )
49
 
50
  self.model = AutoModelForCausalLM.from_pretrained(
51
  str(model_dir),
52
+ dtype=self.dtype,
53
  trust_remote_code=True,
 
54
  ).to(self.device).eval()
55
 
56
  # Safer token lookup for decoder LMs: include leading space variants if needed