Pierce Maloney committed on
Commit
eebf1ef
1 Parent(s): 0425154

adding back truncation

Browse files
Files changed (1) hide show
  1. handler.py +3 -3
handler.py CHANGED
@@ -31,11 +31,11 @@ class EndpointHandler():
31
 
32
  input_ids = self.tokenizer.encode(inputs, return_tensors="pt")
33
  max_generation_length = 75 # Desired number of tokens to generate
34
- # max_input_length = 4092 - max_generation_length # Maximum input length to allow space for generation
35
 
36
  # # Truncate input_ids to the most recent tokens that fit within the max_input_length
37
- # if input_ids.shape[1] > max_input_length:
38
- # input_ids = input_ids[:, -max_input_length:]
39
 
40
  max_length = input_ids.shape[1] + max_generation_length
41
 
 
31
 
32
  input_ids = self.tokenizer.encode(inputs, return_tensors="pt")
33
  max_generation_length = 75 # Desired number of tokens to generate
34
+ max_input_length = 4092 - max_generation_length # Maximum input length to allow space for generation
35
 
36
  # # Truncate input_ids to the most recent tokens that fit within the max_input_length
37
+ if input_ids.shape[1] > max_input_length:
38
+ input_ids = input_ids[:, -max_input_length:]
39
 
40
  max_length = input_ids.shape[1] + max_generation_length
41