nroggendorff committed on
Commit
db0f387
1 Parent(s): c2f601d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -30,7 +30,7 @@ def create_tokenizer(training_corpus):
30
  special_tokens=["<s>", "<pad>", "</s>", "<unk>", "<mask>", "<|user|>", "<|bot|>", "<|end|>"]
31
  )
32
 
33
- fast_tokenizer = PreTrainedTokenizerFast(tokenizer_object=tokenizer)
34
  return fast_tokenizer
35
 
36
  def get_training_corpus(dataset):
 
30
  special_tokens=["<s>", "<pad>", "</s>", "<unk>", "<mask>", "<|user|>", "<|bot|>", "<|end|>"]
31
  )
32
 
33
+ fast_tokenizer = PreTrainedTokenizerFast(tokenizer_object=tokenizer._tokenizer)
34
  return fast_tokenizer
35
 
36
  def get_training_corpus(dataset):