Update tiktoken.py (#4)
- Update tiktoken.py (345342df4cc7b09196ac8c6d8de5615037638ceb)
- tiktoken.py +2 -2
tiktoken.py CHANGED
@@ -247,7 +247,7 @@ class TiktokenTokenizerWrapper(PreTrainedTokenizer):
         # Get an index to add and add the item
         vocab_clone[candidate_extra_id] = index_to_add

-        return vocab_clone
+        return dict(vocab_clone, **self.added_tokens_encoder)

     def _tokenize(self, text: str) -> List[str]:
         """Returns a tokenized string."""
@@ -371,4 +371,4 @@ class TiktokenTokenizerWrapper(PreTrainedTokenizer):
             if len(encoded) > 1:
                 actual_new_tokens.append(token)

-        return self.add_tokens(actual_new_tokens, special_tokens=True)
+        return self.add_tokens(actual_new_tokens, special_tokens=True)
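The functional change is in the first hunk: the mapping returned by the wrapper now also merges in self.added_tokens_encoder, so tokens registered at runtime via add_tokens() become visible to get_vocab() and anything built on top of it. The second hunk removes and re-adds an identical line, which usually indicates a whitespace or trailing-newline fix rather than a behavior change. Below is a minimal, hedged sketch of the effect; only vocab_clone and added_tokens_encoder come from the diff, while the standalone function name and sample values are illustrative, not the wrapper's actual implementation.

from typing import Dict


def get_vocab(base_vocab: Dict[str, int], added_tokens_encoder: Dict[str, int]) -> Dict[str, int]:
    """Return the full token -> id mapping, including runtime-added tokens."""
    vocab_clone = dict(base_vocab)  # copy so callers cannot mutate internal state
    # Before the patch only vocab_clone was returned, so tokens added via
    # add_tokens() were missing from the reported vocabulary.
    return dict(vocab_clone, **added_tokens_encoder)


if __name__ == "__main__":
    base = {"hello": 0, "world": 1}
    added = {"<|my_special|>": 100257}  # e.g. a token registered with add_tokens()
    vocab = get_vocab(base, added)
    assert vocab["<|my_special|>"] == 100257
    print(len(vocab))  # 3: the added token now appears in the merged vocabulary

Without this merge, code that sizes embedding matrices or builds reverse lookups from get_vocab() would not account for tokens added after construction, which is presumably what the patch addresses.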