Rachel Bawden committed on
Commit
529dce5
1 Parent(s): aed875c

init with converted model

Browse files
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a33a3249593fc78212a66a158f76963748213e50d2a1fc05b85596b2cc7112d2
3
- size 209275077
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bfbd15078882bae5054cd2bdbd8528b451800b319ab7e3a1209e5c0a74bb2a4
3
+ size 192952903
special_tokens_map.json CHANGED
@@ -1 +1 @@
1
- {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>", "additional_special_tokens": ["<t>"]}
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>"}
tokenizer.json CHANGED
@@ -8002,10 +8002,10 @@
8002
  "▁unilat": 7961,
8003
  "madeupword0000": 7962,
8004
  "madeupword0001": 7963,
8005
- "madeupword0002": 7964,
8006
- "madeupword0003": 7965,
8007
- "madeupword0004": 7966,
8008
- "madeupword0005": 7967
8009
  },
8010
  "merges": [
8011
  "▁ d",
@@ -21595,7 +21595,10 @@
21595
  "▁qualifié e",
21596
  "▁elector ale",
21597
  "▁inferi eure",
21598
- "▁inferieur e"
 
 
 
21599
  ]
21600
  }
21601
  }
 
8002
  "▁unilat": 7961,
8003
  "madeupword0000": 7962,
8004
  "madeupword0001": 7963,
8005
+ "<": 7964,
8006
+ "<t": 7965,
8007
+ "▁<t": 7966,
8008
+ "▁<t>": 7967
8009
  },
8010
  "merges": [
8011
  "▁ d",
 
21595
  "▁qualifié e",
21596
  "▁elector ale",
21597
  "▁inferi eure",
21598
+ "▁inferieur e",
21599
+ "< t",
21600
+ "▁ <t",
21601
+ "▁<t >"
21602
  ]
21603
  }
21604
  }
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"unk_token": "<unk>", "eos_token": "</s>", "bos_token": "<s>", "pad_token": "<pad>", "tokenizer_class": "PreTrainedTokenizerFast", "additional_special_tokens": ["<t>"]}
 
1
+ {"unk_token": "<unk>", "eos_token": "</s>", "bos_token": "<s>", "pad_token": "<pad>", "tokenizer_class": "PreTrainedTokenizerFast"}
vocab-src.json CHANGED
@@ -7967,4 +7967,4 @@
7967
  "madeupword0003": 7965,
7968
  "madeupword0004": 7966,
7969
  "madeupword0005": 7967
7970
- }
 
7967
  "madeupword0003": 7965,
7968
  "madeupword0004": 7966,
7969
  "madeupword0005": 7967
7970
+ }
vocab-tgt.json CHANGED
@@ -7967,4 +7967,4 @@
7967
  "madeupword0003": 7965,
7968
  "madeupword0004": 7966,
7969
  "madeupword0005": 7967
7970
- }
 
7967
  "madeupword0003": 7965,
7968
  "madeupword0004": 7966,
7969
  "madeupword0005": 7967
7970
+ }