japanese-denim committed on
Commit
8010565
1 Parent(s): aa105dc

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -52,7 +52,7 @@
52
  "static_position_embeddings": false,
53
  "tokenizer_class": "MBart50Tokenizer",
54
  "torch_dtype": "float32",
55
- "transformers_version": "4.35.2",
56
  "use_cache": true,
57
  "vocab_size": 250054
58
  }
 
52
  "static_position_embeddings": false,
53
  "tokenizer_class": "MBart50Tokenizer",
54
  "torch_dtype": "float32",
55
+ "transformers_version": "4.33.0",
56
  "use_cache": true,
57
  "vocab_size": 250054
58
  }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb74efed949910605aa06a27f0eb8a8afe0dab6f2578429f0cb39eecd8eab3b5
3
+ size 2444694045
special_tokens_map.json CHANGED
@@ -56,13 +56,7 @@
56
  "bos_token": "<s>",
57
  "cls_token": "<s>",
58
  "eos_token": "</s>",
59
- "mask_token": {
60
- "content": "<mask>",
61
- "lstrip": true,
62
- "normalized": true,
63
- "rstrip": false,
64
- "single_word": false
65
- },
66
  "pad_token": "<pad>",
67
  "sep_token": "</s>",
68
  "unk_token": "<unk>"
 
56
  "bos_token": "<s>",
57
  "cls_token": "<s>",
58
  "eos_token": "</s>",
59
+ "mask_token": "<mask>",
 
 
 
 
 
 
60
  "pad_token": "<pad>",
61
  "sep_token": "</s>",
62
  "unk_token": "<unk>"
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd373880288e6c7079a0c0573a5163926bb9862dbee34a4b8dea126302ead686
3
- size 17109940
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1dc610c1b938b4bf3dbff98a25da0e07bed958cae55dac0df25ed0a40d10a23b
3
+ size 17109850
tokenizer_config.json CHANGED
@@ -1,462 +1,4 @@
1
  {
2
- "added_tokens_decoder": {
3
- "0": {
4
- "content": "<s>",
5
- "lstrip": false,
6
- "normalized": false,
7
- "rstrip": false,
8
- "single_word": false,
9
- "special": true
10
- },
11
- "1": {
12
- "content": "<pad>",
13
- "lstrip": false,
14
- "normalized": false,
15
- "rstrip": false,
16
- "single_word": false,
17
- "special": true
18
- },
19
- "2": {
20
- "content": "</s>",
21
- "lstrip": false,
22
- "normalized": false,
23
- "rstrip": false,
24
- "single_word": false,
25
- "special": true
26
- },
27
- "3": {
28
- "content": "<unk>",
29
- "lstrip": false,
30
- "normalized": false,
31
- "rstrip": false,
32
- "single_word": false,
33
- "special": true
34
- },
35
- "250001": {
36
- "content": "ar_AR",
37
- "lstrip": false,
38
- "normalized": false,
39
- "rstrip": false,
40
- "single_word": false,
41
- "special": true
42
- },
43
- "250002": {
44
- "content": "cs_CZ",
45
- "lstrip": false,
46
- "normalized": false,
47
- "rstrip": false,
48
- "single_word": false,
49
- "special": true
50
- },
51
- "250003": {
52
- "content": "de_DE",
53
- "lstrip": false,
54
- "normalized": false,
55
- "rstrip": false,
56
- "single_word": false,
57
- "special": true
58
- },
59
- "250004": {
60
- "content": "en_XX",
61
- "lstrip": false,
62
- "normalized": false,
63
- "rstrip": false,
64
- "single_word": false,
65
- "special": true
66
- },
67
- "250005": {
68
- "content": "es_XX",
69
- "lstrip": false,
70
- "normalized": false,
71
- "rstrip": false,
72
- "single_word": false,
73
- "special": true
74
- },
75
- "250006": {
76
- "content": "et_EE",
77
- "lstrip": false,
78
- "normalized": false,
79
- "rstrip": false,
80
- "single_word": false,
81
- "special": true
82
- },
83
- "250007": {
84
- "content": "fi_FI",
85
- "lstrip": false,
86
- "normalized": false,
87
- "rstrip": false,
88
- "single_word": false,
89
- "special": true
90
- },
91
- "250008": {
92
- "content": "fr_XX",
93
- "lstrip": false,
94
- "normalized": false,
95
- "rstrip": false,
96
- "single_word": false,
97
- "special": true
98
- },
99
- "250009": {
100
- "content": "gu_IN",
101
- "lstrip": false,
102
- "normalized": false,
103
- "rstrip": false,
104
- "single_word": false,
105
- "special": true
106
- },
107
- "250010": {
108
- "content": "hi_IN",
109
- "lstrip": false,
110
- "normalized": false,
111
- "rstrip": false,
112
- "single_word": false,
113
- "special": true
114
- },
115
- "250011": {
116
- "content": "it_IT",
117
- "lstrip": false,
118
- "normalized": false,
119
- "rstrip": false,
120
- "single_word": false,
121
- "special": true
122
- },
123
- "250012": {
124
- "content": "ja_XX",
125
- "lstrip": false,
126
- "normalized": false,
127
- "rstrip": false,
128
- "single_word": false,
129
- "special": true
130
- },
131
- "250013": {
132
- "content": "kk_KZ",
133
- "lstrip": false,
134
- "normalized": false,
135
- "rstrip": false,
136
- "single_word": false,
137
- "special": true
138
- },
139
- "250014": {
140
- "content": "ko_KR",
141
- "lstrip": false,
142
- "normalized": false,
143
- "rstrip": false,
144
- "single_word": false,
145
- "special": true
146
- },
147
- "250015": {
148
- "content": "lt_LT",
149
- "lstrip": false,
150
- "normalized": false,
151
- "rstrip": false,
152
- "single_word": false,
153
- "special": true
154
- },
155
- "250016": {
156
- "content": "lv_LV",
157
- "lstrip": false,
158
- "normalized": false,
159
- "rstrip": false,
160
- "single_word": false,
161
- "special": true
162
- },
163
- "250017": {
164
- "content": "my_MM",
165
- "lstrip": false,
166
- "normalized": false,
167
- "rstrip": false,
168
- "single_word": false,
169
- "special": true
170
- },
171
- "250018": {
172
- "content": "ne_NP",
173
- "lstrip": false,
174
- "normalized": false,
175
- "rstrip": false,
176
- "single_word": false,
177
- "special": true
178
- },
179
- "250019": {
180
- "content": "nl_XX",
181
- "lstrip": false,
182
- "normalized": false,
183
- "rstrip": false,
184
- "single_word": false,
185
- "special": true
186
- },
187
- "250020": {
188
- "content": "ro_RO",
189
- "lstrip": false,
190
- "normalized": false,
191
- "rstrip": false,
192
- "single_word": false,
193
- "special": true
194
- },
195
- "250021": {
196
- "content": "ru_RU",
197
- "lstrip": false,
198
- "normalized": false,
199
- "rstrip": false,
200
- "single_word": false,
201
- "special": true
202
- },
203
- "250022": {
204
- "content": "si_LK",
205
- "lstrip": false,
206
- "normalized": false,
207
- "rstrip": false,
208
- "single_word": false,
209
- "special": true
210
- },
211
- "250023": {
212
- "content": "tr_TR",
213
- "lstrip": false,
214
- "normalized": false,
215
- "rstrip": false,
216
- "single_word": false,
217
- "special": true
218
- },
219
- "250024": {
220
- "content": "vi_VN",
221
- "lstrip": false,
222
- "normalized": false,
223
- "rstrip": false,
224
- "single_word": false,
225
- "special": true
226
- },
227
- "250025": {
228
- "content": "zh_CN",
229
- "lstrip": false,
230
- "normalized": false,
231
- "rstrip": false,
232
- "single_word": false,
233
- "special": true
234
- },
235
- "250026": {
236
- "content": "af_ZA",
237
- "lstrip": false,
238
- "normalized": false,
239
- "rstrip": false,
240
- "single_word": false,
241
- "special": true
242
- },
243
- "250027": {
244
- "content": "az_AZ",
245
- "lstrip": false,
246
- "normalized": false,
247
- "rstrip": false,
248
- "single_word": false,
249
- "special": true
250
- },
251
- "250028": {
252
- "content": "bn_IN",
253
- "lstrip": false,
254
- "normalized": false,
255
- "rstrip": false,
256
- "single_word": false,
257
- "special": true
258
- },
259
- "250029": {
260
- "content": "fa_IR",
261
- "lstrip": false,
262
- "normalized": false,
263
- "rstrip": false,
264
- "single_word": false,
265
- "special": true
266
- },
267
- "250030": {
268
- "content": "he_IL",
269
- "lstrip": false,
270
- "normalized": false,
271
- "rstrip": false,
272
- "single_word": false,
273
- "special": true
274
- },
275
- "250031": {
276
- "content": "hr_HR",
277
- "lstrip": false,
278
- "normalized": false,
279
- "rstrip": false,
280
- "single_word": false,
281
- "special": true
282
- },
283
- "250032": {
284
- "content": "id_ID",
285
- "lstrip": false,
286
- "normalized": false,
287
- "rstrip": false,
288
- "single_word": false,
289
- "special": true
290
- },
291
- "250033": {
292
- "content": "ka_GE",
293
- "lstrip": false,
294
- "normalized": false,
295
- "rstrip": false,
296
- "single_word": false,
297
- "special": true
298
- },
299
- "250034": {
300
- "content": "km_KH",
301
- "lstrip": false,
302
- "normalized": false,
303
- "rstrip": false,
304
- "single_word": false,
305
- "special": true
306
- },
307
- "250035": {
308
- "content": "mk_MK",
309
- "lstrip": false,
310
- "normalized": false,
311
- "rstrip": false,
312
- "single_word": false,
313
- "special": true
314
- },
315
- "250036": {
316
- "content": "ml_IN",
317
- "lstrip": false,
318
- "normalized": false,
319
- "rstrip": false,
320
- "single_word": false,
321
- "special": true
322
- },
323
- "250037": {
324
- "content": "mn_MN",
325
- "lstrip": false,
326
- "normalized": false,
327
- "rstrip": false,
328
- "single_word": false,
329
- "special": true
330
- },
331
- "250038": {
332
- "content": "mr_IN",
333
- "lstrip": false,
334
- "normalized": false,
335
- "rstrip": false,
336
- "single_word": false,
337
- "special": true
338
- },
339
- "250039": {
340
- "content": "pl_PL",
341
- "lstrip": false,
342
- "normalized": false,
343
- "rstrip": false,
344
- "single_word": false,
345
- "special": true
346
- },
347
- "250040": {
348
- "content": "ps_AF",
349
- "lstrip": false,
350
- "normalized": false,
351
- "rstrip": false,
352
- "single_word": false,
353
- "special": true
354
- },
355
- "250041": {
356
- "content": "pt_XX",
357
- "lstrip": false,
358
- "normalized": false,
359
- "rstrip": false,
360
- "single_word": false,
361
- "special": true
362
- },
363
- "250042": {
364
- "content": "sv_SE",
365
- "lstrip": false,
366
- "normalized": false,
367
- "rstrip": false,
368
- "single_word": false,
369
- "special": true
370
- },
371
- "250043": {
372
- "content": "sw_KE",
373
- "lstrip": false,
374
- "normalized": false,
375
- "rstrip": false,
376
- "single_word": false,
377
- "special": true
378
- },
379
- "250044": {
380
- "content": "ta_IN",
381
- "lstrip": false,
382
- "normalized": false,
383
- "rstrip": false,
384
- "single_word": false,
385
- "special": true
386
- },
387
- "250045": {
388
- "content": "te_IN",
389
- "lstrip": false,
390
- "normalized": false,
391
- "rstrip": false,
392
- "single_word": false,
393
- "special": true
394
- },
395
- "250046": {
396
- "content": "th_TH",
397
- "lstrip": false,
398
- "normalized": false,
399
- "rstrip": false,
400
- "single_word": false,
401
- "special": true
402
- },
403
- "250047": {
404
- "content": "tl_XX",
405
- "lstrip": false,
406
- "normalized": false,
407
- "rstrip": false,
408
- "single_word": false,
409
- "special": true
410
- },
411
- "250048": {
412
- "content": "uk_UA",
413
- "lstrip": false,
414
- "normalized": false,
415
- "rstrip": false,
416
- "single_word": false,
417
- "special": true
418
- },
419
- "250049": {
420
- "content": "ur_PK",
421
- "lstrip": false,
422
- "normalized": false,
423
- "rstrip": false,
424
- "single_word": false,
425
- "special": true
426
- },
427
- "250050": {
428
- "content": "xh_ZA",
429
- "lstrip": false,
430
- "normalized": false,
431
- "rstrip": false,
432
- "single_word": false,
433
- "special": true
434
- },
435
- "250051": {
436
- "content": "gl_ES",
437
- "lstrip": false,
438
- "normalized": false,
439
- "rstrip": false,
440
- "single_word": false,
441
- "special": true
442
- },
443
- "250052": {
444
- "content": "sl_SI",
445
- "lstrip": false,
446
- "normalized": false,
447
- "rstrip": false,
448
- "single_word": false,
449
- "special": true
450
- },
451
- "250053": {
452
- "content": "<mask>",
453
- "lstrip": true,
454
- "normalized": true,
455
- "rstrip": false,
456
- "single_word": false,
457
- "special": true
458
- }
459
- },
460
  "additional_special_tokens": [
461
  "ar_AR",
462
  "cs_CZ",
@@ -515,7 +57,14 @@
515
  "clean_up_tokenization_spaces": true,
516
  "cls_token": "<s>",
517
  "eos_token": "</s>",
518
- "mask_token": "<mask>",
 
 
 
 
 
 
 
519
  "model_max_length": 1024,
520
  "pad_token": "<pad>",
521
  "sep_token": "</s>",
 
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "additional_special_tokens": [
3
  "ar_AR",
4
  "cs_CZ",
 
57
  "clean_up_tokenization_spaces": true,
58
  "cls_token": "<s>",
59
  "eos_token": "</s>",
60
+ "mask_token": {
61
+ "__type": "AddedToken",
62
+ "content": "<mask>",
63
+ "lstrip": true,
64
+ "normalized": true,
65
+ "rstrip": false,
66
+ "single_word": false
67
+ },
68
  "model_max_length": 1024,
69
  "pad_token": "<pad>",
70
  "sep_token": "</s>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:785d24a1e7b4b3c075784874ffb0075fd23ee135a6848a44218e073795f14812
3
- size 4792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35c06192fc7f834f74a974454a81199fcd4073ca48be04cfc7785632f36d7f03
3
+ size 4219