justin871030 committed on
Commit
d24acc8
•
1 Parent(s): 067ab8f

Add special tokens

Browse files
Files changed (5) hide show
  1. config.json +8 -1
  2. pytorch_model.bin +2 -2
  3. special_tokens_map.json +1 -1
  4. tokenizer_config.json +1 -1
  5. vocab.txt +128 -128
config.json CHANGED
@@ -1,9 +1,12 @@
1
  {
 
2
  "architectures": [
3
  "BertForMultiLabelClassification"
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
 
6
  "finetuning_task": "goemotions",
 
7
  "hidden_act": "gelu",
8
  "hidden_dropout_prob": 0.1,
9
  "hidden_size": 768,
@@ -75,6 +78,10 @@
75
  "num_attention_heads": 12,
76
  "num_hidden_layers": 12,
77
  "pad_token_id": 0,
 
 
 
78
  "type_vocab_size": 2,
79
- "vocab_size": 30524
 
80
  }
 
1
  {
2
+ "_name_or_path": "bert-base-uncased",
3
  "architectures": [
4
  "BertForMultiLabelClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
  "finetuning_task": "goemotions",
9
+ "gradient_checkpointing": false,
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
 
78
  "num_attention_heads": 12,
79
  "num_hidden_layers": 12,
80
  "pad_token_id": 0,
81
+ "position_embedding_type": "absolute",
82
+ "torch_dtype": "float32",
83
+ "transformers_version": "4.13.0",
84
  "type_vocab_size": 2,
85
+ "use_cache": true,
86
+ "vocab_size": 30522
87
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e05799466f321e500385dc4923055ca1b4433673d6f6e7d88eaa960af7feb79
3
- size 438098541
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a94499ef3ef2a096f39ee9b1d39ade8a70317842aba6d2345825d4934efefd05
3
+ size 438096875
special_tokens_map.json CHANGED
@@ -4,5 +4,5 @@
4
  "pad_token": "[PAD]",
5
  "cls_token": "[CLS]",
6
  "mask_token": "[MASK]",
7
- "additional_special_tokens": ["[NAME]", "[RELIGION]"]
8
  }
 
4
  "pad_token": "[PAD]",
5
  "cls_token": "[CLS]",
6
  "mask_token": "[MASK]",
7
+ "additional_special_tokens": ["[NAME]", "[RELIGION]", "😂", "❤", "🤣", "😭", "๐Ÿ‘", "♀", "๐Ÿ˜", "🤔", "🦀", "๐Ÿ‘", "๐Ÿป", "🤷", "๐Ÿผ", "🙄", "😊", "🔥", "😢", "😅", "💜", "👌", "♂", "☺", "😎", "♥", "💯", "💦", "๐Ÿ˜", "😔", "🤢", "💕", "๐Ÿ™", "😉", "🙌", "🤦", "🙃", "😆", "😘", "🎶", "😤", "๐Ÿ˜", "😀", "🤗", "๐Ÿ˜", "๐Ÿฝ", "💪", "😡", "🎉", "👀", "✔", "🔪", "😄", "😬", "💖", "😥", "😒", "✌", "💃", "™", "😩", "☹", "💅", "😪", "👑", "😳", "🤪", "😕", "🎂", "😫", "💙", "🤮", "🚫", "😞", "💎", "😱", "😑", "😖", "๐ŸŠ", "🙈", "🤠", "❣", "🤩", "🙂", "👊", "💛", "💓", "👩", "✨", "😣", "💗", "🤞", "🥀", "🚓", "😰", "👅", "๐Ÿ˜", "๐Ÿป", "🤕", "😜", "🦈", "😃", "😮", "✊", "💚", "🎵", "💨", "โ˜", "🌈", "💄", "👸", "💥", "🖤", "๐Ÿพ", "๐Ÿฉ", "😋", "🤲", "🤤", "🧛", "😇", "❄", "▫", "๐Ÿ’", "😴", ":)", ":(", "XD", "xD", ":D", ":'("]
8
  }
tokenizer_config.json CHANGED
@@ -6,5 +6,5 @@
6
  "pad_token": "[PAD]",
7
  "cls_token": "[CLS]",
8
  "mask_token": "[MASK]",
9
- "additional_special_tokens": ["[NAME]", "[RELIGION]"]
10
  }
 
6
  "pad_token": "[PAD]",
7
  "cls_token": "[CLS]",
8
  "mask_token": "[MASK]",
9
+ "additional_special_tokens": ["[NAME]", "[RELIGION]", "😂", "❤", "🤣", "😭", "๐Ÿ‘", "♀", "๐Ÿ˜", "🤔", "🦀", "๐Ÿ‘", "๐Ÿป", "🤷", "๐Ÿผ", "🙄", "😊", "🔥", "😢", "😅", "💜", "👌", "♂", "☺", "😎", "♥", "💯", "💦", "๐Ÿ˜", "😔", "🤢", "💕", "๐Ÿ™", "😉", "🙌", "🤦", "🙃", "😆", "😘", "🎶", "😤", "๐Ÿ˜", "😀", "🤗", "๐Ÿ˜", "๐Ÿฝ", "💪", "😡", "🎉", "👀", "✔", "🔪", "😄", "😬", "💖", "😥", "😒", "✌", "💃", "™", "😩", "☹", "💅", "😪", "👑", "😳", "🤪", "😕", "🎂", "😫", "💙", "🤮", "🚫", "😞", "💎", "😱", "😑", "😖", "๐ŸŠ", "🙈", "🤠", "❣", "🤩", "🙂", "👊", "💛", "💓", "👩", "✨", "😣", "💗", "🤞", "🥀", "🚓", "😰", "👅", "๐Ÿ˜", "๐Ÿป", "🤕", "😜", "🦈", "😃", "😮", "✊", "💚", "🎵", "💨", "โ˜", "🌈", "💄", "👸", "💥", "🖤", "๐Ÿพ", "๐Ÿฉ", "😋", "🤲", "🤤", "🧛", "😇", "❄", "▫", "๐Ÿ’", "😴", ":)", ":(", "XD", "xD", ":D", ":'("]
10
  }
vocab.txt CHANGED
@@ -104,134 +104,134 @@
104
  [MASK]
105
  [NAME]
106
  [RELIGION]
107
- [unused101]
108
- [unused102]
109
- [unused103]
110
- [unused104]
111
- [unused105]
112
- [unused106]
113
- [unused107]
114
- [unused108]
115
- [unused109]
116
- [unused110]
117
- [unused111]
118
- [unused112]
119
- [unused113]
120
- [unused114]
121
- [unused115]
122
- [unused116]
123
- [unused117]
124
- [unused118]
125
- [unused119]
126
- [unused120]
127
- [unused121]
128
- [unused122]
129
- [unused123]
130
- [unused124]
131
- [unused125]
132
- [unused126]
133
- [unused127]
134
- [unused128]
135
- [unused129]
136
- [unused130]
137
- [unused131]
138
- [unused132]
139
- [unused133]
140
- [unused134]
141
- [unused135]
142
- [unused136]
143
- [unused137]
144
- [unused138]
145
- [unused139]
146
- [unused140]
147
- [unused141]
148
- [unused142]
149
- [unused143]
150
- [unused144]
151
- [unused145]
152
- [unused146]
153
- [unused147]
154
- [unused148]
155
- [unused149]
156
- [unused150]
157
- [unused151]
158
- [unused152]
159
- [unused153]
160
- [unused154]
161
- [unused155]
162
- [unused156]
163
- [unused157]
164
- [unused158]
165
- [unused159]
166
- [unused160]
167
- [unused161]
168
- [unused162]
169
- [unused163]
170
- [unused164]
171
- [unused165]
172
- [unused166]
173
- [unused167]
174
- [unused168]
175
- [unused169]
176
- [unused170]
177
- [unused171]
178
- [unused172]
179
- [unused173]
180
- [unused174]
181
- [unused175]
182
- [unused176]
183
- [unused177]
184
- [unused178]
185
- [unused179]
186
- [unused180]
187
- [unused181]
188
- [unused182]
189
- [unused183]
190
- [unused184]
191
- [unused185]
192
- [unused186]
193
- [unused187]
194
- [unused188]
195
- [unused189]
196
- [unused190]
197
- [unused191]
198
- [unused192]
199
- [unused193]
200
- [unused194]
201
- [unused195]
202
- [unused196]
203
- [unused197]
204
- [unused198]
205
- [unused199]
206
- [unused200]
207
- [unused201]
208
- [unused202]
209
- [unused203]
210
- [unused204]
211
- [unused205]
212
- [unused206]
213
- [unused207]
214
- [unused208]
215
- [unused209]
216
- [unused210]
217
- [unused211]
218
- [unused212]
219
- [unused213]
220
- [unused214]
221
- [unused215]
222
- [unused216]
223
- [unused217]
224
- [unused218]
225
- [unused219]
226
- [unused220]
227
- [unused221]
228
- [unused222]
229
- [unused223]
230
- [unused224]
231
- [unused225]
232
- [unused226]
233
- [unused227]
234
- [unused228]
235
  [unused229]
236
  [unused230]
237
  [unused231]
 
104
  [MASK]
105
  [NAME]
106
  [RELIGION]
107
+ 😂
108
+ ❤
109
+ 🤣
110
+ 😭
111
+ ๐Ÿ‘
112
+ ♀
113
+ ๐Ÿ˜
114
+ 🤔
115
+ 🦀
116
+ ๐Ÿ‘
117
+ ๐Ÿป
118
+ 🤷
119
+ ๐Ÿผ
120
+ 🙄
121
+ 😊
122
+ 🔥
123
+ 😢
124
+ 😅
125
+ 💜
126
+ 👌
127
+ ♂
128
+ ☺
129
+ 😎
130
+ ♥
131
+ 💯
132
+ 💦
133
+ ๐Ÿ˜
134
+ 😔
135
+ 🤢
136
+ 💕
137
+ ๐Ÿ™
138
+ 😉
139
+ 🙌
140
+ 🤦
141
+ 🙃
142
+ 😆
143
+ 😘
144
+ 🎶
145
+ 😤
146
+ ๐Ÿ˜
147
+ 😀
148
+ 🤗
149
+ ๐Ÿ˜
150
+ ๐Ÿฝ
151
+ 💪
152
+ 😡
153
+ 🎉
154
+ 👀
155
+ ✔
156
+ 🔪
157
+ 😄
158
+ 😬
159
+ 💖
160
+ 😥
161
+ 😒
162
+ ✌
163
+ 💃
164
+ ™
165
+ 😩
166
+ ☹
167
+ 💅
168
+ 😪
169
+ 👑
170
+ 😳
171
+ 🤪
172
+ 😕
173
+ 🎂
174
+ 😫
175
+ 💙
176
+ 🤮
177
+ 🚫
178
+ 😞
179
+ 💎
180
+ 😱
181
+ 😑
182
+ 😖
183
+ ๐ŸŠ
184
+ 🙈
185
+ 🤠
186
+ ❣
187
+ 🤩
188
+ 🙂
189
+ 👊
190
+ 💛
191
+ 💓
192
+ 👩
193
+ ✨
194
+ 😣
195
+ 💗
196
+ 🤞
197
+ 🥀
198
+ 🚓
199
+ 😰
200
+ 👅
201
+ ๐Ÿ˜
202
+ ๐Ÿป
203
+ 🤕
204
+ 😜
205
+ 🦈
206
+ 😃
207
+ 😮
208
+ ✊
209
+ 💚
210
+ 🎵
211
+ 💨
212
+ โ˜
213
+ 🌈
214
+ 💄
215
+ 👸
216
+ 💥
217
+ 🖤
218
+ ๐Ÿพ
219
+ ๐Ÿฉ
220
+ 😋
221
+ 🤲
222
+ 🤤
223
+ 🧛
224
+ 😇
225
+ ❄
226
+ ▫
227
+ ๐Ÿ’
228
+ 😴
229
+ :)
230
+ :(
231
+ XD
232
+ xD
233
+ :D
234
+ :'(
235
  [unused229]
236
  [unused230]
237
  [unused231]