dougtrajano commited on
Commit
191b08d
1 Parent(s): 32620e1

Model save

Browse files
last-checkpoint/config.json DELETED
@@ -1,40 +0,0 @@
1
- {
2
- "_name_or_path": "neuralmind/bert-large-portuguese-cased",
3
- "architectures": [
4
- "ToxicityTypeForSequenceClassification"
5
- ],
6
- "attention_probs_dropout_prob": 0.1,
7
- "classifier_dropout": null,
8
- "directionality": "bidi",
9
- "hidden_act": "gelu",
10
- "hidden_dropout_prob": 0.1,
11
- "hidden_size": 1024,
12
- "id2label": {
13
- "0": "NOT-OFFENSIVE",
14
- "1": "OFFENSIVE"
15
- },
16
- "initializer_range": 0.02,
17
- "intermediate_size": 4096,
18
- "label2id": {
19
- "NOT-OFFENSIVE": 0,
20
- "OFFENSIVE": 1
21
- },
22
- "layer_norm_eps": 1e-12,
23
- "max_position_embeddings": 512,
24
- "model_type": "bert",
25
- "num_attention_heads": 16,
26
- "num_hidden_layers": 24,
27
- "output_past": true,
28
- "pad_token_id": 0,
29
- "pooler_fc_size": 768,
30
- "pooler_num_attention_heads": 12,
31
- "pooler_num_fc_layers": 3,
32
- "pooler_size_per_head": 128,
33
- "pooler_type": "first_token_transform",
34
- "position_embedding_type": "absolute",
35
- "torch_dtype": "float32",
36
- "transformers_version": "4.26.1",
37
- "type_vocab_size": 2,
38
- "use_cache": true,
39
- "vocab_size": 29794
40
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
last-checkpoint/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad6f0a7fef74b0a849fe0f1f072b9ad2a340d72ccc71361c7738247ba88ab8eb
3
- size 2675416477
 
 
 
 
last-checkpoint/pytorch_model.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:d28275481f29f85dc64692bd1241eeb86b797b543f56ae08bda2af3b80cb1d6f
3
- size 1337729837
 
 
 
 
last-checkpoint/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a48962e5ff4307118621d2d79e5364056e38baa3c35fdf947a099f7f109336e
3
- size 14503
 
 
 
 
last-checkpoint/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2a6b4ae21d721bb29b01e6298b11f998e2f825381fa156b83df6311626b5a39
3
- size 623
 
 
 
 
last-checkpoint/special_tokens_map.json DELETED
@@ -1,7 +0,0 @@
1
- {
2
- "cls_token": "[CLS]",
3
- "mask_token": "[MASK]",
4
- "pad_token": "[PAD]",
5
- "sep_token": "[SEP]",
6
- "unk_token": "[UNK]"
7
- }
 
 
 
 
 
 
 
 
last-checkpoint/tokenizer.json DELETED
The diff for this file is too large to render. See raw diff
 
last-checkpoint/tokenizer_config.json DELETED
@@ -1,16 +0,0 @@
1
- {
2
- "cls_token": "[CLS]",
3
- "do_basic_tokenize": true,
4
- "do_lower_case": false,
5
- "mask_token": "[MASK]",
6
- "model_max_length": 1000000000000000019884624838656,
7
- "name_or_path": "neuralmind/bert-large-portuguese-cased",
8
- "never_split": null,
9
- "pad_token": "[PAD]",
10
- "sep_token": "[SEP]",
11
- "special_tokens_map_file": "/root/.cache/huggingface/hub/models--neuralmind--bert-large-portuguese-cased/snapshots/aa302f6ea73b759f7df9cad58bd272127b67ec28/special_tokens_map.json",
12
- "strip_accents": null,
13
- "tokenize_chinese_chars": true,
14
- "tokenizer_class": "BertTokenizer",
15
- "unk_token": "[UNK]"
16
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
last-checkpoint/trainer_state.json DELETED
@@ -1,184 +0,0 @@
1
- {
2
- "best_metric": 0.8549217425622928,
3
- "best_model_checkpoint": "/opt/ml/checkpoints/toxic-comment-classification-2023-02-26-22-07-06-968/model/checkpoint-1408",
4
- "epoch": 6.0,
5
- "global_step": 8448,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 0.36,
12
- "learning_rate": 3.217249581414747e-05,
13
- "loss": 0.4937,
14
- "step": 500
15
- },
16
- {
17
- "epoch": 0.71,
18
- "learning_rate": 3.1787104153700095e-05,
19
- "loss": 0.4465,
20
- "step": 1000
21
- },
22
- {
23
- "epoch": 1.0,
24
- "eval_accuracy": 0.8546529723000311,
25
- "eval_f1": 0.8549217425622928,
26
- "eval_loss": 0.41022783517837524,
27
- "eval_precision": 0.8668618958335471,
28
- "eval_recall": 0.8546529723000311,
29
- "eval_runtime": 11.9429,
30
- "eval_samples_per_second": 269.03,
31
- "eval_steps_per_second": 33.66,
32
- "step": 1408
33
- },
34
- {
35
- "epoch": 1.07,
36
- "learning_rate": 3.140171249325271e-05,
37
- "loss": 0.4308,
38
- "step": 1500
39
- },
40
- {
41
- "epoch": 1.42,
42
- "learning_rate": 3.1016320832805326e-05,
43
- "loss": 0.3826,
44
- "step": 2000
45
- },
46
- {
47
- "epoch": 1.78,
48
- "learning_rate": 3.063092917235795e-05,
49
- "loss": 0.3839,
50
- "step": 2500
51
- },
52
- {
53
- "epoch": 2.0,
54
- "eval_accuracy": 0.8509181450357921,
55
- "eval_f1": 0.8496719953011838,
56
- "eval_loss": 0.48135700821876526,
57
- "eval_precision": 0.8531835536435355,
58
- "eval_recall": 0.8509181450357921,
59
- "eval_runtime": 11.8064,
60
- "eval_samples_per_second": 272.14,
61
- "eval_steps_per_second": 34.049,
62
- "step": 2816
63
- },
64
- {
65
- "epoch": 2.13,
66
- "learning_rate": 3.0245537511910564e-05,
67
- "loss": 0.4001,
68
- "step": 3000
69
- },
70
- {
71
- "epoch": 2.49,
72
- "learning_rate": 2.986014585146318e-05,
73
- "loss": 0.3603,
74
- "step": 3500
75
- },
76
- {
77
- "epoch": 2.84,
78
- "learning_rate": 2.9474754191015798e-05,
79
- "loss": 0.3945,
80
- "step": 4000
81
- },
82
- {
83
- "epoch": 3.0,
84
- "eval_accuracy": 0.800186741363212,
85
- "eval_f1": 0.7918442179147859,
86
- "eval_loss": 0.6362168192863464,
87
- "eval_precision": 0.8257966335436034,
88
- "eval_recall": 0.800186741363212,
89
- "eval_runtime": 11.7288,
90
- "eval_samples_per_second": 273.94,
91
- "eval_steps_per_second": 34.274,
92
- "step": 4224
93
- },
94
- {
95
- "epoch": 3.2,
96
- "learning_rate": 2.9089362530568417e-05,
97
- "loss": 0.3607,
98
- "step": 4500
99
- },
100
- {
101
- "epoch": 3.55,
102
- "learning_rate": 2.8703970870121032e-05,
103
- "loss": 0.345,
104
- "step": 5000
105
- },
106
- {
107
- "epoch": 3.91,
108
- "learning_rate": 2.831857920967365e-05,
109
- "loss": 0.3643,
110
- "step": 5500
111
- },
112
- {
113
- "epoch": 4.0,
114
- "eval_accuracy": 0.8247743541861189,
115
- "eval_f1": 0.8210678650289922,
116
- "eval_loss": 0.49613112211227417,
117
- "eval_precision": 0.8348592222910702,
118
- "eval_recall": 0.8247743541861189,
119
- "eval_runtime": 11.9823,
120
- "eval_samples_per_second": 268.146,
121
- "eval_steps_per_second": 33.55,
122
- "step": 5632
123
- },
124
- {
125
- "epoch": 4.26,
126
- "learning_rate": 2.793318754922627e-05,
127
- "loss": 0.3293,
128
- "step": 6000
129
- },
130
- {
131
- "epoch": 4.62,
132
- "learning_rate": 2.7547795888778885e-05,
133
- "loss": 0.3316,
134
- "step": 6500
135
- },
136
- {
137
- "epoch": 4.97,
138
- "learning_rate": 2.7162404228331504e-05,
139
- "loss": 0.3345,
140
- "step": 7000
141
- },
142
- {
143
- "epoch": 5.0,
144
- "eval_accuracy": 0.8527855586679116,
145
- "eval_f1": 0.8531826157402111,
146
- "eval_loss": 0.5266692042350769,
147
- "eval_precision": 0.8569563015662375,
148
- "eval_recall": 0.8527855586679116,
149
- "eval_runtime": 11.9018,
150
- "eval_samples_per_second": 269.96,
151
- "eval_steps_per_second": 33.777,
152
- "step": 7040
153
- },
154
- {
155
- "epoch": 5.33,
156
- "learning_rate": 2.6777012567884123e-05,
157
- "loss": 0.2956,
158
- "step": 7500
159
- },
160
- {
161
- "epoch": 5.68,
162
- "learning_rate": 2.6391620907436738e-05,
163
- "loss": 0.3053,
164
- "step": 8000
165
- },
166
- {
167
- "epoch": 6.0,
168
- "eval_accuracy": 0.800186741363212,
169
- "eval_f1": 0.791141616583017,
170
- "eval_loss": 0.590166449546814,
171
- "eval_precision": 0.8292050463846472,
172
- "eval_recall": 0.800186741363212,
173
- "eval_runtime": 11.946,
174
- "eval_samples_per_second": 268.961,
175
- "eval_steps_per_second": 33.652,
176
- "step": 8448
177
- }
178
- ],
179
- "max_steps": 42240,
180
- "num_train_epochs": 30,
181
- "total_flos": 9285913358832600.0,
182
- "trial_name": null,
183
- "trial_params": null
184
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
last-checkpoint/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb3b71907c1e39b22ef1ab915290602a79a529af398581187aa888ba7af47b38
3
- size 3695
 
 
 
 
last-checkpoint/vocab.txt DELETED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d28275481f29f85dc64692bd1241eeb86b797b543f56ae08bda2af3b80cb1d6f
3
  size 1337729837
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45592d7a0658665761f426eada85c30d56ec10d413005c3cec81e85c00eb944b
3
  size 1337729837