acelen committed on
Commit
1c758e0
1 Parent(s): 0371204

SecureBERT-V2

Browse files
.DS_Store ADDED
Binary file (6.15 kB). View file
 
config.json CHANGED
@@ -1 +1,112 @@
1
- {"_name_or_path": "ehsanaghaei/SecureBERT", "architectures": ["RobertaForTokenClassification"], "attention_probs_dropout_prob": 0.1, "bos_token_id": 0, "classifier_dropout": null, "eos_token_id": 2, "gradient_checkpointing": false, "hidden_act": "gelu", "hidden_dropout_prob": 0.1, "hidden_size": 768, "id2label": {"0": "O", "1": "B-TIME", "2": "I-TIME", "3": "B-LOC", "4": "B-SECTEAM", "5": "I-SECTEAM", "6": "B-TOOL", "7": "B-IDTY", "8": "I-IDTY", "9": "B-MAL", "10": "B-APT", "11": "I-APT", "12": "I-TOOL", "13": "B-VULNAME", "14": "B-VULID", "15": "I-LOC", "16": "B-ENCR", "17": "B-FILE", "18": "B-SHA2", "19": "B-URL", "20": "B-IP", "21": "PROT", "22": "B-ACT", "23": "I-ACT", "24": "B-MD5", "25": "I-FILE", "26": "B-DOM", "27": "I-MAL", "28": "B-OS", "29": "B-SHA1", "30": "I-URL", "31": "I-IP", "32": "I-SHA2", "33": "I-OS", "34": "B-PROT", "35": "I-VULNAME", "36": "I-PROT", "37": "B-EMAIL", "38": "I-EMAIL", "39": "I-ENCR"}, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": {"LABEL_0": 0, "LABEL_1": 1, "LABEL_10": 10, "LABEL_11": 11, "LABEL_12": 12, "LABEL_13": 13, "LABEL_14": 14, "LABEL_15": 15, "LABEL_16": 16, "LABEL_17": 17, "LABEL_18": 18, "LABEL_19": 19, "LABEL_2": 2, "LABEL_20": 20, "LABEL_21": 21, "LABEL_22": 22, "LABEL_23": 23, "LABEL_24": 24, "LABEL_25": 25, "LABEL_26": 26, "LABEL_27": 27, "LABEL_28": 28, "LABEL_29": 29, "LABEL_3": 3, "LABEL_30": 30, "LABEL_31": 31, "LABEL_32": 32, "LABEL_33": 33, "LABEL_34": 34, "LABEL_35": 35, "LABEL_36": 36, "LABEL_37": 37, "LABEL_38": 38, "LABEL_39": 39, "LABEL_4": 4, "LABEL_5": 5, "LABEL_6": 6, "LABEL_7": 7, "LABEL_8": 8, "LABEL_9": 9}, "layer_norm_eps": 1e-05, "max_position_embeddings": 514, "model_type": "roberta", "num_attention_heads": 12, "num_hidden_layers": 12, "pad_token_id": 1, "position_embedding_type": "absolute", "torch_dtype": "float32", "transformers_version": "4.30.2", "type_vocab_size": 1, "use_cache": true, "vocab_size": 50265}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "ehsanaghaei/SecureBERT",
3
+ "architectures": [
4
+ "RobertaForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 2,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "O",
16
+ "1": "B-TIME",
17
+ "2": "I-TIME",
18
+ "3": "B-LOC",
19
+ "4": "B-SECTEAM",
20
+ "5": "I-SECTEAM",
21
+ "6": "B-TOOL",
22
+ "7": "B-IDTY",
23
+ "8": "I-IDTY",
24
+ "9": "B-MAL",
25
+ "10": "B-APT",
26
+ "11": "I-APT",
27
+ "12": "I-TOOL",
28
+ "13": "B-VULNAME",
29
+ "14": "B-VULID",
30
+ "15": "I-LOC",
31
+ "16": "B-ENCR",
32
+ "17": "B-FILE",
33
+ "18": "B-SHA2",
34
+ "19": "B-URL",
35
+ "20": "B-IP",
36
+ "21": "PROT",
37
+ "22": "B-ACT",
38
+ "23": "I-ACT",
39
+ "24": "B-MD5",
40
+ "25": "I-FILE",
41
+ "26": "B-DOM",
42
+ "27": "I-MAL",
43
+ "28": "B-OS",
44
+ "29": "B-SHA1",
45
+ "30": "I-URL",
46
+ "31": "I-IP",
47
+ "32": "I-SHA2",
48
+ "33": "I-OS",
49
+ "34": "B-PROT",
50
+ "35": "I-VULNAME",
51
+ "36": "I-PROT",
52
+ "37": "B-EMAIL",
53
+ "38": "I-EMAIL",
54
+ "39": "I-ENCR"
55
+ },
56
+ "initializer_range": 0.02,
57
+ "intermediate_size": 3072,
58
+ "label2id": {
59
+ "LABEL_0": 0,
60
+ "LABEL_1": 1,
61
+ "LABEL_10": 10,
62
+ "LABEL_11": 11,
63
+ "LABEL_12": 12,
64
+ "LABEL_13": 13,
65
+ "LABEL_14": 14,
66
+ "LABEL_15": 15,
67
+ "LABEL_16": 16,
68
+ "LABEL_17": 17,
69
+ "LABEL_18": 18,
70
+ "LABEL_19": 19,
71
+ "LABEL_2": 2,
72
+ "LABEL_20": 20,
73
+ "LABEL_21": 21,
74
+ "LABEL_22": 22,
75
+ "LABEL_23": 23,
76
+ "LABEL_24": 24,
77
+ "LABEL_25": 25,
78
+ "LABEL_26": 26,
79
+ "LABEL_27": 27,
80
+ "LABEL_28": 28,
81
+ "LABEL_29": 29,
82
+ "LABEL_3": 3,
83
+ "LABEL_30": 30,
84
+ "LABEL_31": 31,
85
+ "LABEL_32": 32,
86
+ "LABEL_33": 33,
87
+ "LABEL_34": 34,
88
+ "LABEL_35": 35,
89
+ "LABEL_36": 36,
90
+ "LABEL_37": 37,
91
+ "LABEL_38": 38,
92
+ "LABEL_39": 39,
93
+ "LABEL_4": 4,
94
+ "LABEL_5": 5,
95
+ "LABEL_6": 6,
96
+ "LABEL_7": 7,
97
+ "LABEL_8": 8,
98
+ "LABEL_9": 9
99
+ },
100
+ "layer_norm_eps": 1e-05,
101
+ "max_position_embeddings": 514,
102
+ "model_type": "roberta",
103
+ "num_attention_heads": 12,
104
+ "num_hidden_layers": 12,
105
+ "pad_token_id": 1,
106
+ "position_embedding_type": "absolute",
107
+ "torch_dtype": "float32",
108
+ "transformers_version": "4.30.2",
109
+ "type_vocab_size": 1,
110
+ "use_cache": true,
111
+ "vocab_size": 50265
112
+ }
model.safetensors → optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77bf2a463b0e30ac6af59c0bcf001b0ca3d2a275e09b2d1817d66ec2b8f79a28
3
- size 496371344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80eeff212abb98c229cf1a57c2c3ba32aabcaa4d0cc870227c25f7f199bf9ac8
3
+ size 992803077
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d4e81ebf0b524e792d70b6595bce9ae5ac0002f39ab99c530759a8750a77ce08
3
  size 496415917
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e7b4c4b81357d1b66817e0cd5fe8d98dec8c79e4cb9ba57bfcfaf802057f4e2
3
  size 496415917
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdfc53f7cc49e4005f5d8b36345a038ddf3baff2043f73abe2c889fc8a1bfa92
3
+ size 14575
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74d996bcccf5d50efb552f4856a2c1fd07641d6aa7b4297df83f18bc3624e26a
3
+ size 627
trainer_state.json ADDED
@@ -0,0 +1,274 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 9.433962264150944,
5
+ "global_step": 5000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.38,
12
+ "learning_rate": 9.748427672955975e-05,
13
+ "loss": 1.3506,
14
+ "step": 200
15
+ },
16
+ {
17
+ "epoch": 0.75,
18
+ "learning_rate": 9.496855345911951e-05,
19
+ "loss": 1.0358,
20
+ "step": 400
21
+ },
22
+ {
23
+ "epoch": 1.0,
24
+ "eval_accuracy": 0.9021613276727133,
25
+ "eval_f1": 0.6651721377101681,
26
+ "eval_loss": 0.9438411593437195,
27
+ "eval_precision": 0.6371165644171779,
28
+ "eval_recall": 0.6958123953098827,
29
+ "eval_runtime": 9.5281,
30
+ "eval_samples_per_second": 162.152,
31
+ "eval_steps_per_second": 10.18,
32
+ "step": 530
33
+ },
34
+ {
35
+ "epoch": 1.13,
36
+ "learning_rate": 9.245283018867925e-05,
37
+ "loss": 0.9613,
38
+ "step": 600
39
+ },
40
+ {
41
+ "epoch": 1.51,
42
+ "learning_rate": 8.9937106918239e-05,
43
+ "loss": 0.9255,
44
+ "step": 800
45
+ },
46
+ {
47
+ "epoch": 1.89,
48
+ "learning_rate": 8.742138364779875e-05,
49
+ "loss": 0.9074,
50
+ "step": 1000
51
+ },
52
+ {
53
+ "epoch": 2.0,
54
+ "eval_accuracy": 0.9115099275269094,
55
+ "eval_f1": 0.698074203024698,
56
+ "eval_loss": 0.9242610335350037,
57
+ "eval_precision": 0.6805982815317705,
58
+ "eval_recall": 0.7164712451144611,
59
+ "eval_runtime": 8.173,
60
+ "eval_samples_per_second": 189.038,
61
+ "eval_steps_per_second": 11.868,
62
+ "step": 1060
63
+ },
64
+ {
65
+ "epoch": 2.26,
66
+ "learning_rate": 8.49056603773585e-05,
67
+ "loss": 0.8659,
68
+ "step": 1200
69
+ },
70
+ {
71
+ "epoch": 2.64,
72
+ "learning_rate": 8.238993710691824e-05,
73
+ "loss": 0.8605,
74
+ "step": 1400
75
+ },
76
+ {
77
+ "epoch": 3.0,
78
+ "eval_accuracy": 0.9139971696899524,
79
+ "eval_f1": 0.7123908477948492,
80
+ "eval_loss": 0.9207843542098999,
81
+ "eval_precision": 0.7052193894299158,
82
+ "eval_recall": 0.7197096594081519,
83
+ "eval_runtime": 9.4717,
84
+ "eval_samples_per_second": 163.117,
85
+ "eval_steps_per_second": 10.241,
86
+ "step": 1590
87
+ },
88
+ {
89
+ "epoch": 3.02,
90
+ "learning_rate": 7.9874213836478e-05,
91
+ "loss": 0.8467,
92
+ "step": 1600
93
+ },
94
+ {
95
+ "epoch": 3.4,
96
+ "learning_rate": 7.735849056603774e-05,
97
+ "loss": 0.817,
98
+ "step": 1800
99
+ },
100
+ {
101
+ "epoch": 3.77,
102
+ "learning_rate": 7.484276729559749e-05,
103
+ "loss": 0.8003,
104
+ "step": 2000
105
+ },
106
+ {
107
+ "epoch": 4.0,
108
+ "eval_accuracy": 0.9139757279471675,
109
+ "eval_f1": 0.7284265336009113,
110
+ "eval_loss": 0.9339075088500977,
111
+ "eval_precision": 0.7081839274414681,
112
+ "eval_recall": 0.7498604131769961,
113
+ "eval_runtime": 7.979,
114
+ "eval_samples_per_second": 193.634,
115
+ "eval_steps_per_second": 12.157,
116
+ "step": 2120
117
+ },
118
+ {
119
+ "epoch": 4.15,
120
+ "learning_rate": 7.232704402515723e-05,
121
+ "loss": 0.7937,
122
+ "step": 2200
123
+ },
124
+ {
125
+ "epoch": 4.53,
126
+ "learning_rate": 6.981132075471698e-05,
127
+ "loss": 0.777,
128
+ "step": 2400
129
+ },
130
+ {
131
+ "epoch": 4.91,
132
+ "learning_rate": 6.729559748427673e-05,
133
+ "loss": 0.7759,
134
+ "step": 2600
135
+ },
136
+ {
137
+ "epoch": 5.0,
138
+ "eval_accuracy": 0.9262404048201037,
139
+ "eval_f1": 0.7729500891265597,
140
+ "eval_loss": 0.9294289946556091,
141
+ "eval_precision": 0.7711459375347338,
142
+ "eval_recall": 0.7747627024008934,
143
+ "eval_runtime": 7.9554,
144
+ "eval_samples_per_second": 194.207,
145
+ "eval_steps_per_second": 12.193,
146
+ "step": 2650
147
+ },
148
+ {
149
+ "epoch": 5.28,
150
+ "learning_rate": 6.477987421383648e-05,
151
+ "loss": 0.7514,
152
+ "step": 2800
153
+ },
154
+ {
155
+ "epoch": 5.66,
156
+ "learning_rate": 6.226415094339622e-05,
157
+ "loss": 0.7585,
158
+ "step": 3000
159
+ },
160
+ {
161
+ "epoch": 6.0,
162
+ "eval_accuracy": 0.9251039924525065,
163
+ "eval_f1": 0.7699395015818395,
164
+ "eval_loss": 0.932030200958252,
165
+ "eval_precision": 0.765393952769808,
166
+ "eval_recall": 0.7745393634840871,
167
+ "eval_runtime": 7.9892,
168
+ "eval_samples_per_second": 193.385,
169
+ "eval_steps_per_second": 12.141,
170
+ "step": 3180
171
+ },
172
+ {
173
+ "epoch": 6.04,
174
+ "learning_rate": 5.974842767295597e-05,
175
+ "loss": 0.7529,
176
+ "step": 3200
177
+ },
178
+ {
179
+ "epoch": 6.42,
180
+ "learning_rate": 5.7232704402515724e-05,
181
+ "loss": 0.7338,
182
+ "step": 3400
183
+ },
184
+ {
185
+ "epoch": 6.79,
186
+ "learning_rate": 5.4716981132075475e-05,
187
+ "loss": 0.7357,
188
+ "step": 3600
189
+ },
190
+ {
191
+ "epoch": 7.0,
192
+ "eval_accuracy": 0.9156910673699559,
193
+ "eval_f1": 0.732724471830986,
194
+ "eval_loss": 0.9781692624092102,
195
+ "eval_precision": 0.7221559483787008,
196
+ "eval_recall": 0.743606923506421,
197
+ "eval_runtime": 9.4609,
198
+ "eval_samples_per_second": 163.304,
199
+ "eval_steps_per_second": 10.253,
200
+ "step": 3710
201
+ },
202
+ {
203
+ "epoch": 7.17,
204
+ "learning_rate": 5.220125786163522e-05,
205
+ "loss": 0.7282,
206
+ "step": 3800
207
+ },
208
+ {
209
+ "epoch": 7.55,
210
+ "learning_rate": 4.968553459119497e-05,
211
+ "loss": 0.7249,
212
+ "step": 4000
213
+ },
214
+ {
215
+ "epoch": 7.92,
216
+ "learning_rate": 4.716981132075472e-05,
217
+ "loss": 0.7207,
218
+ "step": 4200
219
+ },
220
+ {
221
+ "epoch": 8.0,
222
+ "eval_accuracy": 0.917277756336035,
223
+ "eval_f1": 0.757945684323743,
224
+ "eval_loss": 0.9978876113891602,
225
+ "eval_precision": 0.7310165975103734,
226
+ "eval_recall": 0.7869346733668342,
227
+ "eval_runtime": 7.9066,
228
+ "eval_samples_per_second": 195.405,
229
+ "eval_steps_per_second": 12.268,
230
+ "step": 4240
231
+ },
232
+ {
233
+ "epoch": 8.3,
234
+ "learning_rate": 4.4654088050314466e-05,
235
+ "loss": 0.7137,
236
+ "step": 4400
237
+ },
238
+ {
239
+ "epoch": 8.68,
240
+ "learning_rate": 4.213836477987422e-05,
241
+ "loss": 0.712,
242
+ "step": 4600
243
+ },
244
+ {
245
+ "epoch": 9.0,
246
+ "eval_accuracy": 0.9261117543633947,
247
+ "eval_f1": 0.7805572280913022,
248
+ "eval_loss": 0.9675424098968506,
249
+ "eval_precision": 0.7655142795791282,
250
+ "eval_recall": 0.7962032384142937,
251
+ "eval_runtime": 7.9396,
252
+ "eval_samples_per_second": 194.593,
253
+ "eval_steps_per_second": 12.217,
254
+ "step": 4770
255
+ },
256
+ {
257
+ "epoch": 9.06,
258
+ "learning_rate": 3.962264150943397e-05,
259
+ "loss": 0.7111,
260
+ "step": 4800
261
+ },
262
+ {
263
+ "epoch": 9.43,
264
+ "learning_rate": 3.710691823899371e-05,
265
+ "loss": 0.7048,
266
+ "step": 5000
267
+ }
268
+ ],
269
+ "max_steps": 7950,
270
+ "num_train_epochs": 15,
271
+ "total_flos": 4470902182940160.0,
272
+ "trial_name": null,
273
+ "trial_params": null
274
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b0aa52a3d66faa93cbd911a3f00510e7297e52451a4d13d72962992f719356e
3
  size 3963
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15afa73cc856b0ff58c9ad71cc382b4a12190fed06d9d360b7dbd0183bb05a5f
3
  size 3963