clincolnoz committed on
Commit
8fa6cc5
1 Parent(s): 887c4ac

correct weights

Browse files
README.md CHANGED
@@ -5,14 +5,14 @@ metrics:
5
  - f1
6
  - accuracy
7
  model-index:
8
- - name: final-lr2e-5-bs16
9
  results: []
10
  ---
11
 
12
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
13
  should probably proofread and complete it, then remove this comment. -->
14
 
15
- # final-lr2e-5-bs16
16
 
17
  This model is a fine-tuned version of [clincolnoz/LessSexistBERT](https://huggingface.co/clincolnoz/LessSexistBERT) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
 
5
  - f1
6
  - accuracy
7
  model-index:
8
+ - name: final-lr2e-5-bs16-fp16-2
9
  results: []
10
  ---
11
 
12
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
13
  should probably proofread and complete it, then remove this comment. -->
14
 
15
+ # final-lr2e-5-bs16-fp16-2
16
 
17
  This model is a fine-tuned version of [clincolnoz/LessSexistBERT](https://huggingface.co/clincolnoz/LessSexistBERT) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
all_results.json CHANGED
@@ -8,13 +8,13 @@
8
  "eval_f1_macro": 0.8374201959393394,
9
  "eval_f1_weighted": 0.8806450852201921,
10
  "eval_loss": 0.3457934856414795,
11
- "eval_runtime": 9.6259,
12
  "eval_samples": 4000,
13
- "eval_samples_per_second": 415.545,
14
- "eval_steps_per_second": 25.972,
15
  "train_loss": 0.27966182454427085,
16
- "train_runtime": 436.5097,
17
  "train_samples": 16000,
18
- "train_samples_per_second": 109.963,
19
- "train_steps_per_second": 6.873
20
  }
 
8
  "eval_f1_macro": 0.8374201959393394,
9
  "eval_f1_weighted": 0.8806450852201921,
10
  "eval_loss": 0.3457934856414795,
11
+ "eval_runtime": 9.6249,
12
  "eval_samples": 4000,
13
+ "eval_samples_per_second": 415.588,
14
+ "eval_steps_per_second": 25.974,
15
  "train_loss": 0.27966182454427085,
16
+ "train_runtime": 430.7509,
17
  "train_samples": 16000,
18
+ "train_samples_per_second": 111.433,
19
+ "train_steps_per_second": 6.965
20
  }
eval_results.json CHANGED
@@ -8,8 +8,8 @@
8
  "eval_f1_macro": 0.8374201959393394,
9
  "eval_f1_weighted": 0.8806450852201921,
10
  "eval_loss": 0.3457934856414795,
11
- "eval_runtime": 9.6259,
12
  "eval_samples": 4000,
13
- "eval_samples_per_second": 415.545,
14
- "eval_steps_per_second": 25.972
15
  }
 
8
  "eval_f1_macro": 0.8374201959393394,
9
  "eval_f1_weighted": 0.8806450852201921,
10
  "eval_loss": 0.3457934856414795,
11
+ "eval_runtime": 9.6249,
12
  "eval_samples": 4000,
13
+ "eval_samples_per_second": 415.588,
14
+ "eval_steps_per_second": 25.974
15
  }
predict_results_None.txt CHANGED
The diff for this file is too large to render. See raw diff
 
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
  "train_loss": 0.27966182454427085,
4
- "train_runtime": 436.5097,
5
  "train_samples": 16000,
6
- "train_samples_per_second": 109.963,
7
- "train_steps_per_second": 6.873
8
  }
 
1
  {
2
  "epoch": 3.0,
3
  "train_loss": 0.27966182454427085,
4
+ "train_runtime": 430.7509,
5
  "train_samples": 16000,
6
+ "train_samples_per_second": 111.433,
7
+ "train_steps_per_second": 6.965
8
  }
trainer_state.json CHANGED
@@ -29,9 +29,9 @@
29
  "eval_f1_macro": 0.8256385630330887,
30
  "eval_f1_weighted": 0.8748468477738904,
31
  "eval_loss": 0.3010723888874054,
32
- "eval_runtime": 9.6387,
33
- "eval_samples_per_second": 414.993,
34
- "eval_steps_per_second": 25.937,
35
  "step": 1000
36
  },
37
  {
@@ -56,9 +56,9 @@
56
  "eval_f1_macro": 0.84110534680508,
57
  "eval_f1_weighted": 0.8848438807534127,
58
  "eval_loss": 0.3121766746044159,
59
- "eval_runtime": 9.6263,
60
- "eval_samples_per_second": 415.529,
61
- "eval_steps_per_second": 25.971,
62
  "step": 2000
63
  },
64
  {
@@ -83,9 +83,9 @@
83
  "eval_f1_macro": 0.8374201959393394,
84
  "eval_f1_weighted": 0.8806450852201921,
85
  "eval_loss": 0.3457934856414795,
86
- "eval_runtime": 9.6302,
87
- "eval_samples_per_second": 415.361,
88
- "eval_steps_per_second": 25.96,
89
  "step": 3000
90
  },
91
  {
@@ -93,9 +93,9 @@
93
  "step": 3000,
94
  "total_flos": 1.262933065728e+16,
95
  "train_loss": 0.27966182454427085,
96
- "train_runtime": 436.5097,
97
- "train_samples_per_second": 109.963,
98
- "train_steps_per_second": 6.873
99
  }
100
  ],
101
  "max_steps": 3000,
 
29
  "eval_f1_macro": 0.8256385630330887,
30
  "eval_f1_weighted": 0.8748468477738904,
31
  "eval_loss": 0.3010723888874054,
32
+ "eval_runtime": 9.6596,
33
+ "eval_samples_per_second": 414.097,
34
+ "eval_steps_per_second": 25.881,
35
  "step": 1000
36
  },
37
  {
 
56
  "eval_f1_macro": 0.84110534680508,
57
  "eval_f1_weighted": 0.8848438807534127,
58
  "eval_loss": 0.3121766746044159,
59
+ "eval_runtime": 9.6642,
60
+ "eval_samples_per_second": 413.897,
61
+ "eval_steps_per_second": 25.869,
62
  "step": 2000
63
  },
64
  {
 
83
  "eval_f1_macro": 0.8374201959393394,
84
  "eval_f1_weighted": 0.8806450852201921,
85
  "eval_loss": 0.3457934856414795,
86
+ "eval_runtime": 9.6651,
87
+ "eval_samples_per_second": 413.86,
88
+ "eval_steps_per_second": 25.866,
89
  "step": 3000
90
  },
91
  {
 
93
  "step": 3000,
94
  "total_flos": 1.262933065728e+16,
95
  "train_loss": 0.27966182454427085,
96
+ "train_runtime": 430.7509,
97
+ "train_samples_per_second": 111.433,
98
+ "train_steps_per_second": 6.965
99
  }
100
  ],
101
  "max_steps": 3000,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf156ae74a37a378f8916ca566a842b16575ec3ad5384916e9c69010b34a1ae0
3
  size 3643
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19635231ad63260728a01f0ae1dced21f343315a5fc1070be2fd708a403c7343
3
  size 3643