Marcos12886 committed on
Commit
65c1586
1 Parent(s): a007ad9

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -21,11 +21,11 @@ should probably proofread and complete it, then remove this comment. -->
21
 
22
  This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on an unknown dataset.
23
  It achieves the following results on the evaluation set:
24
- - Loss: 0.0878
25
- - Accuracy: 0.9861
26
- - Precision: 0.9861
27
- - Recall: 0.9861
28
- - F1: 0.9861
29
 
30
  ## Model description
31
 
@@ -44,7 +44,7 @@ More information needed
44
  ### Training hyperparameters
45
 
46
  The following hyperparameters were used during training:
47
- - learning_rate: 0.0001
48
  - train_batch_size: 8
49
  - eval_batch_size: 8
50
  - seed: 123
@@ -53,20 +53,19 @@ The following hyperparameters were used during training:
53
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
54
  - lr_scheduler_type: cosine
55
  - lr_scheduler_warmup_ratio: 0.001
56
- - num_epochs: 8
57
 
58
  ### Training results
59
 
60
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | Precision | Recall | F1 |
61
  |:-------------:|:------:|:----:|:---------------:|:--------:|:---------:|:------:|:------:|
62
- | No log | 0.9956 | 85 | 0.1204 | 0.9641 | 0.9641 | 0.9641 | 0.9638 |
63
- | No log | 1.9912 | 170 | 0.0847 | 0.9773 | 0.9772 | 0.9773 | 0.9773 |
64
- | No log | 2.9985 | 256 | 0.1025 | 0.9766 | 0.9769 | 0.9766 | 0.9766 |
65
- | No log | 3.9941 | 341 | 0.0869 | 0.9832 | 0.9835 | 0.9832 | 0.9832 |
66
- | No log | 4.9898 | 426 | 0.0746 | 0.9832 | 0.9834 | 0.9832 | 0.9832 |
67
- | 0.0538 | 5.9971 | 512 | 0.0870 | 0.9861 | 0.9861 | 0.9861 | 0.9861 |
68
- | 0.0538 | 6.9927 | 597 | 0.0890 | 0.9861 | 0.9861 | 0.9861 | 0.9861 |
69
- | 0.0538 | 7.9649 | 680 | 0.0878 | 0.9861 | 0.9861 | 0.9861 | 0.9861 |
70
 
71
 
72
  ### Framework versions
 
21
 
22
  This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on an unknown dataset.
23
  It achieves the following results on the evaluation set:
24
+ - Loss: 0.0359
25
+ - Accuracy: 0.9883
26
+ - Precision: 0.9883
27
+ - Recall: 0.9883
28
+ - F1: 0.9883
29
 
30
  ## Model description
31
 
 
44
  ### Training hyperparameters
45
 
46
  The following hyperparameters were used during training:
47
+ - learning_rate: 5e-05
48
  - train_batch_size: 8
49
  - eval_batch_size: 8
50
  - seed: 123
 
53
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
54
  - lr_scheduler_type: cosine
55
  - lr_scheduler_warmup_ratio: 0.001
56
+ - num_epochs: 10
57
 
58
  ### Training results
59
 
60
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | Precision | Recall | F1 |
61
  |:-------------:|:------:|:----:|:---------------:|:--------:|:---------:|:------:|:------:|
62
+ | No log | 0.9956 | 85 | 0.1341 | 0.9538 | 0.9543 | 0.9538 | 0.9532 |
63
+ | No log | 1.9912 | 170 | 0.0831 | 0.9700 | 0.9720 | 0.9700 | 0.9703 |
64
+ | No log | 2.9985 | 256 | 0.0570 | 0.9846 | 0.9847 | 0.9846 | 0.9846 |
65
+ | No log | 3.9941 | 341 | 0.0340 | 0.9897 | 0.9898 | 0.9897 | 0.9898 |
66
+ | No log | 4.9898 | 426 | 0.0460 | 0.9875 | 0.9879 | 0.9875 | 0.9876 |
67
+ | 0.0707 | 5.9971 | 512 | 0.0431 | 0.9897 | 0.9899 | 0.9897 | 0.9898 |
68
+ | 0.0707 | 6.9927 | 597 | 0.0359 | 0.9883 | 0.9883 | 0.9883 | 0.9883 |
 
69
 
70
 
71
  ### Framework versions
checkpoint-170/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ddc4c9cb0876910fe2ac6089e9622d2ec25163c90268babf3b3a68cc1955bbc3
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85ed9f40490b0d3b2eab42a74aa78295bc0d5dc610c89bcfd6132ab265cc46c1
3
  size 94763496
checkpoint-170/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f284ad3b43a12e7fdbaf43673ca92e158c1ab9cbea63e0352b6085f5564ff555
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:884f223ad6abdd025f9f4a7bfacafc6c26b7792676f01b2a92bf8115fe98f14b
3
  size 189552570
checkpoint-170/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28ead2442e291cf84a44bd5f670a529388e7aee7f31ec31fec65f8af5dd527ac
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cb57d1cea1cb2499417a821f65ecd6374c5073b4605d8ad26f8414a8ef5b7bd
3
  size 1064
checkpoint-170/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.9772893772893773,
3
  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-170",
4
  "epoch": 1.9912152269399708,
5
  "eval_steps": 500,
@@ -10,33 +10,33 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9641025641025641,
14
- "eval_f1": 0.9637911305761953,
15
- "eval_loss": 0.12035853415727615,
16
- "eval_precision": 0.9640509308043554,
17
- "eval_recall": 0.9641025641025641,
18
- "eval_runtime": 6.052,
19
- "eval_samples_per_second": 225.545,
20
- "eval_steps_per_second": 28.255,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
- "eval_accuracy": 0.9772893772893773,
26
- "eval_f1": 0.9772624500008753,
27
- "eval_loss": 0.08473604917526245,
28
- "eval_precision": 0.9772470873644479,
29
- "eval_recall": 0.9772893772893773,
30
- "eval_runtime": 5.9068,
31
- "eval_samples_per_second": 231.09,
32
- "eval_steps_per_second": 28.95,
33
  "step": 170
34
  }
35
  ],
36
  "logging_steps": 500,
37
- "max_steps": 680,
38
  "num_input_tokens_seen": 0,
39
- "num_train_epochs": 8,
40
  "save_steps": 500,
41
  "stateful_callbacks": {
42
  "EarlyStoppingCallback": {
 
1
  {
2
+ "best_metric": 0.96996336996337,
3
  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-170",
4
  "epoch": 1.9912152269399708,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.953235199825453,
15
+ "eval_loss": 0.13410410284996033,
16
+ "eval_precision": 0.9543176332312968,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.9191,
19
+ "eval_samples_per_second": 230.61,
20
+ "eval_steps_per_second": 28.89,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.96996336996337,
26
+ "eval_f1": 0.970275727358029,
27
+ "eval_loss": 0.08308757096529007,
28
+ "eval_precision": 0.9720059808561178,
29
+ "eval_recall": 0.96996336996337,
30
+ "eval_runtime": 5.9321,
31
+ "eval_samples_per_second": 230.105,
32
+ "eval_steps_per_second": 28.826,
33
  "step": 170
34
  }
35
  ],
36
  "logging_steps": 500,
37
+ "max_steps": 850,
38
  "num_input_tokens_seen": 0,
39
+ "num_train_epochs": 10,
40
  "save_steps": 500,
41
  "stateful_callbacks": {
42
  "EarlyStoppingCallback": {
checkpoint-170/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cda0bf828ccc04cd6d3fb7933f60f34ca3c8ba14b14579f9e878d688bc739b4a
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:831297954221509dc3f32e8eaf01789c3f660cf430e186799d52e58ec3b5b334
3
  size 5240
checkpoint-256/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e8fcce3d6821b09907a57bf2280fdb73fc79c008d23670c77bd0350d6249146
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0ef8be12a66054ee49a311e5cbc1e77f0f3bfeb6e0808f2d1f3fb47764355ad
3
  size 94763496
checkpoint-256/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb370b3600823d6c126a14d977da564c51a816566b23701954070eb23a1ecf47
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fa10a1f73ef67de699f17b8a38795e4419b28e161b6906950ff154e933bfac8
3
  size 189552570
checkpoint-256/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1ef84753a69d0410f7f7d925e2fedd5694b09472e6721f4fe864ef701cb0dd7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b581d82b68cb684515c782403bb76f13250579eff8704b811486ec59bb8e6b6a
3
  size 1064
checkpoint-256/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9772893772893773,
3
- "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-170",
4
  "epoch": 2.998535871156662,
5
  "eval_steps": 500,
6
  "global_step": 256,
@@ -10,45 +10,45 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9641025641025641,
14
- "eval_f1": 0.9637911305761953,
15
- "eval_loss": 0.12035853415727615,
16
- "eval_precision": 0.9640509308043554,
17
- "eval_recall": 0.9641025641025641,
18
- "eval_runtime": 6.052,
19
- "eval_samples_per_second": 225.545,
20
- "eval_steps_per_second": 28.255,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
- "eval_accuracy": 0.9772893772893773,
26
- "eval_f1": 0.9772624500008753,
27
- "eval_loss": 0.08473604917526245,
28
- "eval_precision": 0.9772470873644479,
29
- "eval_recall": 0.9772893772893773,
30
- "eval_runtime": 5.9068,
31
- "eval_samples_per_second": 231.09,
32
- "eval_steps_per_second": 28.95,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
- "eval_accuracy": 0.9765567765567765,
38
- "eval_f1": 0.9766464967450174,
39
- "eval_loss": 0.10245847702026367,
40
- "eval_precision": 0.9768621127754256,
41
- "eval_recall": 0.9765567765567765,
42
- "eval_runtime": 5.8911,
43
- "eval_samples_per_second": 231.706,
44
- "eval_steps_per_second": 29.027,
45
  "step": 256
46
  }
47
  ],
48
  "logging_steps": 500,
49
- "max_steps": 680,
50
  "num_input_tokens_seen": 0,
51
- "num_train_epochs": 8,
52
  "save_steps": 500,
53
  "stateful_callbacks": {
54
  "EarlyStoppingCallback": {
 
1
  {
2
+ "best_metric": 0.9846153846153847,
3
+ "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-256",
4
  "epoch": 2.998535871156662,
5
  "eval_steps": 500,
6
  "global_step": 256,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.953235199825453,
15
+ "eval_loss": 0.13410410284996033,
16
+ "eval_precision": 0.9543176332312968,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.9191,
19
+ "eval_samples_per_second": 230.61,
20
+ "eval_steps_per_second": 28.89,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.96996336996337,
26
+ "eval_f1": 0.970275727358029,
27
+ "eval_loss": 0.08308757096529007,
28
+ "eval_precision": 0.9720059808561178,
29
+ "eval_recall": 0.96996336996337,
30
+ "eval_runtime": 5.9321,
31
+ "eval_samples_per_second": 230.105,
32
+ "eval_steps_per_second": 28.826,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
+ "eval_accuracy": 0.9846153846153847,
38
+ "eval_f1": 0.9845587007434289,
39
+ "eval_loss": 0.05695493519306183,
40
+ "eval_precision": 0.984652882646444,
41
+ "eval_recall": 0.9846153846153847,
42
+ "eval_runtime": 5.924,
43
+ "eval_samples_per_second": 230.421,
44
+ "eval_steps_per_second": 28.866,
45
  "step": 256
46
  }
47
  ],
48
  "logging_steps": 500,
49
+ "max_steps": 850,
50
  "num_input_tokens_seen": 0,
51
+ "num_train_epochs": 10,
52
  "save_steps": 500,
53
  "stateful_callbacks": {
54
  "EarlyStoppingCallback": {
checkpoint-256/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cda0bf828ccc04cd6d3fb7933f60f34ca3c8ba14b14579f9e878d688bc739b4a
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:831297954221509dc3f32e8eaf01789c3f660cf430e186799d52e58ec3b5b334
3
  size 5240
checkpoint-341/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:083f40b77a3962067064a68eb072696b4bf2222ce7f9bdab915843b0aab6cf86
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:937ffa1cb79f16f4e7753ea842c3e32fe34e525562027e5b33ce48fc4b308a82
3
  size 94763496
checkpoint-341/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f581f41271d1b7b3e94ec5316e0b37c75a3ad264185a441b84016451887b8ec4
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a6119421582bbc05f8c02a4a9aab4dfdd2cb761cc17d9b827d99f803877b837
3
  size 189552570
checkpoint-341/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5073b7c775ebf0fc889f5dba154fdfe2dbb913e0f115f2091d61c7aad83715e
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6383f793cae08448b1e6023eca64340792bd03b29faa8b0a3800859cbaf6c3ca
3
  size 1064
checkpoint-341/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.9831501831501831,
3
  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
4
  "epoch": 3.994143484626647,
5
  "eval_steps": 500,
@@ -10,57 +10,57 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9641025641025641,
14
- "eval_f1": 0.9637911305761953,
15
- "eval_loss": 0.12035853415727615,
16
- "eval_precision": 0.9640509308043554,
17
- "eval_recall": 0.9641025641025641,
18
- "eval_runtime": 6.052,
19
- "eval_samples_per_second": 225.545,
20
- "eval_steps_per_second": 28.255,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
- "eval_accuracy": 0.9772893772893773,
26
- "eval_f1": 0.9772624500008753,
27
- "eval_loss": 0.08473604917526245,
28
- "eval_precision": 0.9772470873644479,
29
- "eval_recall": 0.9772893772893773,
30
- "eval_runtime": 5.9068,
31
- "eval_samples_per_second": 231.09,
32
- "eval_steps_per_second": 28.95,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
- "eval_accuracy": 0.9765567765567765,
38
- "eval_f1": 0.9766464967450174,
39
- "eval_loss": 0.10245847702026367,
40
- "eval_precision": 0.9768621127754256,
41
- "eval_recall": 0.9765567765567765,
42
- "eval_runtime": 5.8911,
43
- "eval_samples_per_second": 231.706,
44
- "eval_steps_per_second": 29.027,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
- "eval_accuracy": 0.9831501831501831,
50
- "eval_f1": 0.9832333934847322,
51
- "eval_loss": 0.08685966581106186,
52
- "eval_precision": 0.9835305336122597,
53
- "eval_recall": 0.9831501831501831,
54
- "eval_runtime": 5.9568,
55
- "eval_samples_per_second": 229.152,
56
- "eval_steps_per_second": 28.707,
57
  "step": 341
58
  }
59
  ],
60
  "logging_steps": 500,
61
- "max_steps": 680,
62
  "num_input_tokens_seen": 0,
63
- "num_train_epochs": 8,
64
  "save_steps": 500,
65
  "stateful_callbacks": {
66
  "EarlyStoppingCallback": {
 
1
  {
2
+ "best_metric": 0.9897435897435898,
3
  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
4
  "epoch": 3.994143484626647,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.953235199825453,
15
+ "eval_loss": 0.13410410284996033,
16
+ "eval_precision": 0.9543176332312968,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.9191,
19
+ "eval_samples_per_second": 230.61,
20
+ "eval_steps_per_second": 28.89,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.96996336996337,
26
+ "eval_f1": 0.970275727358029,
27
+ "eval_loss": 0.08308757096529007,
28
+ "eval_precision": 0.9720059808561178,
29
+ "eval_recall": 0.96996336996337,
30
+ "eval_runtime": 5.9321,
31
+ "eval_samples_per_second": 230.105,
32
+ "eval_steps_per_second": 28.826,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
+ "eval_accuracy": 0.9846153846153847,
38
+ "eval_f1": 0.9845587007434289,
39
+ "eval_loss": 0.05695493519306183,
40
+ "eval_precision": 0.984652882646444,
41
+ "eval_recall": 0.9846153846153847,
42
+ "eval_runtime": 5.924,
43
+ "eval_samples_per_second": 230.421,
44
+ "eval_steps_per_second": 28.866,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
+ "eval_accuracy": 0.9897435897435898,
50
+ "eval_f1": 0.9897502348272303,
51
+ "eval_loss": 0.03400224819779396,
52
+ "eval_precision": 0.9897618176566864,
53
+ "eval_recall": 0.9897435897435898,
54
+ "eval_runtime": 5.9234,
55
+ "eval_samples_per_second": 230.441,
56
+ "eval_steps_per_second": 28.868,
57
  "step": 341
58
  }
59
  ],
60
  "logging_steps": 500,
61
+ "max_steps": 850,
62
  "num_input_tokens_seen": 0,
63
+ "num_train_epochs": 10,
64
  "save_steps": 500,
65
  "stateful_callbacks": {
66
  "EarlyStoppingCallback": {
checkpoint-341/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cda0bf828ccc04cd6d3fb7933f60f34ca3c8ba14b14579f9e878d688bc739b4a
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:831297954221509dc3f32e8eaf01789c3f660cf430e186799d52e58ec3b5b334
3
  size 5240
checkpoint-426/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a9d6d392a4f841e92110c90f40ef7219881d17b11f11a64bad39c27cbe0178e
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f2381bd8ac8db8cd3c2425166e4419c44d01eb2bdc4a00d95e3ff3806ebad52
3
  size 94763496
checkpoint-426/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fcfe6fb7847bde58aeb36b9a7bc45200d4352f754fb3595c33126144f17addf2
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddad96bd00a38ac13e824dddeb8bec0bff93f4b8005f4f483d201e92de9bdadf
3
  size 189552570
checkpoint-426/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d56f52cf1fd1013d5989e211cbbbf97096f52d89af5defd532d0d8a25d4724f7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f3d79bed0dd03dfef1d407d59369329e4670d54e356165ddfc162563cf81d14
3
  size 1064
checkpoint-426/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.9831501831501831,
3
  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
4
  "epoch": 4.989751098096632,
5
  "eval_steps": 500,
@@ -10,69 +10,69 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9641025641025641,
14
- "eval_f1": 0.9637911305761953,
15
- "eval_loss": 0.12035853415727615,
16
- "eval_precision": 0.9640509308043554,
17
- "eval_recall": 0.9641025641025641,
18
- "eval_runtime": 6.052,
19
- "eval_samples_per_second": 225.545,
20
- "eval_steps_per_second": 28.255,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
- "eval_accuracy": 0.9772893772893773,
26
- "eval_f1": 0.9772624500008753,
27
- "eval_loss": 0.08473604917526245,
28
- "eval_precision": 0.9772470873644479,
29
- "eval_recall": 0.9772893772893773,
30
- "eval_runtime": 5.9068,
31
- "eval_samples_per_second": 231.09,
32
- "eval_steps_per_second": 28.95,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
- "eval_accuracy": 0.9765567765567765,
38
- "eval_f1": 0.9766464967450174,
39
- "eval_loss": 0.10245847702026367,
40
- "eval_precision": 0.9768621127754256,
41
- "eval_recall": 0.9765567765567765,
42
- "eval_runtime": 5.8911,
43
- "eval_samples_per_second": 231.706,
44
- "eval_steps_per_second": 29.027,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
- "eval_accuracy": 0.9831501831501831,
50
- "eval_f1": 0.9832333934847322,
51
- "eval_loss": 0.08685966581106186,
52
- "eval_precision": 0.9835305336122597,
53
- "eval_recall": 0.9831501831501831,
54
- "eval_runtime": 5.9568,
55
- "eval_samples_per_second": 229.152,
56
- "eval_steps_per_second": 28.707,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
- "eval_accuracy": 0.9831501831501831,
62
- "eval_f1": 0.983208365019189,
63
- "eval_loss": 0.07458490133285522,
64
- "eval_precision": 0.9833696765629429,
65
- "eval_recall": 0.9831501831501831,
66
- "eval_runtime": 5.9419,
67
- "eval_samples_per_second": 229.726,
68
- "eval_steps_per_second": 28.779,
69
  "step": 426
70
  }
71
  ],
72
  "logging_steps": 500,
73
- "max_steps": 680,
74
  "num_input_tokens_seen": 0,
75
- "num_train_epochs": 8,
76
  "save_steps": 500,
77
  "stateful_callbacks": {
78
  "EarlyStoppingCallback": {
 
1
  {
2
+ "best_metric": 0.9897435897435898,
3
  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
4
  "epoch": 4.989751098096632,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.953235199825453,
15
+ "eval_loss": 0.13410410284996033,
16
+ "eval_precision": 0.9543176332312968,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.9191,
19
+ "eval_samples_per_second": 230.61,
20
+ "eval_steps_per_second": 28.89,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.96996336996337,
26
+ "eval_f1": 0.970275727358029,
27
+ "eval_loss": 0.08308757096529007,
28
+ "eval_precision": 0.9720059808561178,
29
+ "eval_recall": 0.96996336996337,
30
+ "eval_runtime": 5.9321,
31
+ "eval_samples_per_second": 230.105,
32
+ "eval_steps_per_second": 28.826,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
+ "eval_accuracy": 0.9846153846153847,
38
+ "eval_f1": 0.9845587007434289,
39
+ "eval_loss": 0.05695493519306183,
40
+ "eval_precision": 0.984652882646444,
41
+ "eval_recall": 0.9846153846153847,
42
+ "eval_runtime": 5.924,
43
+ "eval_samples_per_second": 230.421,
44
+ "eval_steps_per_second": 28.866,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
+ "eval_accuracy": 0.9897435897435898,
50
+ "eval_f1": 0.9897502348272303,
51
+ "eval_loss": 0.03400224819779396,
52
+ "eval_precision": 0.9897618176566864,
53
+ "eval_recall": 0.9897435897435898,
54
+ "eval_runtime": 5.9234,
55
+ "eval_samples_per_second": 230.441,
56
+ "eval_steps_per_second": 28.868,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
+ "eval_accuracy": 0.9875457875457876,
62
+ "eval_f1": 0.9876042969414931,
63
+ "eval_loss": 0.04599935933947563,
64
+ "eval_precision": 0.9879353582239604,
65
+ "eval_recall": 0.9875457875457876,
66
+ "eval_runtime": 5.9141,
67
+ "eval_samples_per_second": 230.803,
68
+ "eval_steps_per_second": 28.914,
69
  "step": 426
70
  }
71
  ],
72
  "logging_steps": 500,
73
+ "max_steps": 850,
74
  "num_input_tokens_seen": 0,
75
+ "num_train_epochs": 10,
76
  "save_steps": 500,
77
  "stateful_callbacks": {
78
  "EarlyStoppingCallback": {
checkpoint-426/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cda0bf828ccc04cd6d3fb7933f60f34ca3c8ba14b14579f9e878d688bc739b4a
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:831297954221509dc3f32e8eaf01789c3f660cf430e186799d52e58ec3b5b334
3
  size 5240
checkpoint-512/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbc5b2463f7b10d6accd90a38663b1fe5924ce417d20bd4c4b022491ab407a53
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35b0d90358beea477341c41eb5ba7259fabcc0922d7900d91362f0fbaf06bab2
3
  size 94763496
checkpoint-512/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00ec41f63df75118d702c2384056a8cc4b5a13080b78a48bdd542ffc79dc1c02
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:648b988b59d53cdfb9a307e0c1ecb64a428672a7b441f4145e8d3d009ae2cfbe
3
  size 189552570
checkpoint-512/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bcc97a747eb11a8dc86d1d122f7b8fac6f5b54e0a4e11d9bd187896e44dca8fe
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1f22cb39573891adcd854d571d182ed521927c0644cb49b42c5a9a0f0635791
3
  size 1064
checkpoint-512/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9860805860805861,
3
- "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-512",
4
  "epoch": 5.997071742313324,
5
  "eval_steps": 500,
6
  "global_step": 512,
@@ -10,88 +10,88 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9641025641025641,
14
- "eval_f1": 0.9637911305761953,
15
- "eval_loss": 0.12035853415727615,
16
- "eval_precision": 0.9640509308043554,
17
- "eval_recall": 0.9641025641025641,
18
- "eval_runtime": 6.052,
19
- "eval_samples_per_second": 225.545,
20
- "eval_steps_per_second": 28.255,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
- "eval_accuracy": 0.9772893772893773,
26
- "eval_f1": 0.9772624500008753,
27
- "eval_loss": 0.08473604917526245,
28
- "eval_precision": 0.9772470873644479,
29
- "eval_recall": 0.9772893772893773,
30
- "eval_runtime": 5.9068,
31
- "eval_samples_per_second": 231.09,
32
- "eval_steps_per_second": 28.95,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
- "eval_accuracy": 0.9765567765567765,
38
- "eval_f1": 0.9766464967450174,
39
- "eval_loss": 0.10245847702026367,
40
- "eval_precision": 0.9768621127754256,
41
- "eval_recall": 0.9765567765567765,
42
- "eval_runtime": 5.8911,
43
- "eval_samples_per_second": 231.706,
44
- "eval_steps_per_second": 29.027,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
- "eval_accuracy": 0.9831501831501831,
50
- "eval_f1": 0.9832333934847322,
51
- "eval_loss": 0.08685966581106186,
52
- "eval_precision": 0.9835305336122597,
53
- "eval_recall": 0.9831501831501831,
54
- "eval_runtime": 5.9568,
55
- "eval_samples_per_second": 229.152,
56
- "eval_steps_per_second": 28.707,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
- "eval_accuracy": 0.9831501831501831,
62
- "eval_f1": 0.983208365019189,
63
- "eval_loss": 0.07458490133285522,
64
- "eval_precision": 0.9833696765629429,
65
- "eval_recall": 0.9831501831501831,
66
- "eval_runtime": 5.9419,
67
- "eval_samples_per_second": 229.726,
68
- "eval_steps_per_second": 28.779,
69
  "step": 426
70
  },
71
  {
72
  "epoch": 5.856515373352855,
73
- "grad_norm": 0.01886621303856373,
74
- "learning_rate": 1.6360497736760383e-05,
75
- "loss": 0.0538,
76
  "step": 500
77
  },
78
  {
79
  "epoch": 5.997071742313324,
80
- "eval_accuracy": 0.9860805860805861,
81
- "eval_f1": 0.9860860332682386,
82
- "eval_loss": 0.08699370175600052,
83
- "eval_precision": 0.9860927746075414,
84
- "eval_recall": 0.9860805860805861,
85
- "eval_runtime": 5.9399,
86
- "eval_samples_per_second": 229.803,
87
- "eval_steps_per_second": 28.789,
88
  "step": 512
89
  }
90
  ],
91
  "logging_steps": 500,
92
- "max_steps": 680,
93
  "num_input_tokens_seen": 0,
94
- "num_train_epochs": 8,
95
  "save_steps": 500,
96
  "stateful_callbacks": {
97
  "EarlyStoppingCallback": {
 
1
  {
2
+ "best_metric": 0.9897435897435898,
3
+ "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
4
  "epoch": 5.997071742313324,
5
  "eval_steps": 500,
6
  "global_step": 512,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.953235199825453,
15
+ "eval_loss": 0.13410410284996033,
16
+ "eval_precision": 0.9543176332312968,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.9191,
19
+ "eval_samples_per_second": 230.61,
20
+ "eval_steps_per_second": 28.89,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.96996336996337,
26
+ "eval_f1": 0.970275727358029,
27
+ "eval_loss": 0.08308757096529007,
28
+ "eval_precision": 0.9720059808561178,
29
+ "eval_recall": 0.96996336996337,
30
+ "eval_runtime": 5.9321,
31
+ "eval_samples_per_second": 230.105,
32
+ "eval_steps_per_second": 28.826,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
+ "eval_accuracy": 0.9846153846153847,
38
+ "eval_f1": 0.9845587007434289,
39
+ "eval_loss": 0.05695493519306183,
40
+ "eval_precision": 0.984652882646444,
41
+ "eval_recall": 0.9846153846153847,
42
+ "eval_runtime": 5.924,
43
+ "eval_samples_per_second": 230.421,
44
+ "eval_steps_per_second": 28.866,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
+ "eval_accuracy": 0.9897435897435898,
50
+ "eval_f1": 0.9897502348272303,
51
+ "eval_loss": 0.03400224819779396,
52
+ "eval_precision": 0.9897618176566864,
53
+ "eval_recall": 0.9897435897435898,
54
+ "eval_runtime": 5.9234,
55
+ "eval_samples_per_second": 230.441,
56
+ "eval_steps_per_second": 28.868,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
+ "eval_accuracy": 0.9875457875457876,
62
+ "eval_f1": 0.9876042969414931,
63
+ "eval_loss": 0.04599935933947563,
64
+ "eval_precision": 0.9879353582239604,
65
+ "eval_recall": 0.9875457875457876,
66
+ "eval_runtime": 5.9141,
67
+ "eval_samples_per_second": 230.803,
68
+ "eval_steps_per_second": 28.914,
69
  "step": 426
70
  },
71
  {
72
  "epoch": 5.856515373352855,
73
+ "grad_norm": 0.020362911745905876,
74
+ "learning_rate": 1.819507083000514e-05,
75
+ "loss": 0.0707,
76
  "step": 500
77
  },
78
  {
79
  "epoch": 5.997071742313324,
80
+ "eval_accuracy": 0.9897435897435898,
81
+ "eval_f1": 0.9897761336599745,
82
+ "eval_loss": 0.04312068223953247,
83
+ "eval_precision": 0.9899308989239506,
84
+ "eval_recall": 0.9897435897435898,
85
+ "eval_runtime": 5.5776,
86
+ "eval_samples_per_second": 244.727,
87
+ "eval_steps_per_second": 30.658,
88
  "step": 512
89
  }
90
  ],
91
  "logging_steps": 500,
92
+ "max_steps": 850,
93
  "num_input_tokens_seen": 0,
94
+ "num_train_epochs": 10,
95
  "save_steps": 500,
96
  "stateful_callbacks": {
97
  "EarlyStoppingCallback": {
checkpoint-512/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cda0bf828ccc04cd6d3fb7933f60f34ca3c8ba14b14579f9e878d688bc739b4a
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:831297954221509dc3f32e8eaf01789c3f660cf430e186799d52e58ec3b5b334
3
  size 5240
checkpoint-597/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a064606432f81dfcabef436b3a7746c96408c18ddc57930d2e91972b830e997f
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c617973600d573c483f588a59837c6d45814ca8e16c64575f5523b65246f0c5e
3
  size 94763496
checkpoint-597/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84091c5d2d0db5e72458d1db7aef4f39da72483fa57f4cd28ecc4085a3dfd425
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86268f89454cc35e41155e346d8e2ca8d5a9b6f579d1fef2bbfc8b823eace3b9
3
  size 189552570
checkpoint-597/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbae7c9f313f104f989b156afed3a79758bf4cf1949ca702f760fa941bede2bf
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c216d743853a404a50b6a598e3c4bf36fa1dc8935b24320ebe609a9c5c9b437
3
  size 1064
checkpoint-597/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9860805860805861,
3
- "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-512",
4
  "epoch": 6.992679355783309,
5
  "eval_steps": 500,
6
  "global_step": 597,
@@ -10,100 +10,100 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9641025641025641,
14
- "eval_f1": 0.9637911305761953,
15
- "eval_loss": 0.12035853415727615,
16
- "eval_precision": 0.9640509308043554,
17
- "eval_recall": 0.9641025641025641,
18
- "eval_runtime": 6.052,
19
- "eval_samples_per_second": 225.545,
20
- "eval_steps_per_second": 28.255,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
- "eval_accuracy": 0.9772893772893773,
26
- "eval_f1": 0.9772624500008753,
27
- "eval_loss": 0.08473604917526245,
28
- "eval_precision": 0.9772470873644479,
29
- "eval_recall": 0.9772893772893773,
30
- "eval_runtime": 5.9068,
31
- "eval_samples_per_second": 231.09,
32
- "eval_steps_per_second": 28.95,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
- "eval_accuracy": 0.9765567765567765,
38
- "eval_f1": 0.9766464967450174,
39
- "eval_loss": 0.10245847702026367,
40
- "eval_precision": 0.9768621127754256,
41
- "eval_recall": 0.9765567765567765,
42
- "eval_runtime": 5.8911,
43
- "eval_samples_per_second": 231.706,
44
- "eval_steps_per_second": 29.027,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
- "eval_accuracy": 0.9831501831501831,
50
- "eval_f1": 0.9832333934847322,
51
- "eval_loss": 0.08685966581106186,
52
- "eval_precision": 0.9835305336122597,
53
- "eval_recall": 0.9831501831501831,
54
- "eval_runtime": 5.9568,
55
- "eval_samples_per_second": 229.152,
56
- "eval_steps_per_second": 28.707,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
- "eval_accuracy": 0.9831501831501831,
62
- "eval_f1": 0.983208365019189,
63
- "eval_loss": 0.07458490133285522,
64
- "eval_precision": 0.9833696765629429,
65
- "eval_recall": 0.9831501831501831,
66
- "eval_runtime": 5.9419,
67
- "eval_samples_per_second": 229.726,
68
- "eval_steps_per_second": 28.779,
69
  "step": 426
70
  },
71
  {
72
  "epoch": 5.856515373352855,
73
- "grad_norm": 0.01886621303856373,
74
- "learning_rate": 1.6360497736760383e-05,
75
- "loss": 0.0538,
76
  "step": 500
77
  },
78
  {
79
  "epoch": 5.997071742313324,
80
- "eval_accuracy": 0.9860805860805861,
81
- "eval_f1": 0.9860860332682386,
82
- "eval_loss": 0.08699370175600052,
83
- "eval_precision": 0.9860927746075414,
84
- "eval_recall": 0.9860805860805861,
85
- "eval_runtime": 5.9399,
86
- "eval_samples_per_second": 229.803,
87
- "eval_steps_per_second": 28.789,
88
  "step": 512
89
  },
90
  {
91
  "epoch": 6.992679355783309,
92
- "eval_accuracy": 0.9860805860805861,
93
- "eval_f1": 0.9860860332682386,
94
- "eval_loss": 0.08903729915618896,
95
- "eval_precision": 0.9860927746075414,
96
- "eval_recall": 0.9860805860805861,
97
- "eval_runtime": 5.9207,
98
- "eval_samples_per_second": 230.546,
99
- "eval_steps_per_second": 28.882,
100
  "step": 597
101
  }
102
  ],
103
  "logging_steps": 500,
104
- "max_steps": 680,
105
  "num_input_tokens_seen": 0,
106
- "num_train_epochs": 8,
107
  "save_steps": 500,
108
  "stateful_callbacks": {
109
  "EarlyStoppingCallback": {
@@ -121,7 +121,7 @@
121
  "should_evaluate": false,
122
  "should_log": false,
123
  "should_save": true,
124
- "should_training_stop": false
125
  },
126
  "attributes": {}
127
  }
 
1
  {
2
+ "best_metric": 0.9897435897435898,
3
+ "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
4
  "epoch": 6.992679355783309,
5
  "eval_steps": 500,
6
  "global_step": 597,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.953235199825453,
15
+ "eval_loss": 0.13410410284996033,
16
+ "eval_precision": 0.9543176332312968,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.9191,
19
+ "eval_samples_per_second": 230.61,
20
+ "eval_steps_per_second": 28.89,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.96996336996337,
26
+ "eval_f1": 0.970275727358029,
27
+ "eval_loss": 0.08308757096529007,
28
+ "eval_precision": 0.9720059808561178,
29
+ "eval_recall": 0.96996336996337,
30
+ "eval_runtime": 5.9321,
31
+ "eval_samples_per_second": 230.105,
32
+ "eval_steps_per_second": 28.826,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
+ "eval_accuracy": 0.9846153846153847,
38
+ "eval_f1": 0.9845587007434289,
39
+ "eval_loss": 0.05695493519306183,
40
+ "eval_precision": 0.984652882646444,
41
+ "eval_recall": 0.9846153846153847,
42
+ "eval_runtime": 5.924,
43
+ "eval_samples_per_second": 230.421,
44
+ "eval_steps_per_second": 28.866,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
+ "eval_accuracy": 0.9897435897435898,
50
+ "eval_f1": 0.9897502348272303,
51
+ "eval_loss": 0.03400224819779396,
52
+ "eval_precision": 0.9897618176566864,
53
+ "eval_recall": 0.9897435897435898,
54
+ "eval_runtime": 5.9234,
55
+ "eval_samples_per_second": 230.441,
56
+ "eval_steps_per_second": 28.868,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
+ "eval_accuracy": 0.9875457875457876,
62
+ "eval_f1": 0.9876042969414931,
63
+ "eval_loss": 0.04599935933947563,
64
+ "eval_precision": 0.9879353582239604,
65
+ "eval_recall": 0.9875457875457876,
66
+ "eval_runtime": 5.9141,
67
+ "eval_samples_per_second": 230.803,
68
+ "eval_steps_per_second": 28.914,
69
  "step": 426
70
  },
71
  {
72
  "epoch": 5.856515373352855,
73
+ "grad_norm": 0.020362911745905876,
74
+ "learning_rate": 1.819507083000514e-05,
75
+ "loss": 0.0707,
76
  "step": 500
77
  },
78
  {
79
  "epoch": 5.997071742313324,
80
+ "eval_accuracy": 0.9897435897435898,
81
+ "eval_f1": 0.9897761336599745,
82
+ "eval_loss": 0.04312068223953247,
83
+ "eval_precision": 0.9899308989239506,
84
+ "eval_recall": 0.9897435897435898,
85
+ "eval_runtime": 5.5776,
86
+ "eval_samples_per_second": 244.727,
87
+ "eval_steps_per_second": 30.658,
88
  "step": 512
89
  },
90
  {
91
  "epoch": 6.992679355783309,
92
+ "eval_accuracy": 0.9882783882783883,
93
+ "eval_f1": 0.9882934987415589,
94
+ "eval_loss": 0.035927049815654755,
95
+ "eval_precision": 0.9883282714000319,
96
+ "eval_recall": 0.9882783882783883,
97
+ "eval_runtime": 5.5806,
98
+ "eval_samples_per_second": 244.596,
99
+ "eval_steps_per_second": 30.642,
100
  "step": 597
101
  }
102
  ],
103
  "logging_steps": 500,
104
+ "max_steps": 850,
105
  "num_input_tokens_seen": 0,
106
+ "num_train_epochs": 10,
107
  "save_steps": 500,
108
  "stateful_callbacks": {
109
  "EarlyStoppingCallback": {
 
121
  "should_evaluate": false,
122
  "should_log": false,
123
  "should_save": true,
124
+ "should_training_stop": true
125
  },
126
  "attributes": {}
127
  }
checkpoint-597/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cda0bf828ccc04cd6d3fb7933f60f34ca3c8ba14b14579f9e878d688bc739b4a
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:831297954221509dc3f32e8eaf01789c3f660cf430e186799d52e58ec3b5b334
3
  size 5240
checkpoint-85/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a15277aa4797964b12aaedf5acf9218acf9f11597a299deaf3a64bad8d89176e
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:735ade2638b1f118fe459d58e0f846d8676adb708417e44d45e5c5631286bd6c
3
  size 94763496
checkpoint-85/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9c4d0328f867e3a4371326367364a334fc34c6ecaba4f27c44bae6d943a3f5e
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9c2df0704bbd0ae60f95b2890a8b3ca3655b01d98a8e15e46e75396add56c28
3
  size 189552570
checkpoint-85/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a3200599f03a01d89a474fcdd8a567058cd33b2f50dde928b44d422ff5012f0
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:627e28ee33138f33050cb3ea94003427c4a362d22084d2243ecd2a8541bf03ff
3
  size 1064
checkpoint-85/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.9641025641025641,
3
  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-85",
4
  "epoch": 0.9956076134699854,
5
  "eval_steps": 500,
@@ -10,21 +10,21 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9641025641025641,
14
- "eval_f1": 0.9637911305761953,
15
- "eval_loss": 0.12035853415727615,
16
- "eval_precision": 0.9640509308043554,
17
- "eval_recall": 0.9641025641025641,
18
- "eval_runtime": 6.052,
19
- "eval_samples_per_second": 225.545,
20
- "eval_steps_per_second": 28.255,
21
  "step": 85
22
  }
23
  ],
24
  "logging_steps": 500,
25
- "max_steps": 680,
26
  "num_input_tokens_seen": 0,
27
- "num_train_epochs": 8,
28
  "save_steps": 500,
29
  "stateful_callbacks": {
30
  "EarlyStoppingCallback": {
 
1
  {
2
+ "best_metric": 0.9538461538461539,
3
  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-85",
4
  "epoch": 0.9956076134699854,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.953235199825453,
15
+ "eval_loss": 0.13410410284996033,
16
+ "eval_precision": 0.9543176332312968,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.9191,
19
+ "eval_samples_per_second": 230.61,
20
+ "eval_steps_per_second": 28.89,
21
  "step": 85
22
  }
23
  ],
24
  "logging_steps": 500,
25
+ "max_steps": 850,
26
  "num_input_tokens_seen": 0,
27
+ "num_train_epochs": 10,
28
  "save_steps": 500,
29
  "stateful_callbacks": {
30
  "EarlyStoppingCallback": {
checkpoint-85/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cda0bf828ccc04cd6d3fb7933f60f34ca3c8ba14b14579f9e878d688bc739b4a
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:831297954221509dc3f32e8eaf01789c3f660cf430e186799d52e58ec3b5b334
3
  size 5240
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbc5b2463f7b10d6accd90a38663b1fe5924ce417d20bd4c4b022491ab407a53
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:937ffa1cb79f16f4e7753ea842c3e32fe34e525562027e5b33ce48fc4b308a82
3
  size 94763496
runs/Sep08_20-15-47_ubumarcos/events.out.tfevents.1725819348.ubumarcos ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3acac0f35b9d995564af973913d52663295aac3c4883be89bc110f97f39bcd36
3
+ size 9711
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cda0bf828ccc04cd6d3fb7933f60f34ca3c8ba14b14579f9e878d688bc739b4a
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:831297954221509dc3f32e8eaf01789c3f660cf430e186799d52e58ec3b5b334
3
  size 5240