Marcos12886 committed on
Commit
9487b76
1 Parent(s): be8b76f

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. README.md +16 -10
  2. checkpoint-170/config.json +0 -4
  3. checkpoint-170/model.safetensors +1 -1
  4. checkpoint-170/optimizer.pt +1 -1
  5. checkpoint-170/scheduler.pt +1 -1
  6. checkpoint-170/trainer_state.json +20 -20
  7. checkpoint-170/training_args.bin +1 -1
  8. checkpoint-256/config.json +0 -4
  9. checkpoint-256/model.safetensors +1 -1
  10. checkpoint-256/optimizer.pt +1 -1
  11. checkpoint-256/scheduler.pt +1 -1
  12. checkpoint-256/trainer_state.json +28 -28
  13. checkpoint-256/training_args.bin +1 -1
  14. checkpoint-341/config.json +0 -4
  15. checkpoint-341/model.safetensors +1 -1
  16. checkpoint-341/optimizer.pt +1 -1
  17. checkpoint-341/trainer_state.json +32 -32
  18. checkpoint-341/training_args.bin +1 -1
  19. checkpoint-426/config.json +0 -4
  20. checkpoint-426/model.safetensors +1 -1
  21. checkpoint-426/optimizer.pt +1 -1
  22. checkpoint-426/scheduler.pt +1 -1
  23. checkpoint-426/trainer_state.json +44 -44
  24. checkpoint-426/training_args.bin +1 -1
  25. checkpoint-512/config.json +0 -4
  26. checkpoint-512/model.safetensors +1 -1
  27. checkpoint-512/optimizer.pt +1 -1
  28. checkpoint-512/scheduler.pt +1 -1
  29. checkpoint-512/trainer_state.json +51 -51
  30. checkpoint-512/training_args.bin +1 -1
  31. checkpoint-597/config.json +0 -4
  32. checkpoint-597/model.safetensors +1 -1
  33. checkpoint-597/optimizer.pt +1 -1
  34. checkpoint-597/scheduler.pt +1 -1
  35. checkpoint-597/trainer_state.json +60 -60
  36. checkpoint-597/training_args.bin +1 -1
  37. checkpoint-683/config.json +1 -4
  38. checkpoint-683/model.safetensors +1 -1
  39. checkpoint-683/optimizer.pt +1 -1
  40. checkpoint-683/scheduler.pt +1 -1
  41. checkpoint-683/trainer_state.json +69 -45
  42. checkpoint-683/training_args.bin +1 -1
  43. checkpoint-768/config.json +1 -4
  44. checkpoint-768/model.safetensors +1 -1
  45. checkpoint-768/optimizer.pt +1 -1
  46. checkpoint-768/scheduler.pt +1 -1
  47. checkpoint-768/trainer_state.json +78 -51
  48. checkpoint-768/training_args.bin +1 -1
  49. checkpoint-85/config.json +0 -4
  50. checkpoint-85/model.safetensors +1 -1
README.md CHANGED
@@ -21,11 +21,11 @@ should probably proofread and complete it, then remove this comment. -->
21
 
22
  This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on an unknown dataset.
23
  It achieves the following results on the evaluation set:
24
- - Loss: 0.0625
25
- - Accuracy: 0.9824
26
- - Precision: 0.9825
27
- - Recall: 0.9824
28
- - F1: 0.9824
29
 
30
  ## Model description
31
 
@@ -53,16 +53,22 @@ The following hyperparameters were used during training:
53
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
54
  - lr_scheduler_type: cosine
55
  - lr_scheduler_warmup_ratio: 0.001
56
- - num_epochs: 4
57
 
58
  ### Training results
59
 
60
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | Precision | Recall | F1 |
61
  |:-------------:|:------:|:----:|:---------------:|:--------:|:---------:|:------:|:------:|
62
- | No log | 0.9956 | 85 | 0.1378 | 0.9546 | 0.9543 | 0.9546 | 0.9544 |
63
- | No log | 1.9912 | 170 | 0.0802 | 0.9714 | 0.9713 | 0.9714 | 0.9714 |
64
- | No log | 2.9985 | 256 | 0.0682 | 0.9780 | 0.9783 | 0.9780 | 0.9781 |
65
- | No log | 3.9824 | 340 | 0.0625 | 0.9824 | 0.9825 | 0.9824 | 0.9824 |
 
 
 
 
 
 
66
 
67
 
68
  ### Framework versions
 
21
 
22
  This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on an unknown dataset.
23
  It achieves the following results on the evaluation set:
24
+ - Loss: 0.0338
25
+ - Accuracy: 0.9912
26
+ - Precision: 0.9912
27
+ - Recall: 0.9912
28
+ - F1: 0.9912
29
 
30
  ## Model description
31
 
 
53
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
54
  - lr_scheduler_type: cosine
55
  - lr_scheduler_warmup_ratio: 0.001
56
+ - num_epochs: 10
57
 
58
  ### Training results
59
 
60
  | Training Loss | Epoch | Step | Validation Loss | Accuracy | Precision | Recall | F1 |
61
  |:-------------:|:------:|:----:|:---------------:|:--------:|:---------:|:------:|:------:|
62
+ | No log | 0.9956 | 85 | 0.1197 | 0.9538 | 0.9535 | 0.9538 | 0.9536 |
63
+ | No log | 1.9912 | 170 | 0.0601 | 0.9832 | 0.9831 | 0.9832 | 0.9831 |
64
+ | No log | 2.9985 | 256 | 0.0506 | 0.9868 | 0.9868 | 0.9868 | 0.9868 |
65
+ | No log | 3.9941 | 341 | 0.0461 | 0.9861 | 0.9864 | 0.9861 | 0.9862 |
66
+ | No log | 4.9898 | 426 | 0.0439 | 0.9890 | 0.9891 | 0.9890 | 0.9890 |
67
+ | 0.0779 | 5.9971 | 512 | 0.0396 | 0.9905 | 0.9905 | 0.9905 | 0.9905 |
68
+ | 0.0779 | 6.9927 | 597 | 0.0350 | 0.9919 | 0.9919 | 0.9919 | 0.9919 |
69
+ | 0.0779 | 8.0 | 683 | 0.0335 | 0.9912 | 0.9912 | 0.9912 | 0.9912 |
70
+ | 0.0779 | 8.9956 | 768 | 0.0337 | 0.9912 | 0.9912 | 0.9912 | 0.9912 |
71
+ | 0.0779 | 9.9561 | 850 | 0.0338 | 0.9912 | 0.9912 | 0.9912 | 0.9912 |
72
 
73
 
74
  ### Framework versions
checkpoint-170/config.json CHANGED
@@ -55,10 +55,6 @@
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
58
- "label2id": {
59
- "crying": 0,
60
- "no_crying": 1
61
- },
62
  "layer_norm_eps": 1e-05,
63
  "layerdrop": 0.0,
64
  "mask_feature_length": 10,
 
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
 
 
 
 
58
  "layer_norm_eps": 1e-05,
59
  "layerdrop": 0.0,
60
  "mask_feature_length": 10,
checkpoint-170/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8a90553b00c4439fad5a7ed1ff0a9f76e60e707d76e5d455fd77360dff39ae0
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c27ce70effb26d2c4fae3a9e5f9435a7adf1d9096be67f3e04eaf7266135f148
3
  size 94763496
checkpoint-170/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2dba3cd8b01d3153e53635bf2a218b801d4fb4cfcf7a5f02fc1c0e0d267aeace
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f521c92737364b558a7a1f423ef220dcbbcf0650e982c3e4d1b202ec007872c8
3
  size 189552570
checkpoint-170/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44565a4b1d8937c55d485ff9cf817bf33c36c26adc047340853e15a70d1a023d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba2c60537414c36d76239817fe1c8be075bed144e4b9d191a70b981deda17823
3
  size 1064
checkpoint-170/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9714285714285714,
3
- "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-170",
4
  "epoch": 1.9912152269399708,
5
  "eval_steps": 500,
6
  "global_step": 170,
@@ -10,33 +10,33 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9545787545787546,
14
- "eval_f1": 0.9543924849872077,
15
- "eval_loss": 0.13782845437526703,
16
- "eval_precision": 0.9543323172404159,
17
- "eval_recall": 0.9545787545787546,
18
- "eval_runtime": 6.1437,
19
- "eval_samples_per_second": 222.18,
20
- "eval_steps_per_second": 27.834,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
- "eval_accuracy": 0.9714285714285714,
26
- "eval_f1": 0.9713707024010776,
27
- "eval_loss": 0.0802176371216774,
28
- "eval_precision": 0.9713449610559759,
29
- "eval_recall": 0.9714285714285714,
30
- "eval_runtime": 6.0836,
31
- "eval_samples_per_second": 224.373,
32
- "eval_steps_per_second": 28.108,
33
  "step": 170
34
  }
35
  ],
36
  "logging_steps": 500,
37
- "max_steps": 340,
38
  "num_input_tokens_seen": 0,
39
- "num_train_epochs": 4,
40
  "save_steps": 500,
41
  "stateful_callbacks": {
42
  "EarlyStoppingCallback": {
 
1
  {
2
+ "best_metric": 0.9831501831501831,
3
+ "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-170",
4
  "epoch": 1.9912152269399708,
5
  "eval_steps": 500,
6
  "global_step": 170,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.9535883665206972,
15
+ "eval_loss": 0.11965569853782654,
16
+ "eval_precision": 0.9535470731605858,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.8661,
19
+ "eval_samples_per_second": 232.691,
20
+ "eval_steps_per_second": 29.15,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.9831501831501831,
26
+ "eval_f1": 0.983143153392684,
27
+ "eval_loss": 0.060115572065114975,
28
+ "eval_precision": 0.9831374404084774,
29
+ "eval_recall": 0.9831501831501831,
30
+ "eval_runtime": 5.9254,
31
+ "eval_samples_per_second": 230.365,
32
+ "eval_steps_per_second": 28.859,
33
  "step": 170
34
  }
35
  ],
36
  "logging_steps": 500,
37
+ "max_steps": 850,
38
  "num_input_tokens_seen": 0,
39
+ "num_train_epochs": 10,
40
  "save_steps": 500,
41
  "stateful_callbacks": {
42
  "EarlyStoppingCallback": {
checkpoint-170/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7bd8e997c05f23ae464180f8e5e9f881e9c68322e4fcd3f855e79e2e5d54fbb
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
3
  size 5240
checkpoint-256/config.json CHANGED
@@ -55,10 +55,6 @@
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
58
- "label2id": {
59
- "crying": 0,
60
- "no_crying": 1
61
- },
62
  "layer_norm_eps": 1e-05,
63
  "layerdrop": 0.0,
64
  "mask_feature_length": 10,
 
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
 
 
 
 
58
  "layer_norm_eps": 1e-05,
59
  "layerdrop": 0.0,
60
  "mask_feature_length": 10,
checkpoint-256/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18d5013bf626b187ac7bbd42a7fb1a1b824c821cd062c951de17f19d9fb95944
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2992b8dfd27781b5920e6b800dd0bec2a8809a5eb8c0508b6726dd68807c3b6d
3
  size 94763496
checkpoint-256/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7187577ead7a6d35f35a5dc44c0b76b32036040837b41821bc67970a2dde3ed2
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb0f801198c29f1cc11cf39d019a185562336bfbfdee4056f15cc25e0604767a
3
  size 189552570
checkpoint-256/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eed9846f2cf239e8810dae264b4e0fe505a115ec40d5b4f9abdb240e9e0a0fae
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ea8c99bcd3f4c186db34ca4e9cbe89b586ea3bd6cf9703b17e9ec1f6c1ff961
3
  size 1064
checkpoint-256/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.978021978021978,
3
- "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-256",
4
  "epoch": 2.998535871156662,
5
  "eval_steps": 500,
6
  "global_step": 256,
@@ -10,45 +10,45 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9545787545787546,
14
- "eval_f1": 0.9543924849872077,
15
- "eval_loss": 0.13782845437526703,
16
- "eval_precision": 0.9543323172404159,
17
- "eval_recall": 0.9545787545787546,
18
- "eval_runtime": 6.1437,
19
- "eval_samples_per_second": 222.18,
20
- "eval_steps_per_second": 27.834,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
- "eval_accuracy": 0.9714285714285714,
26
- "eval_f1": 0.9713707024010776,
27
- "eval_loss": 0.0802176371216774,
28
- "eval_precision": 0.9713449610559759,
29
- "eval_recall": 0.9714285714285714,
30
- "eval_runtime": 6.0836,
31
- "eval_samples_per_second": 224.373,
32
- "eval_steps_per_second": 28.108,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
- "eval_accuracy": 0.978021978021978,
38
- "eval_f1": 0.9781077738703647,
39
- "eval_loss": 0.06824816763401031,
40
- "eval_precision": 0.9783204609221348,
41
- "eval_recall": 0.978021978021978,
42
- "eval_runtime": 6.0791,
43
- "eval_samples_per_second": 224.54,
44
- "eval_steps_per_second": 28.129,
45
  "step": 256
46
  }
47
  ],
48
  "logging_steps": 500,
49
- "max_steps": 340,
50
  "num_input_tokens_seen": 0,
51
- "num_train_epochs": 4,
52
  "save_steps": 500,
53
  "stateful_callbacks": {
54
  "EarlyStoppingCallback": {
 
1
  {
2
+ "best_metric": 0.9868131868131869,
3
+ "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-256",
4
  "epoch": 2.998535871156662,
5
  "eval_steps": 500,
6
  "global_step": 256,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.9535883665206972,
15
+ "eval_loss": 0.11965569853782654,
16
+ "eval_precision": 0.9535470731605858,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.8661,
19
+ "eval_samples_per_second": 232.691,
20
+ "eval_steps_per_second": 29.15,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.9831501831501831,
26
+ "eval_f1": 0.983143153392684,
27
+ "eval_loss": 0.060115572065114975,
28
+ "eval_precision": 0.9831374404084774,
29
+ "eval_recall": 0.9831501831501831,
30
+ "eval_runtime": 5.9254,
31
+ "eval_samples_per_second": 230.365,
32
+ "eval_steps_per_second": 28.859,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
+ "eval_accuracy": 0.9868131868131869,
38
+ "eval_f1": 0.9868241092241091,
39
+ "eval_loss": 0.05060575157403946,
40
+ "eval_precision": 0.9868403029537207,
41
+ "eval_recall": 0.9868131868131869,
42
+ "eval_runtime": 5.9299,
43
+ "eval_samples_per_second": 230.189,
44
+ "eval_steps_per_second": 28.837,
45
  "step": 256
46
  }
47
  ],
48
  "logging_steps": 500,
49
+ "max_steps": 850,
50
  "num_input_tokens_seen": 0,
51
+ "num_train_epochs": 10,
52
  "save_steps": 500,
53
  "stateful_callbacks": {
54
  "EarlyStoppingCallback": {
checkpoint-256/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7bd8e997c05f23ae464180f8e5e9f881e9c68322e4fcd3f855e79e2e5d54fbb
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
3
  size 5240
checkpoint-341/config.json CHANGED
@@ -55,10 +55,6 @@
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
58
- "label2id": {
59
- "crying": 0,
60
- "no_crying": 1
61
- },
62
  "layer_norm_eps": 1e-05,
63
  "layerdrop": 0.0,
64
  "mask_feature_length": 10,
 
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
 
 
 
 
58
  "layer_norm_eps": 1e-05,
59
  "layerdrop": 0.0,
60
  "mask_feature_length": 10,
checkpoint-341/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4aef887b699e0e2fffd8fb2dabc3a3ee00a823581110ae055322fc7dccddae5f
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3fb881f587c38faf027d9d2f92c1142607ce7f334b76baccc3fafe76fbc4f38
3
  size 94763496
checkpoint-341/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f9a8acfee398336615756edc66f296d1f801d2fde4edac691df5318d5bad0e5
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62cf0c2fa4abd219e7fa80805ad290927ba54a46ecf6203e78bc102ea268400c
3
  size 189552570
checkpoint-341/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9875457875457876,
3
- "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
4
  "epoch": 3.994143484626647,
5
  "eval_steps": 500,
6
  "global_step": 341,
@@ -10,50 +10,50 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9663003663003663,
14
- "eval_f1": 0.9661425019393345,
15
- "eval_loss": 0.10625720024108887,
16
- "eval_precision": 0.966167198143384,
17
- "eval_recall": 0.9663003663003663,
18
- "eval_runtime": 6.2148,
19
- "eval_samples_per_second": 219.638,
20
- "eval_steps_per_second": 27.515,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
- "eval_accuracy": 0.9824175824175824,
26
- "eval_f1": 0.9824569651195038,
27
- "eval_loss": 0.06455090641975403,
28
- "eval_precision": 0.9825418778671476,
29
- "eval_recall": 0.9824175824175824,
30
- "eval_runtime": 5.7635,
31
- "eval_samples_per_second": 236.835,
32
- "eval_steps_per_second": 29.669,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
  "eval_accuracy": 0.9868131868131869,
38
- "eval_f1": 0.9868427238396278,
39
- "eval_loss": 0.04568345472216606,
40
- "eval_precision": 0.98691808355097,
41
  "eval_recall": 0.9868131868131869,
42
- "eval_runtime": 6.1234,
43
- "eval_samples_per_second": 222.916,
44
- "eval_steps_per_second": 27.926,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
- "eval_accuracy": 0.9875457875457876,
50
- "eval_f1": 0.9875962963533335,
51
- "eval_loss": 0.049539219588041306,
52
- "eval_precision": 0.9877998892958556,
53
- "eval_recall": 0.9875457875457876,
54
- "eval_runtime": 6.1353,
55
- "eval_samples_per_second": 222.481,
56
- "eval_steps_per_second": 27.871,
57
  "step": 341
58
  }
59
  ],
 
1
  {
2
+ "best_metric": 0.9868131868131869,
3
+ "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-256",
4
  "epoch": 3.994143484626647,
5
  "eval_steps": 500,
6
  "global_step": 341,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.9535883665206972,
15
+ "eval_loss": 0.11965569853782654,
16
+ "eval_precision": 0.9535470731605858,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.8661,
19
+ "eval_samples_per_second": 232.691,
20
+ "eval_steps_per_second": 29.15,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.9831501831501831,
26
+ "eval_f1": 0.983143153392684,
27
+ "eval_loss": 0.060115572065114975,
28
+ "eval_precision": 0.9831374404084774,
29
+ "eval_recall": 0.9831501831501831,
30
+ "eval_runtime": 5.9254,
31
+ "eval_samples_per_second": 230.365,
32
+ "eval_steps_per_second": 28.859,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
  "eval_accuracy": 0.9868131868131869,
38
+ "eval_f1": 0.9868241092241091,
39
+ "eval_loss": 0.05060575157403946,
40
+ "eval_precision": 0.9868403029537207,
41
  "eval_recall": 0.9868131868131869,
42
+ "eval_runtime": 5.9299,
43
+ "eval_samples_per_second": 230.189,
44
+ "eval_steps_per_second": 28.837,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
+ "eval_accuracy": 0.9860805860805861,
50
+ "eval_f1": 0.9861535269385863,
51
+ "eval_loss": 0.04610973969101906,
52
+ "eval_precision": 0.986445121171901,
53
+ "eval_recall": 0.9860805860805861,
54
+ "eval_runtime": 5.9428,
55
+ "eval_samples_per_second": 229.69,
56
+ "eval_steps_per_second": 28.774,
57
  "step": 341
58
  }
59
  ],
checkpoint-341/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:325406b343874b92345e9a863970ee7cd441131f2850f47ab026ed810d19a88c
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
3
  size 5240
checkpoint-426/config.json CHANGED
@@ -55,10 +55,6 @@
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
58
- "label2id": {
59
- "crying": 0,
60
- "no_crying": 1
61
- },
62
  "layer_norm_eps": 1e-05,
63
  "layerdrop": 0.0,
64
  "mask_feature_length": 10,
 
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
 
 
 
 
58
  "layer_norm_eps": 1e-05,
59
  "layerdrop": 0.0,
60
  "mask_feature_length": 10,
checkpoint-426/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ccd0853b18fcef29f6c50370c40938c3fc157e6d6ab4f5a8cc0ee4de4c2a330
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f21392d62c0aae2cb86ef601a6fdd136f97139074d9fc1a5418821cfd21d8f2f
3
  size 94763496
checkpoint-426/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:58cf1896c9f8575d9e790921f864e581859c2dd6014460c20f2981f52787a4a4
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54aacdf3b8335705d217fdd88584f914b41fdc67436f327708a19652d4774b8e
3
  size 189552570
checkpoint-426/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77da8d31fe5105cdaffd1de28e960ad7041d43ef167667465d3bd1e966ae27b0
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:579ef0f1564878cc661672a4c8ce1e561a689fa403a5862a5af2e3ad39ed51e9
3
  size 1064
checkpoint-426/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.991941391941392,
3
- "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
4
  "epoch": 4.989751098096632,
5
  "eval_steps": 500,
6
  "global_step": 426,
@@ -10,69 +10,69 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9597069597069597,
14
- "eval_f1": 0.9599836188656065,
15
- "eval_loss": 0.12706419825553894,
16
- "eval_precision": 0.960694098126733,
17
- "eval_recall": 0.9597069597069597,
18
- "eval_runtime": 6.1839,
19
- "eval_samples_per_second": 220.733,
20
- "eval_steps_per_second": 27.652,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
- "eval_accuracy": 0.9787545787545787,
26
- "eval_f1": 0.9788099592207686,
27
- "eval_loss": 0.07009062170982361,
28
- "eval_precision": 0.9789268917610887,
29
- "eval_recall": 0.9787545787545787,
30
- "eval_runtime": 6.2624,
31
- "eval_samples_per_second": 217.969,
32
- "eval_steps_per_second": 27.306,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
- "eval_accuracy": 0.9831501831501831,
38
- "eval_f1": 0.9831941055888854,
39
- "eval_loss": 0.06720960885286331,
40
- "eval_precision": 0.9832999772248476,
41
- "eval_recall": 0.9831501831501831,
42
- "eval_runtime": 5.9845,
43
- "eval_samples_per_second": 228.09,
44
- "eval_steps_per_second": 28.574,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
- "eval_accuracy": 0.991941391941392,
50
- "eval_f1": 0.9919444380146174,
51
- "eval_loss": 0.04145079106092453,
52
- "eval_precision": 0.9919487758943655,
53
- "eval_recall": 0.991941391941392,
54
- "eval_runtime": 6.1222,
55
- "eval_samples_per_second": 222.958,
56
- "eval_steps_per_second": 27.931,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
- "eval_accuracy": 0.991941391941392,
62
- "eval_f1": 0.9919444380146174,
63
- "eval_loss": 0.037522196769714355,
64
- "eval_precision": 0.9919487758943655,
65
- "eval_recall": 0.991941391941392,
66
- "eval_runtime": 6.1601,
67
- "eval_samples_per_second": 221.586,
68
- "eval_steps_per_second": 27.759,
69
  "step": 426
70
  }
71
  ],
72
  "logging_steps": 500,
73
- "max_steps": 510,
74
  "num_input_tokens_seen": 0,
75
- "num_train_epochs": 6,
76
  "save_steps": 500,
77
  "stateful_callbacks": {
78
  "EarlyStoppingCallback": {
 
1
  {
2
+ "best_metric": 0.989010989010989,
3
+ "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-426",
4
  "epoch": 4.989751098096632,
5
  "eval_steps": 500,
6
  "global_step": 426,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.9535883665206972,
15
+ "eval_loss": 0.11965569853782654,
16
+ "eval_precision": 0.9535470731605858,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.8661,
19
+ "eval_samples_per_second": 232.691,
20
+ "eval_steps_per_second": 29.15,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.9831501831501831,
26
+ "eval_f1": 0.983143153392684,
27
+ "eval_loss": 0.060115572065114975,
28
+ "eval_precision": 0.9831374404084774,
29
+ "eval_recall": 0.9831501831501831,
30
+ "eval_runtime": 5.9254,
31
+ "eval_samples_per_second": 230.365,
32
+ "eval_steps_per_second": 28.859,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
+ "eval_accuracy": 0.9868131868131869,
38
+ "eval_f1": 0.9868241092241091,
39
+ "eval_loss": 0.05060575157403946,
40
+ "eval_precision": 0.9868403029537207,
41
+ "eval_recall": 0.9868131868131869,
42
+ "eval_runtime": 5.9299,
43
+ "eval_samples_per_second": 230.189,
44
+ "eval_steps_per_second": 28.837,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
+ "eval_accuracy": 0.9860805860805861,
50
+ "eval_f1": 0.9861535269385863,
51
+ "eval_loss": 0.04610973969101906,
52
+ "eval_precision": 0.986445121171901,
53
+ "eval_recall": 0.9860805860805861,
54
+ "eval_runtime": 5.9428,
55
+ "eval_samples_per_second": 229.69,
56
+ "eval_steps_per_second": 28.774,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
+ "eval_accuracy": 0.989010989010989,
62
+ "eval_f1": 0.9890246085529585,
63
+ "eval_loss": 0.0438910573720932,
64
+ "eval_precision": 0.989050109460552,
65
+ "eval_recall": 0.989010989010989,
66
+ "eval_runtime": 5.937,
67
+ "eval_samples_per_second": 229.913,
68
+ "eval_steps_per_second": 28.802,
69
  "step": 426
70
  }
71
  ],
72
  "logging_steps": 500,
73
+ "max_steps": 850,
74
  "num_input_tokens_seen": 0,
75
+ "num_train_epochs": 10,
76
  "save_steps": 500,
77
  "stateful_callbacks": {
78
  "EarlyStoppingCallback": {
checkpoint-426/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0f29e363429f3041b65000237638d975c16df70ba592fd3c2ce610392338bd3
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
3
  size 5240
checkpoint-512/config.json CHANGED
@@ -55,10 +55,6 @@
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
58
- "label2id": {
59
- "crying": 0,
60
- "no_crying": 1
61
- },
62
  "layer_norm_eps": 1e-05,
63
  "layerdrop": 0.0,
64
  "mask_feature_length": 10,
 
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
 
 
 
 
58
  "layer_norm_eps": 1e-05,
59
  "layerdrop": 0.0,
60
  "mask_feature_length": 10,
checkpoint-512/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35b0d90358beea477341c41eb5ba7259fabcc0922d7900d91362f0fbaf06bab2
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35f0fba66e2bc44178994b63877f32d5ef3660e920cd130dae9ccbf8e054d15a
3
  size 94763496
checkpoint-512/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:648b988b59d53cdfb9a307e0c1ecb64a428672a7b441f4145e8d3d009ae2cfbe
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32489c4cc27d23701cd78e51f1daf46563d47112b4e3520ad9568800f0b86fb3
3
  size 189552570
checkpoint-512/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1f22cb39573891adcd854d571d182ed521927c0644cb49b42c5a9a0f0635791
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0643374a18b5da11030bd13ba87a30fd86ee77d7702b1fa1d0aee2f444563b7c
3
  size 1064
checkpoint-512/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9897435897435898,
3
- "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
4
  "epoch": 5.997071742313324,
5
  "eval_steps": 500,
6
  "global_step": 512,
@@ -11,80 +11,80 @@
11
  {
12
  "epoch": 0.9956076134699854,
13
  "eval_accuracy": 0.9538461538461539,
14
- "eval_f1": 0.953235199825453,
15
- "eval_loss": 0.13410410284996033,
16
- "eval_precision": 0.9543176332312968,
17
  "eval_recall": 0.9538461538461539,
18
- "eval_runtime": 5.9191,
19
- "eval_samples_per_second": 230.61,
20
- "eval_steps_per_second": 28.89,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
- "eval_accuracy": 0.96996336996337,
26
- "eval_f1": 0.970275727358029,
27
- "eval_loss": 0.08308757096529007,
28
- "eval_precision": 0.9720059808561178,
29
- "eval_recall": 0.96996336996337,
30
- "eval_runtime": 5.9321,
31
- "eval_samples_per_second": 230.105,
32
- "eval_steps_per_second": 28.826,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
- "eval_accuracy": 0.9846153846153847,
38
- "eval_f1": 0.9845587007434289,
39
- "eval_loss": 0.05695493519306183,
40
- "eval_precision": 0.984652882646444,
41
- "eval_recall": 0.9846153846153847,
42
- "eval_runtime": 5.924,
43
- "eval_samples_per_second": 230.421,
44
- "eval_steps_per_second": 28.866,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
- "eval_accuracy": 0.9897435897435898,
50
- "eval_f1": 0.9897502348272303,
51
- "eval_loss": 0.03400224819779396,
52
- "eval_precision": 0.9897618176566864,
53
- "eval_recall": 0.9897435897435898,
54
- "eval_runtime": 5.9234,
55
- "eval_samples_per_second": 230.441,
56
- "eval_steps_per_second": 28.868,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
- "eval_accuracy": 0.9875457875457876,
62
- "eval_f1": 0.9876042969414931,
63
- "eval_loss": 0.04599935933947563,
64
- "eval_precision": 0.9879353582239604,
65
- "eval_recall": 0.9875457875457876,
66
- "eval_runtime": 5.9141,
67
- "eval_samples_per_second": 230.803,
68
- "eval_steps_per_second": 28.914,
69
  "step": 426
70
  },
71
  {
72
  "epoch": 5.856515373352855,
73
- "grad_norm": 0.020362911745905876,
74
- "learning_rate": 1.819507083000514e-05,
75
- "loss": 0.0707,
76
  "step": 500
77
  },
78
  {
79
  "epoch": 5.997071742313324,
80
- "eval_accuracy": 0.9897435897435898,
81
- "eval_f1": 0.9897761336599745,
82
- "eval_loss": 0.04312068223953247,
83
- "eval_precision": 0.9899308989239506,
84
- "eval_recall": 0.9897435897435898,
85
- "eval_runtime": 5.5776,
86
- "eval_samples_per_second": 244.727,
87
- "eval_steps_per_second": 30.658,
88
  "step": 512
89
  }
90
  ],
 
1
  {
2
+ "best_metric": 0.9904761904761905,
3
+ "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-512",
4
  "epoch": 5.997071742313324,
5
  "eval_steps": 500,
6
  "global_step": 512,
 
11
  {
12
  "epoch": 0.9956076134699854,
13
  "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.9535883665206972,
15
+ "eval_loss": 0.11965569853782654,
16
+ "eval_precision": 0.9535470731605858,
17
  "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.8661,
19
+ "eval_samples_per_second": 232.691,
20
+ "eval_steps_per_second": 29.15,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.9831501831501831,
26
+ "eval_f1": 0.983143153392684,
27
+ "eval_loss": 0.060115572065114975,
28
+ "eval_precision": 0.9831374404084774,
29
+ "eval_recall": 0.9831501831501831,
30
+ "eval_runtime": 5.9254,
31
+ "eval_samples_per_second": 230.365,
32
+ "eval_steps_per_second": 28.859,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
+ "eval_accuracy": 0.9868131868131869,
38
+ "eval_f1": 0.9868241092241091,
39
+ "eval_loss": 0.05060575157403946,
40
+ "eval_precision": 0.9868403029537207,
41
+ "eval_recall": 0.9868131868131869,
42
+ "eval_runtime": 5.9299,
43
+ "eval_samples_per_second": 230.189,
44
+ "eval_steps_per_second": 28.837,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
+ "eval_accuracy": 0.9860805860805861,
50
+ "eval_f1": 0.9861535269385863,
51
+ "eval_loss": 0.04610973969101906,
52
+ "eval_precision": 0.986445121171901,
53
+ "eval_recall": 0.9860805860805861,
54
+ "eval_runtime": 5.9428,
55
+ "eval_samples_per_second": 229.69,
56
+ "eval_steps_per_second": 28.774,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
+ "eval_accuracy": 0.989010989010989,
62
+ "eval_f1": 0.9890246085529585,
63
+ "eval_loss": 0.0438910573720932,
64
+ "eval_precision": 0.989050109460552,
65
+ "eval_recall": 0.989010989010989,
66
+ "eval_runtime": 5.937,
67
+ "eval_samples_per_second": 229.913,
68
+ "eval_steps_per_second": 28.802,
69
  "step": 426
70
  },
71
  {
72
  "epoch": 5.856515373352855,
73
+ "grad_norm": 0.08060992509126663,
74
+ "learning_rate": 1.0917042498003083e-05,
75
+ "loss": 0.0779,
76
  "step": 500
77
  },
78
  {
79
  "epoch": 5.997071742313324,
80
+ "eval_accuracy": 0.9904761904761905,
81
+ "eval_f1": 0.9904879940792306,
82
+ "eval_loss": 0.0396205335855484,
83
+ "eval_precision": 0.9905117057078526,
84
+ "eval_recall": 0.9904761904761905,
85
+ "eval_runtime": 5.9047,
86
+ "eval_samples_per_second": 231.172,
87
+ "eval_steps_per_second": 28.96,
88
  "step": 512
89
  }
90
  ],
checkpoint-512/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:831297954221509dc3f32e8eaf01789c3f660cf430e186799d52e58ec3b5b334
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
3
  size 5240
checkpoint-597/config.json CHANGED
@@ -55,10 +55,6 @@
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
58
- "label2id": {
59
- "crying": 0,
60
- "no_crying": 1
61
- },
62
  "layer_norm_eps": 1e-05,
63
  "layerdrop": 0.0,
64
  "mask_feature_length": 10,
 
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
 
 
 
 
58
  "layer_norm_eps": 1e-05,
59
  "layerdrop": 0.0,
60
  "mask_feature_length": 10,
checkpoint-597/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c617973600d573c483f588a59837c6d45814ca8e16c64575f5523b65246f0c5e
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fefc9fc9e0c6f521d52f6944550be09ad08cf2a406465b2bad96d43e8e656a9
3
  size 94763496
checkpoint-597/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:86268f89454cc35e41155e346d8e2ca8d5a9b6f579d1fef2bbfc8b823eace3b9
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de0a5be77c65d20eadb1a24d44af2c728f76e6c9b01b584c11efa9dac4bab929
3
  size 189552570
checkpoint-597/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c216d743853a404a50b6a598e3c4bf36fa1dc8935b24320ebe609a9c5c9b437
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65e5b7798f882f09e50f351045d72a3f8133a68153dae42b3d7541432cd2e9e0
3
  size 1064
checkpoint-597/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9897435897435898,
3
- "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
4
  "epoch": 6.992679355783309,
5
  "eval_steps": 500,
6
  "global_step": 597,
@@ -11,92 +11,92 @@
11
  {
12
  "epoch": 0.9956076134699854,
13
  "eval_accuracy": 0.9538461538461539,
14
- "eval_f1": 0.953235199825453,
15
- "eval_loss": 0.13410410284996033,
16
- "eval_precision": 0.9543176332312968,
17
  "eval_recall": 0.9538461538461539,
18
- "eval_runtime": 5.9191,
19
- "eval_samples_per_second": 230.61,
20
- "eval_steps_per_second": 28.89,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
- "eval_accuracy": 0.96996336996337,
26
- "eval_f1": 0.970275727358029,
27
- "eval_loss": 0.08308757096529007,
28
- "eval_precision": 0.9720059808561178,
29
- "eval_recall": 0.96996336996337,
30
- "eval_runtime": 5.9321,
31
- "eval_samples_per_second": 230.105,
32
- "eval_steps_per_second": 28.826,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
- "eval_accuracy": 0.9846153846153847,
38
- "eval_f1": 0.9845587007434289,
39
- "eval_loss": 0.05695493519306183,
40
- "eval_precision": 0.984652882646444,
41
- "eval_recall": 0.9846153846153847,
42
- "eval_runtime": 5.924,
43
- "eval_samples_per_second": 230.421,
44
- "eval_steps_per_second": 28.866,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
- "eval_accuracy": 0.9897435897435898,
50
- "eval_f1": 0.9897502348272303,
51
- "eval_loss": 0.03400224819779396,
52
- "eval_precision": 0.9897618176566864,
53
- "eval_recall": 0.9897435897435898,
54
- "eval_runtime": 5.9234,
55
- "eval_samples_per_second": 230.441,
56
- "eval_steps_per_second": 28.868,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
- "eval_accuracy": 0.9875457875457876,
62
- "eval_f1": 0.9876042969414931,
63
- "eval_loss": 0.04599935933947563,
64
- "eval_precision": 0.9879353582239604,
65
- "eval_recall": 0.9875457875457876,
66
- "eval_runtime": 5.9141,
67
- "eval_samples_per_second": 230.803,
68
- "eval_steps_per_second": 28.914,
69
  "step": 426
70
  },
71
  {
72
  "epoch": 5.856515373352855,
73
- "grad_norm": 0.020362911745905876,
74
- "learning_rate": 1.819507083000514e-05,
75
- "loss": 0.0707,
76
  "step": 500
77
  },
78
  {
79
  "epoch": 5.997071742313324,
80
- "eval_accuracy": 0.9897435897435898,
81
- "eval_f1": 0.9897761336599745,
82
- "eval_loss": 0.04312068223953247,
83
- "eval_precision": 0.9899308989239506,
84
- "eval_recall": 0.9897435897435898,
85
- "eval_runtime": 5.5776,
86
- "eval_samples_per_second": 244.727,
87
- "eval_steps_per_second": 30.658,
88
  "step": 512
89
  },
90
  {
91
  "epoch": 6.992679355783309,
92
- "eval_accuracy": 0.9882783882783883,
93
- "eval_f1": 0.9882934987415589,
94
- "eval_loss": 0.035927049815654755,
95
- "eval_precision": 0.9883282714000319,
96
- "eval_recall": 0.9882783882783883,
97
- "eval_runtime": 5.5806,
98
- "eval_samples_per_second": 244.596,
99
- "eval_steps_per_second": 30.642,
100
  "step": 597
101
  }
102
  ],
@@ -121,7 +121,7 @@
121
  "should_evaluate": false,
122
  "should_log": false,
123
  "should_save": true,
124
- "should_training_stop": true
125
  },
126
  "attributes": {}
127
  }
 
1
  {
2
+ "best_metric": 0.991941391941392,
3
+ "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-597",
4
  "epoch": 6.992679355783309,
5
  "eval_steps": 500,
6
  "global_step": 597,
 
11
  {
12
  "epoch": 0.9956076134699854,
13
  "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.9535883665206972,
15
+ "eval_loss": 0.11965569853782654,
16
+ "eval_precision": 0.9535470731605858,
17
  "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.8661,
19
+ "eval_samples_per_second": 232.691,
20
+ "eval_steps_per_second": 29.15,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.9831501831501831,
26
+ "eval_f1": 0.983143153392684,
27
+ "eval_loss": 0.060115572065114975,
28
+ "eval_precision": 0.9831374404084774,
29
+ "eval_recall": 0.9831501831501831,
30
+ "eval_runtime": 5.9254,
31
+ "eval_samples_per_second": 230.365,
32
+ "eval_steps_per_second": 28.859,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
+ "eval_accuracy": 0.9868131868131869,
38
+ "eval_f1": 0.9868241092241091,
39
+ "eval_loss": 0.05060575157403946,
40
+ "eval_precision": 0.9868403029537207,
41
+ "eval_recall": 0.9868131868131869,
42
+ "eval_runtime": 5.9299,
43
+ "eval_samples_per_second": 230.189,
44
+ "eval_steps_per_second": 28.837,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
+ "eval_accuracy": 0.9860805860805861,
50
+ "eval_f1": 0.9861535269385863,
51
+ "eval_loss": 0.04610973969101906,
52
+ "eval_precision": 0.986445121171901,
53
+ "eval_recall": 0.9860805860805861,
54
+ "eval_runtime": 5.9428,
55
+ "eval_samples_per_second": 229.69,
56
+ "eval_steps_per_second": 28.774,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
+ "eval_accuracy": 0.989010989010989,
62
+ "eval_f1": 0.9890246085529585,
63
+ "eval_loss": 0.0438910573720932,
64
+ "eval_precision": 0.989050109460552,
65
+ "eval_recall": 0.989010989010989,
66
+ "eval_runtime": 5.937,
67
+ "eval_samples_per_second": 229.913,
68
+ "eval_steps_per_second": 28.802,
69
  "step": 426
70
  },
71
  {
72
  "epoch": 5.856515373352855,
73
+ "grad_norm": 0.08060992509126663,
74
+ "learning_rate": 1.0917042498003083e-05,
75
+ "loss": 0.0779,
76
  "step": 500
77
  },
78
  {
79
  "epoch": 5.997071742313324,
80
+ "eval_accuracy": 0.9904761904761905,
81
+ "eval_f1": 0.9904879940792306,
82
+ "eval_loss": 0.0396205335855484,
83
+ "eval_precision": 0.9905117057078526,
84
+ "eval_recall": 0.9904761904761905,
85
+ "eval_runtime": 5.9047,
86
+ "eval_samples_per_second": 231.172,
87
+ "eval_steps_per_second": 28.96,
88
  "step": 512
89
  },
90
  {
91
  "epoch": 6.992679355783309,
92
+ "eval_accuracy": 0.991941391941392,
93
+ "eval_f1": 0.9919447375447602,
94
+ "eval_loss": 0.035047151148319244,
95
+ "eval_precision": 0.9919494135494136,
96
+ "eval_recall": 0.991941391941392,
97
+ "eval_runtime": 6.0502,
98
+ "eval_samples_per_second": 225.612,
99
+ "eval_steps_per_second": 28.264,
100
  "step": 597
101
  }
102
  ],
 
121
  "should_evaluate": false,
122
  "should_log": false,
123
  "should_save": true,
124
+ "should_training_stop": false
125
  },
126
  "attributes": {}
127
  }
checkpoint-597/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:831297954221509dc3f32e8eaf01789c3f660cf430e186799d52e58ec3b5b334
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
3
  size 5240
checkpoint-683/config.json CHANGED
@@ -45,6 +45,7 @@
45
  "feat_proj_dropout": 0.0,
46
  "feat_proj_layer_norm": false,
47
  "final_dropout": 0.0,
 
48
  "hidden_act": "gelu",
49
  "hidden_dropout": 0.1,
50
  "hidden_size": 768,
@@ -54,10 +55,6 @@
54
  },
55
  "initializer_range": 0.02,
56
  "intermediate_size": 3072,
57
- "label2id": {
58
- "crying": "0",
59
- "no_crying": "1"
60
- },
61
  "layer_norm_eps": 1e-05,
62
  "layerdrop": 0.0,
63
  "mask_feature_length": 10,
 
45
  "feat_proj_dropout": 0.0,
46
  "feat_proj_layer_norm": false,
47
  "final_dropout": 0.0,
48
+ "finetuning_task": "audio-classification",
49
  "hidden_act": "gelu",
50
  "hidden_dropout": 0.1,
51
  "hidden_size": 768,
 
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
 
 
 
 
58
  "layer_norm_eps": 1e-05,
59
  "layerdrop": 0.0,
60
  "mask_feature_length": 10,
checkpoint-683/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52ec3a122dd4e1c3f5b4ae3dc2e2256f512a563d42eb82426ac3f8094e0c4490
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47eb6b3cfe6fa933d4d9bda0995a1e235c1d9ec1d2481708bed5a4149e8262a4
3
  size 94763496
checkpoint-683/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b6591188ba0c4025fcbff86219e7c2755b85671c8b4d10202fa03cef2f8831a1
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccd75da0e8ea0bf33fb98b23e1d8b9fc9f33d7c31a91837683d49c15ae856034
3
  size 189552570
checkpoint-683/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b712ee88015e952bb23b1f5495f272411d9c19a17334b27df15dc1ebbac98f35
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bde01021f76a64b9ec7866fcc536e72a45008d7566739a02f03c4c895a14c72c
3
  size 1064
checkpoint-683/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9926739926739927,
3
- "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-512",
4
  "epoch": 8.0,
5
  "eval_steps": 500,
6
  "global_step": 683,
@@ -10,81 +10,105 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9772893772893773,
14
- "eval_loss": 0.06922276318073273,
15
- "eval_runtime": 15.5305,
16
- "eval_samples_per_second": 87.892,
17
- "eval_steps_per_second": 11.011,
 
 
 
18
  "step": 85
19
  },
20
  {
21
  "epoch": 1.9912152269399708,
22
- "eval_accuracy": 0.9860805860805861,
23
- "eval_loss": 0.04661192744970322,
24
- "eval_runtime": 15.4605,
25
- "eval_samples_per_second": 88.29,
26
- "eval_steps_per_second": 11.06,
 
 
 
27
  "step": 170
28
  },
29
  {
30
  "epoch": 2.998535871156662,
31
- "eval_accuracy": 0.9853479853479854,
32
- "eval_loss": 0.04894961416721344,
33
- "eval_runtime": 15.5622,
34
- "eval_samples_per_second": 87.713,
35
- "eval_steps_per_second": 10.988,
 
 
 
36
  "step": 256
37
  },
38
  {
39
  "epoch": 3.994143484626647,
40
- "eval_accuracy": 0.9897435897435898,
41
- "eval_loss": 0.04228556528687477,
42
- "eval_runtime": 15.6217,
43
- "eval_samples_per_second": 87.378,
44
- "eval_steps_per_second": 10.946,
 
 
 
45
  "step": 341
46
  },
47
  {
48
  "epoch": 4.989751098096632,
49
- "eval_accuracy": 0.991941391941392,
50
- "eval_loss": 0.044283464550971985,
51
- "eval_runtime": 15.0667,
52
- "eval_samples_per_second": 90.597,
53
- "eval_steps_per_second": 11.35,
 
 
 
54
  "step": 426
55
  },
56
  {
57
  "epoch": 5.856515373352855,
58
- "grad_norm": 0.008579956367611885,
59
- "learning_rate": 3.639014166001028e-05,
60
- "loss": 0.055,
61
  "step": 500
62
  },
63
  {
64
  "epoch": 5.997071742313324,
65
- "eval_accuracy": 0.9926739926739927,
66
- "eval_loss": 0.04338795691728592,
67
- "eval_runtime": 14.898,
68
- "eval_samples_per_second": 91.623,
69
- "eval_steps_per_second": 11.478,
 
 
 
70
  "step": 512
71
  },
72
  {
73
  "epoch": 6.992679355783309,
74
- "eval_accuracy": 0.9926739926739927,
75
- "eval_loss": 0.04399614781141281,
76
- "eval_runtime": 15.2426,
77
- "eval_samples_per_second": 89.552,
78
- "eval_steps_per_second": 11.219,
 
 
 
79
  "step": 597
80
  },
81
  {
82
  "epoch": 8.0,
83
- "eval_accuracy": 0.9926739926739927,
84
- "eval_loss": 0.045955102890729904,
85
- "eval_runtime": 15.1372,
86
- "eval_samples_per_second": 90.175,
87
- "eval_steps_per_second": 11.297,
 
 
 
88
  "step": 683
89
  }
90
  ],
 
1
  {
2
+ "best_metric": 0.991941391941392,
3
+ "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-597",
4
  "epoch": 8.0,
5
  "eval_steps": 500,
6
  "global_step": 683,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.9535883665206972,
15
+ "eval_loss": 0.11965569853782654,
16
+ "eval_precision": 0.9535470731605858,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.8661,
19
+ "eval_samples_per_second": 232.691,
20
+ "eval_steps_per_second": 29.15,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.9831501831501831,
26
+ "eval_f1": 0.983143153392684,
27
+ "eval_loss": 0.060115572065114975,
28
+ "eval_precision": 0.9831374404084774,
29
+ "eval_recall": 0.9831501831501831,
30
+ "eval_runtime": 5.9254,
31
+ "eval_samples_per_second": 230.365,
32
+ "eval_steps_per_second": 28.859,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
+ "eval_accuracy": 0.9868131868131869,
38
+ "eval_f1": 0.9868241092241091,
39
+ "eval_loss": 0.05060575157403946,
40
+ "eval_precision": 0.9868403029537207,
41
+ "eval_recall": 0.9868131868131869,
42
+ "eval_runtime": 5.9299,
43
+ "eval_samples_per_second": 230.189,
44
+ "eval_steps_per_second": 28.837,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
+ "eval_accuracy": 0.9860805860805861,
50
+ "eval_f1": 0.9861535269385863,
51
+ "eval_loss": 0.04610973969101906,
52
+ "eval_precision": 0.986445121171901,
53
+ "eval_recall": 0.9860805860805861,
54
+ "eval_runtime": 5.9428,
55
+ "eval_samples_per_second": 229.69,
56
+ "eval_steps_per_second": 28.774,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
+ "eval_accuracy": 0.989010989010989,
62
+ "eval_f1": 0.9890246085529585,
63
+ "eval_loss": 0.0438910573720932,
64
+ "eval_precision": 0.989050109460552,
65
+ "eval_recall": 0.989010989010989,
66
+ "eval_runtime": 5.937,
67
+ "eval_samples_per_second": 229.913,
68
+ "eval_steps_per_second": 28.802,
69
  "step": 426
70
  },
71
  {
72
  "epoch": 5.856515373352855,
73
+ "grad_norm": 0.08060992509126663,
74
+ "learning_rate": 1.0917042498003083e-05,
75
+ "loss": 0.0779,
76
  "step": 500
77
  },
78
  {
79
  "epoch": 5.997071742313324,
80
+ "eval_accuracy": 0.9904761904761905,
81
+ "eval_f1": 0.9904879940792306,
82
+ "eval_loss": 0.0396205335855484,
83
+ "eval_precision": 0.9905117057078526,
84
+ "eval_recall": 0.9904761904761905,
85
+ "eval_runtime": 5.9047,
86
+ "eval_samples_per_second": 231.172,
87
+ "eval_steps_per_second": 28.96,
88
  "step": 512
89
  },
90
  {
91
  "epoch": 6.992679355783309,
92
+ "eval_accuracy": 0.991941391941392,
93
+ "eval_f1": 0.9919447375447602,
94
+ "eval_loss": 0.035047151148319244,
95
+ "eval_precision": 0.9919494135494136,
96
+ "eval_recall": 0.991941391941392,
97
+ "eval_runtime": 6.0502,
98
+ "eval_samples_per_second": 225.612,
99
+ "eval_steps_per_second": 28.264,
100
  "step": 597
101
  },
102
  {
103
  "epoch": 8.0,
104
+ "eval_accuracy": 0.9912087912087912,
105
+ "eval_f1": 0.9912160728160728,
106
+ "eval_loss": 0.03350323066115379,
107
+ "eval_precision": 0.9912286614059304,
108
+ "eval_recall": 0.9912087912087912,
109
+ "eval_runtime": 5.79,
110
+ "eval_samples_per_second": 235.751,
111
+ "eval_steps_per_second": 29.534,
112
  "step": 683
113
  }
114
  ],
checkpoint-683/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84d763bc52a548d7900e672478766167dea5015bedfc4ad077e5cffda9256cc8
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
3
  size 5240
checkpoint-768/config.json CHANGED
@@ -45,6 +45,7 @@
45
  "feat_proj_dropout": 0.0,
46
  "feat_proj_layer_norm": false,
47
  "final_dropout": 0.0,
 
48
  "hidden_act": "gelu",
49
  "hidden_dropout": 0.1,
50
  "hidden_size": 768,
@@ -54,10 +55,6 @@
54
  },
55
  "initializer_range": 0.02,
56
  "intermediate_size": 3072,
57
- "label2id": {
58
- "crying": "0",
59
- "no_crying": "1"
60
- },
61
  "layer_norm_eps": 1e-05,
62
  "layerdrop": 0.0,
63
  "mask_feature_length": 10,
 
45
  "feat_proj_dropout": 0.0,
46
  "feat_proj_layer_norm": false,
47
  "final_dropout": 0.0,
48
+ "finetuning_task": "audio-classification",
49
  "hidden_act": "gelu",
50
  "hidden_dropout": 0.1,
51
  "hidden_size": 768,
 
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
 
 
 
 
58
  "layer_norm_eps": 1e-05,
59
  "layerdrop": 0.0,
60
  "mask_feature_length": 10,
checkpoint-768/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0e5671ffc6960b29ad80f820b4317ec548ff0deefca2464ad359c421c360e64f
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:589720455553dad3b547e7fc5aac19151dbefadb26d39a6a04c708e344cfd310
3
  size 94763496
checkpoint-768/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7516d91f602bba3efff25344b03b35e85d41b8ce4db2a56619d6dcf6cd2cc2df
3
  size 189552570
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b863d95ad20867c4606dfd4b07ae1866e1bfbd283086e4449d924ccf79d9d2dc
3
  size 189552570
checkpoint-768/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46a9a21b9ea0c395732aadaa7b885d80eaa4d81c9d9d1eea099d6180e939da87
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acb83cb237d82342af5936197af5c426903999a84d7161b385fa3b80c0070365
3
  size 1064
checkpoint-768/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9926739926739927,
3
- "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-512",
4
  "epoch": 8.995607613469986,
5
  "eval_steps": 500,
6
  "global_step": 768,
@@ -10,90 +10,117 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
- "eval_accuracy": 0.9772893772893773,
14
- "eval_loss": 0.06922276318073273,
15
- "eval_runtime": 15.5305,
16
- "eval_samples_per_second": 87.892,
17
- "eval_steps_per_second": 11.011,
 
 
 
18
  "step": 85
19
  },
20
  {
21
  "epoch": 1.9912152269399708,
22
- "eval_accuracy": 0.9860805860805861,
23
- "eval_loss": 0.04661192744970322,
24
- "eval_runtime": 15.4605,
25
- "eval_samples_per_second": 88.29,
26
- "eval_steps_per_second": 11.06,
 
 
 
27
  "step": 170
28
  },
29
  {
30
  "epoch": 2.998535871156662,
31
- "eval_accuracy": 0.9853479853479854,
32
- "eval_loss": 0.04894961416721344,
33
- "eval_runtime": 15.5622,
34
- "eval_samples_per_second": 87.713,
35
- "eval_steps_per_second": 10.988,
 
 
 
36
  "step": 256
37
  },
38
  {
39
  "epoch": 3.994143484626647,
40
- "eval_accuracy": 0.9897435897435898,
41
- "eval_loss": 0.04228556528687477,
42
- "eval_runtime": 15.6217,
43
- "eval_samples_per_second": 87.378,
44
- "eval_steps_per_second": 10.946,
 
 
 
45
  "step": 341
46
  },
47
  {
48
  "epoch": 4.989751098096632,
49
- "eval_accuracy": 0.991941391941392,
50
- "eval_loss": 0.044283464550971985,
51
- "eval_runtime": 15.0667,
52
- "eval_samples_per_second": 90.597,
53
- "eval_steps_per_second": 11.35,
 
 
 
54
  "step": 426
55
  },
56
  {
57
  "epoch": 5.856515373352855,
58
- "grad_norm": 0.008579956367611885,
59
- "learning_rate": 3.639014166001028e-05,
60
- "loss": 0.055,
61
  "step": 500
62
  },
63
  {
64
  "epoch": 5.997071742313324,
65
- "eval_accuracy": 0.9926739926739927,
66
- "eval_loss": 0.04338795691728592,
67
- "eval_runtime": 14.898,
68
- "eval_samples_per_second": 91.623,
69
- "eval_steps_per_second": 11.478,
 
 
 
70
  "step": 512
71
  },
72
  {
73
  "epoch": 6.992679355783309,
74
- "eval_accuracy": 0.9926739926739927,
75
- "eval_loss": 0.04399614781141281,
76
- "eval_runtime": 15.2426,
77
- "eval_samples_per_second": 89.552,
78
- "eval_steps_per_second": 11.219,
 
 
 
79
  "step": 597
80
  },
81
  {
82
  "epoch": 8.0,
83
- "eval_accuracy": 0.9926739926739927,
84
- "eval_loss": 0.045955102890729904,
85
- "eval_runtime": 15.1372,
86
- "eval_samples_per_second": 90.175,
87
- "eval_steps_per_second": 11.297,
 
 
 
88
  "step": 683
89
  },
90
  {
91
  "epoch": 8.995607613469986,
92
- "eval_accuracy": 0.9926739926739927,
93
- "eval_loss": 0.04587433487176895,
94
- "eval_runtime": 15.0807,
95
- "eval_samples_per_second": 90.513,
96
- "eval_steps_per_second": 11.339,
 
 
 
97
  "step": 768
98
  }
99
  ],
@@ -118,7 +145,7 @@
118
  "should_evaluate": false,
119
  "should_log": false,
120
  "should_save": true,
121
- "should_training_stop": true
122
  },
123
  "attributes": {}
124
  }
 
1
  {
2
+ "best_metric": 0.991941391941392,
3
+ "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-597",
4
  "epoch": 8.995607613469986,
5
  "eval_steps": 500,
6
  "global_step": 768,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.9956076134699854,
13
+ "eval_accuracy": 0.9538461538461539,
14
+ "eval_f1": 0.9535883665206972,
15
+ "eval_loss": 0.11965569853782654,
16
+ "eval_precision": 0.9535470731605858,
17
+ "eval_recall": 0.9538461538461539,
18
+ "eval_runtime": 5.8661,
19
+ "eval_samples_per_second": 232.691,
20
+ "eval_steps_per_second": 29.15,
21
  "step": 85
22
  },
23
  {
24
  "epoch": 1.9912152269399708,
25
+ "eval_accuracy": 0.9831501831501831,
26
+ "eval_f1": 0.983143153392684,
27
+ "eval_loss": 0.060115572065114975,
28
+ "eval_precision": 0.9831374404084774,
29
+ "eval_recall": 0.9831501831501831,
30
+ "eval_runtime": 5.9254,
31
+ "eval_samples_per_second": 230.365,
32
+ "eval_steps_per_second": 28.859,
33
  "step": 170
34
  },
35
  {
36
  "epoch": 2.998535871156662,
37
+ "eval_accuracy": 0.9868131868131869,
38
+ "eval_f1": 0.9868241092241091,
39
+ "eval_loss": 0.05060575157403946,
40
+ "eval_precision": 0.9868403029537207,
41
+ "eval_recall": 0.9868131868131869,
42
+ "eval_runtime": 5.9299,
43
+ "eval_samples_per_second": 230.189,
44
+ "eval_steps_per_second": 28.837,
45
  "step": 256
46
  },
47
  {
48
  "epoch": 3.994143484626647,
49
+ "eval_accuracy": 0.9860805860805861,
50
+ "eval_f1": 0.9861535269385863,
51
+ "eval_loss": 0.04610973969101906,
52
+ "eval_precision": 0.986445121171901,
53
+ "eval_recall": 0.9860805860805861,
54
+ "eval_runtime": 5.9428,
55
+ "eval_samples_per_second": 229.69,
56
+ "eval_steps_per_second": 28.774,
57
  "step": 341
58
  },
59
  {
60
  "epoch": 4.989751098096632,
61
+ "eval_accuracy": 0.989010989010989,
62
+ "eval_f1": 0.9890246085529585,
63
+ "eval_loss": 0.0438910573720932,
64
+ "eval_precision": 0.989050109460552,
65
+ "eval_recall": 0.989010989010989,
66
+ "eval_runtime": 5.937,
67
+ "eval_samples_per_second": 229.913,
68
+ "eval_steps_per_second": 28.802,
69
  "step": 426
70
  },
71
  {
72
  "epoch": 5.856515373352855,
73
+ "grad_norm": 0.08060992509126663,
74
+ "learning_rate": 1.0917042498003083e-05,
75
+ "loss": 0.0779,
76
  "step": 500
77
  },
78
  {
79
  "epoch": 5.997071742313324,
80
+ "eval_accuracy": 0.9904761904761905,
81
+ "eval_f1": 0.9904879940792306,
82
+ "eval_loss": 0.0396205335855484,
83
+ "eval_precision": 0.9905117057078526,
84
+ "eval_recall": 0.9904761904761905,
85
+ "eval_runtime": 5.9047,
86
+ "eval_samples_per_second": 231.172,
87
+ "eval_steps_per_second": 28.96,
88
  "step": 512
89
  },
90
  {
91
  "epoch": 6.992679355783309,
92
+ "eval_accuracy": 0.991941391941392,
93
+ "eval_f1": 0.9919447375447602,
94
+ "eval_loss": 0.035047151148319244,
95
+ "eval_precision": 0.9919494135494136,
96
+ "eval_recall": 0.991941391941392,
97
+ "eval_runtime": 6.0502,
98
+ "eval_samples_per_second": 225.612,
99
+ "eval_steps_per_second": 28.264,
100
  "step": 597
101
  },
102
  {
103
  "epoch": 8.0,
104
+ "eval_accuracy": 0.9912087912087912,
105
+ "eval_f1": 0.9912160728160728,
106
+ "eval_loss": 0.03350323066115379,
107
+ "eval_precision": 0.9912286614059304,
108
+ "eval_recall": 0.9912087912087912,
109
+ "eval_runtime": 5.79,
110
+ "eval_samples_per_second": 235.751,
111
+ "eval_steps_per_second": 29.534,
112
  "step": 683
113
  },
114
  {
115
  "epoch": 8.995607613469986,
116
+ "eval_accuracy": 0.9912087912087912,
117
+ "eval_f1": 0.9912160728160728,
118
+ "eval_loss": 0.03368490934371948,
119
+ "eval_precision": 0.9912286614059304,
120
+ "eval_recall": 0.9912087912087912,
121
+ "eval_runtime": 5.7784,
122
+ "eval_samples_per_second": 236.224,
123
+ "eval_steps_per_second": 29.593,
124
  "step": 768
125
  }
126
  ],
 
145
  "should_evaluate": false,
146
  "should_log": false,
147
  "should_save": true,
148
+ "should_training_stop": false
149
  },
150
  "attributes": {}
151
  }
checkpoint-768/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:84d763bc52a548d7900e672478766167dea5015bedfc4ad077e5cffda9256cc8
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b
3
  size 5240
checkpoint-85/config.json CHANGED
@@ -55,10 +55,6 @@
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
58
- "label2id": {
59
- "crying": 0,
60
- "no_crying": 1
61
- },
62
  "layer_norm_eps": 1e-05,
63
  "layerdrop": 0.0,
64
  "mask_feature_length": 10,
 
55
  },
56
  "initializer_range": 0.02,
57
  "intermediate_size": 3072,
 
 
 
 
58
  "layer_norm_eps": 1e-05,
59
  "layerdrop": 0.0,
60
  "mask_feature_length": 10,
checkpoint-85/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:667f991dfd621ded0f030ae62bee9e55c4e297c107c7ab609989f56ba7da4287
3
  size 94763496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23b104b8e2a8ab0ab3becb4267c1082a46bc58158acb8a209710fb47609d3b4f
3
  size 94763496