Spaces:
Sleeping
Sleeping
Marcos12886
commited on
Commit
•
96d8764
1
Parent(s):
9b48c7d
Subir parámetros entrenamiento 10 class, 6 mon
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitignore +1 -3
- distilhubert-finetuned-cry-detector/checkpoint-170/config.json +81 -0
- distilhubert-finetuned-cry-detector/checkpoint-170/model.safetensors +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-170/optimizer.pt +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-170/rng_state.pth +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-170/scheduler.pt +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-170/trainer_state.json +66 -0
- distilhubert-finetuned-cry-detector/checkpoint-170/training_args.bin +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-256/config.json +81 -0
- distilhubert-finetuned-cry-detector/checkpoint-256/model.safetensors +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-256/optimizer.pt +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-256/rng_state.pth +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-256/scheduler.pt +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-256/trainer_state.json +78 -0
- distilhubert-finetuned-cry-detector/checkpoint-256/training_args.bin +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-341/config.json +81 -0
- distilhubert-finetuned-cry-detector/checkpoint-341/model.safetensors +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-341/optimizer.pt +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-341/rng_state.pth +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-341/scheduler.pt +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-341/trainer_state.json +90 -0
- distilhubert-finetuned-cry-detector/checkpoint-341/training_args.bin +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-426/config.json +81 -0
- distilhubert-finetuned-cry-detector/checkpoint-426/model.safetensors +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-426/optimizer.pt +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-426/rng_state.pth +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-426/scheduler.pt +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-426/trainer_state.json +102 -0
- distilhubert-finetuned-cry-detector/checkpoint-426/training_args.bin +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-510/config.json +81 -0
- distilhubert-finetuned-cry-detector/checkpoint-510/model.safetensors +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-510/optimizer.pt +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-510/rng_state.pth +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-510/scheduler.pt +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-510/trainer_state.json +121 -0
- distilhubert-finetuned-cry-detector/checkpoint-510/training_args.bin +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-85/config.json +81 -0
- distilhubert-finetuned-cry-detector/checkpoint-85/model.safetensors +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-85/optimizer.pt +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-85/rng_state.pth +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-85/scheduler.pt +3 -0
- distilhubert-finetuned-cry-detector/checkpoint-85/trainer_state.json +54 -0
- distilhubert-finetuned-cry-detector/checkpoint-85/training_args.bin +3 -0
- distilhubert-finetuned-cry-detector/config.json +81 -0
- distilhubert-finetuned-cry-detector/model.safetensors +3 -0
- distilhubert-finetuned-cry-detector/runs/Sep06_15-54-59_ubumarcos/events.out.tfevents.1725630900.ubumarcos +3 -0
- distilhubert-finetuned-cry-detector/runs/Sep06_17-32-26_ubumarcos/events.out.tfevents.1725636747.ubumarcos +3 -0
- distilhubert-finetuned-cry-detector/training_args.bin +3 -0
- distilhubert-finetuned-mixed-data/checkpoint-121/config.json +85 -0
- distilhubert-finetuned-mixed-data/checkpoint-121/model.safetensors +3 -0
.gitignore
CHANGED
@@ -1,5 +1,3 @@
|
|
1 |
__pycache__
|
2 |
.venv
|
3 |
-
.vscode
|
4 |
-
distilhubert-finetuned-cry-detector
|
5 |
-
distilhubert-finetuned-mixed-data
|
|
|
1 |
__pycache__
|
2 |
.venv
|
3 |
+
.vscode
|
|
|
|
distilhubert-finetuned-cry-detector/checkpoint-170/config.json
ADDED
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "ntu-spml/distilhubert",
|
3 |
+
"activation_dropout": 0.1,
|
4 |
+
"apply_spec_augment": false,
|
5 |
+
"architectures": [
|
6 |
+
"HubertForSequenceClassification"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.1,
|
9 |
+
"bos_token_id": 1,
|
10 |
+
"classifier_proj_size": 256,
|
11 |
+
"conv_bias": false,
|
12 |
+
"conv_dim": [
|
13 |
+
512,
|
14 |
+
512,
|
15 |
+
512,
|
16 |
+
512,
|
17 |
+
512,
|
18 |
+
512,
|
19 |
+
512
|
20 |
+
],
|
21 |
+
"conv_kernel": [
|
22 |
+
10,
|
23 |
+
3,
|
24 |
+
3,
|
25 |
+
3,
|
26 |
+
3,
|
27 |
+
2,
|
28 |
+
2
|
29 |
+
],
|
30 |
+
"conv_stride": [
|
31 |
+
5,
|
32 |
+
2,
|
33 |
+
2,
|
34 |
+
2,
|
35 |
+
2,
|
36 |
+
2,
|
37 |
+
2
|
38 |
+
],
|
39 |
+
"ctc_loss_reduction": "sum",
|
40 |
+
"ctc_zero_infinity": false,
|
41 |
+
"do_stable_layer_norm": false,
|
42 |
+
"eos_token_id": 2,
|
43 |
+
"feat_extract_activation": "gelu",
|
44 |
+
"feat_extract_norm": "group",
|
45 |
+
"feat_proj_dropout": 0.0,
|
46 |
+
"feat_proj_layer_norm": false,
|
47 |
+
"final_dropout": 0.0,
|
48 |
+
"finetuning_task": "audio-classification",
|
49 |
+
"hidden_act": "gelu",
|
50 |
+
"hidden_dropout": 0.1,
|
51 |
+
"hidden_size": 768,
|
52 |
+
"id2label": {
|
53 |
+
"0": "crying",
|
54 |
+
"1": "no_crying"
|
55 |
+
},
|
56 |
+
"initializer_range": 0.02,
|
57 |
+
"intermediate_size": 3072,
|
58 |
+
"label2id": {
|
59 |
+
"crying": 0,
|
60 |
+
"no_crying": 1
|
61 |
+
},
|
62 |
+
"layer_norm_eps": 1e-05,
|
63 |
+
"layerdrop": 0.0,
|
64 |
+
"mask_feature_length": 10,
|
65 |
+
"mask_feature_min_masks": 0,
|
66 |
+
"mask_feature_prob": 0.0,
|
67 |
+
"mask_time_length": 10,
|
68 |
+
"mask_time_min_masks": 2,
|
69 |
+
"mask_time_prob": 0.05,
|
70 |
+
"model_type": "hubert",
|
71 |
+
"num_attention_heads": 12,
|
72 |
+
"num_conv_pos_embedding_groups": 16,
|
73 |
+
"num_conv_pos_embeddings": 128,
|
74 |
+
"num_feat_extract_layers": 7,
|
75 |
+
"num_hidden_layers": 2,
|
76 |
+
"pad_token_id": 0,
|
77 |
+
"torch_dtype": "float32",
|
78 |
+
"transformers_version": "4.44.2",
|
79 |
+
"use_weighted_layer_sum": false,
|
80 |
+
"vocab_size": 32
|
81 |
+
}
|
distilhubert-finetuned-cry-detector/checkpoint-170/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c12a1b9a24a4e6c65e2a4cfef5a14bb3968815375ff10b423d324c8475fae74a
|
3 |
+
size 94763496
|
distilhubert-finetuned-cry-detector/checkpoint-170/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:435b96196eb0ed805f14f064a35d0757c0d693014f991ba8af93c9bee59d0dbe
|
3 |
+
size 189552570
|
distilhubert-finetuned-cry-detector/checkpoint-170/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8284a213c68ebec7c890dfc113fc2b6a01af65d958e077d0ff89531cb54f031
|
3 |
+
size 14308
|
distilhubert-finetuned-cry-detector/checkpoint-170/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80195c13720277b88ef44d4298c322ee9ab935ad2c366470453549aba8f696c4
|
3 |
+
size 1064
|
distilhubert-finetuned-cry-detector/checkpoint-170/trainer_state.json
ADDED
@@ -0,0 +1,66 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": 0.9787545787545787,
|
3 |
+
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-170",
|
4 |
+
"epoch": 1.9912152269399708,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 170,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 0.9956076134699854,
|
13 |
+
"eval_accuracy": 0.9597069597069597,
|
14 |
+
"eval_f1": 0.9599836188656065,
|
15 |
+
"eval_loss": 0.12706419825553894,
|
16 |
+
"eval_precision": 0.960694098126733,
|
17 |
+
"eval_recall": 0.9597069597069597,
|
18 |
+
"eval_runtime": 6.1839,
|
19 |
+
"eval_samples_per_second": 220.733,
|
20 |
+
"eval_steps_per_second": 27.652,
|
21 |
+
"step": 85
|
22 |
+
},
|
23 |
+
{
|
24 |
+
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9787545787545787,
|
26 |
+
"eval_f1": 0.9788099592207686,
|
27 |
+
"eval_loss": 0.07009062170982361,
|
28 |
+
"eval_precision": 0.9789268917610887,
|
29 |
+
"eval_recall": 0.9787545787545787,
|
30 |
+
"eval_runtime": 6.2624,
|
31 |
+
"eval_samples_per_second": 217.969,
|
32 |
+
"eval_steps_per_second": 27.306,
|
33 |
+
"step": 170
|
34 |
+
}
|
35 |
+
],
|
36 |
+
"logging_steps": 500,
|
37 |
+
"max_steps": 510,
|
38 |
+
"num_input_tokens_seen": 0,
|
39 |
+
"num_train_epochs": 6,
|
40 |
+
"save_steps": 500,
|
41 |
+
"stateful_callbacks": {
|
42 |
+
"EarlyStoppingCallback": {
|
43 |
+
"args": {
|
44 |
+
"early_stopping_patience": 3,
|
45 |
+
"early_stopping_threshold": 0.0
|
46 |
+
},
|
47 |
+
"attributes": {
|
48 |
+
"early_stopping_patience_counter": 0
|
49 |
+
}
|
50 |
+
},
|
51 |
+
"TrainerControl": {
|
52 |
+
"args": {
|
53 |
+
"should_epoch_stop": false,
|
54 |
+
"should_evaluate": false,
|
55 |
+
"should_log": false,
|
56 |
+
"should_save": true,
|
57 |
+
"should_training_stop": false
|
58 |
+
},
|
59 |
+
"attributes": {}
|
60 |
+
}
|
61 |
+
},
|
62 |
+
"total_flos": 2.483401519872e+16,
|
63 |
+
"train_batch_size": 8,
|
64 |
+
"trial_name": null,
|
65 |
+
"trial_params": null
|
66 |
+
}
|
distilhubert-finetuned-cry-detector/checkpoint-170/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0f29e363429f3041b65000237638d975c16df70ba592fd3c2ce610392338bd3
|
3 |
+
size 5240
|
distilhubert-finetuned-cry-detector/checkpoint-256/config.json
ADDED
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "ntu-spml/distilhubert",
|
3 |
+
"activation_dropout": 0.1,
|
4 |
+
"apply_spec_augment": false,
|
5 |
+
"architectures": [
|
6 |
+
"HubertForSequenceClassification"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.1,
|
9 |
+
"bos_token_id": 1,
|
10 |
+
"classifier_proj_size": 256,
|
11 |
+
"conv_bias": false,
|
12 |
+
"conv_dim": [
|
13 |
+
512,
|
14 |
+
512,
|
15 |
+
512,
|
16 |
+
512,
|
17 |
+
512,
|
18 |
+
512,
|
19 |
+
512
|
20 |
+
],
|
21 |
+
"conv_kernel": [
|
22 |
+
10,
|
23 |
+
3,
|
24 |
+
3,
|
25 |
+
3,
|
26 |
+
3,
|
27 |
+
2,
|
28 |
+
2
|
29 |
+
],
|
30 |
+
"conv_stride": [
|
31 |
+
5,
|
32 |
+
2,
|
33 |
+
2,
|
34 |
+
2,
|
35 |
+
2,
|
36 |
+
2,
|
37 |
+
2
|
38 |
+
],
|
39 |
+
"ctc_loss_reduction": "sum",
|
40 |
+
"ctc_zero_infinity": false,
|
41 |
+
"do_stable_layer_norm": false,
|
42 |
+
"eos_token_id": 2,
|
43 |
+
"feat_extract_activation": "gelu",
|
44 |
+
"feat_extract_norm": "group",
|
45 |
+
"feat_proj_dropout": 0.0,
|
46 |
+
"feat_proj_layer_norm": false,
|
47 |
+
"final_dropout": 0.0,
|
48 |
+
"finetuning_task": "audio-classification",
|
49 |
+
"hidden_act": "gelu",
|
50 |
+
"hidden_dropout": 0.1,
|
51 |
+
"hidden_size": 768,
|
52 |
+
"id2label": {
|
53 |
+
"0": "crying",
|
54 |
+
"1": "no_crying"
|
55 |
+
},
|
56 |
+
"initializer_range": 0.02,
|
57 |
+
"intermediate_size": 3072,
|
58 |
+
"label2id": {
|
59 |
+
"crying": 0,
|
60 |
+
"no_crying": 1
|
61 |
+
},
|
62 |
+
"layer_norm_eps": 1e-05,
|
63 |
+
"layerdrop": 0.0,
|
64 |
+
"mask_feature_length": 10,
|
65 |
+
"mask_feature_min_masks": 0,
|
66 |
+
"mask_feature_prob": 0.0,
|
67 |
+
"mask_time_length": 10,
|
68 |
+
"mask_time_min_masks": 2,
|
69 |
+
"mask_time_prob": 0.05,
|
70 |
+
"model_type": "hubert",
|
71 |
+
"num_attention_heads": 12,
|
72 |
+
"num_conv_pos_embedding_groups": 16,
|
73 |
+
"num_conv_pos_embeddings": 128,
|
74 |
+
"num_feat_extract_layers": 7,
|
75 |
+
"num_hidden_layers": 2,
|
76 |
+
"pad_token_id": 0,
|
77 |
+
"torch_dtype": "float32",
|
78 |
+
"transformers_version": "4.44.2",
|
79 |
+
"use_weighted_layer_sum": false,
|
80 |
+
"vocab_size": 32
|
81 |
+
}
|
distilhubert-finetuned-cry-detector/checkpoint-256/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ae93606e0068417987c861ef701d781fdc293c56822885b321b538499e3ed9f
|
3 |
+
size 94763496
|
distilhubert-finetuned-cry-detector/checkpoint-256/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68055f1bc468b50d717af19d82688b5760436263325799749b5a24328beeda08
|
3 |
+
size 189552570
|
distilhubert-finetuned-cry-detector/checkpoint-256/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0eb65cebf665d8f9d6639246c9118d47b498a1653a2714b80f3ab7cf865354d2
|
3 |
+
size 14308
|
distilhubert-finetuned-cry-detector/checkpoint-256/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c9f438092711eef2a53f839a45eb7a09d5325f42278d87a60fc53d358b3a04a
|
3 |
+
size 1064
|
distilhubert-finetuned-cry-detector/checkpoint-256/trainer_state.json
ADDED
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": 0.9831501831501831,
|
3 |
+
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-256",
|
4 |
+
"epoch": 2.998535871156662,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 256,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 0.9956076134699854,
|
13 |
+
"eval_accuracy": 0.9597069597069597,
|
14 |
+
"eval_f1": 0.9599836188656065,
|
15 |
+
"eval_loss": 0.12706419825553894,
|
16 |
+
"eval_precision": 0.960694098126733,
|
17 |
+
"eval_recall": 0.9597069597069597,
|
18 |
+
"eval_runtime": 6.1839,
|
19 |
+
"eval_samples_per_second": 220.733,
|
20 |
+
"eval_steps_per_second": 27.652,
|
21 |
+
"step": 85
|
22 |
+
},
|
23 |
+
{
|
24 |
+
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9787545787545787,
|
26 |
+
"eval_f1": 0.9788099592207686,
|
27 |
+
"eval_loss": 0.07009062170982361,
|
28 |
+
"eval_precision": 0.9789268917610887,
|
29 |
+
"eval_recall": 0.9787545787545787,
|
30 |
+
"eval_runtime": 6.2624,
|
31 |
+
"eval_samples_per_second": 217.969,
|
32 |
+
"eval_steps_per_second": 27.306,
|
33 |
+
"step": 170
|
34 |
+
},
|
35 |
+
{
|
36 |
+
"epoch": 2.998535871156662,
|
37 |
+
"eval_accuracy": 0.9831501831501831,
|
38 |
+
"eval_f1": 0.9831941055888854,
|
39 |
+
"eval_loss": 0.06720960885286331,
|
40 |
+
"eval_precision": 0.9832999772248476,
|
41 |
+
"eval_recall": 0.9831501831501831,
|
42 |
+
"eval_runtime": 5.9845,
|
43 |
+
"eval_samples_per_second": 228.09,
|
44 |
+
"eval_steps_per_second": 28.574,
|
45 |
+
"step": 256
|
46 |
+
}
|
47 |
+
],
|
48 |
+
"logging_steps": 500,
|
49 |
+
"max_steps": 510,
|
50 |
+
"num_input_tokens_seen": 0,
|
51 |
+
"num_train_epochs": 6,
|
52 |
+
"save_steps": 500,
|
53 |
+
"stateful_callbacks": {
|
54 |
+
"EarlyStoppingCallback": {
|
55 |
+
"args": {
|
56 |
+
"early_stopping_patience": 3,
|
57 |
+
"early_stopping_threshold": 0.0
|
58 |
+
},
|
59 |
+
"attributes": {
|
60 |
+
"early_stopping_patience_counter": 0
|
61 |
+
}
|
62 |
+
},
|
63 |
+
"TrainerControl": {
|
64 |
+
"args": {
|
65 |
+
"should_epoch_stop": false,
|
66 |
+
"should_evaluate": false,
|
67 |
+
"should_log": false,
|
68 |
+
"should_save": true,
|
69 |
+
"should_training_stop": false
|
70 |
+
},
|
71 |
+
"attributes": {}
|
72 |
+
}
|
73 |
+
},
|
74 |
+
"total_flos": 3.725102279808e+16,
|
75 |
+
"train_batch_size": 8,
|
76 |
+
"trial_name": null,
|
77 |
+
"trial_params": null
|
78 |
+
}
|
distilhubert-finetuned-cry-detector/checkpoint-256/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0f29e363429f3041b65000237638d975c16df70ba592fd3c2ce610392338bd3
|
3 |
+
size 5240
|
distilhubert-finetuned-cry-detector/checkpoint-341/config.json
ADDED
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "ntu-spml/distilhubert",
|
3 |
+
"activation_dropout": 0.1,
|
4 |
+
"apply_spec_augment": false,
|
5 |
+
"architectures": [
|
6 |
+
"HubertForSequenceClassification"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.1,
|
9 |
+
"bos_token_id": 1,
|
10 |
+
"classifier_proj_size": 256,
|
11 |
+
"conv_bias": false,
|
12 |
+
"conv_dim": [
|
13 |
+
512,
|
14 |
+
512,
|
15 |
+
512,
|
16 |
+
512,
|
17 |
+
512,
|
18 |
+
512,
|
19 |
+
512
|
20 |
+
],
|
21 |
+
"conv_kernel": [
|
22 |
+
10,
|
23 |
+
3,
|
24 |
+
3,
|
25 |
+
3,
|
26 |
+
3,
|
27 |
+
2,
|
28 |
+
2
|
29 |
+
],
|
30 |
+
"conv_stride": [
|
31 |
+
5,
|
32 |
+
2,
|
33 |
+
2,
|
34 |
+
2,
|
35 |
+
2,
|
36 |
+
2,
|
37 |
+
2
|
38 |
+
],
|
39 |
+
"ctc_loss_reduction": "sum",
|
40 |
+
"ctc_zero_infinity": false,
|
41 |
+
"do_stable_layer_norm": false,
|
42 |
+
"eos_token_id": 2,
|
43 |
+
"feat_extract_activation": "gelu",
|
44 |
+
"feat_extract_norm": "group",
|
45 |
+
"feat_proj_dropout": 0.0,
|
46 |
+
"feat_proj_layer_norm": false,
|
47 |
+
"final_dropout": 0.0,
|
48 |
+
"finetuning_task": "audio-classification",
|
49 |
+
"hidden_act": "gelu",
|
50 |
+
"hidden_dropout": 0.1,
|
51 |
+
"hidden_size": 768,
|
52 |
+
"id2label": {
|
53 |
+
"0": "crying",
|
54 |
+
"1": "no_crying"
|
55 |
+
},
|
56 |
+
"initializer_range": 0.02,
|
57 |
+
"intermediate_size": 3072,
|
58 |
+
"label2id": {
|
59 |
+
"crying": 0,
|
60 |
+
"no_crying": 1
|
61 |
+
},
|
62 |
+
"layer_norm_eps": 1e-05,
|
63 |
+
"layerdrop": 0.0,
|
64 |
+
"mask_feature_length": 10,
|
65 |
+
"mask_feature_min_masks": 0,
|
66 |
+
"mask_feature_prob": 0.0,
|
67 |
+
"mask_time_length": 10,
|
68 |
+
"mask_time_min_masks": 2,
|
69 |
+
"mask_time_prob": 0.05,
|
70 |
+
"model_type": "hubert",
|
71 |
+
"num_attention_heads": 12,
|
72 |
+
"num_conv_pos_embedding_groups": 16,
|
73 |
+
"num_conv_pos_embeddings": 128,
|
74 |
+
"num_feat_extract_layers": 7,
|
75 |
+
"num_hidden_layers": 2,
|
76 |
+
"pad_token_id": 0,
|
77 |
+
"torch_dtype": "float32",
|
78 |
+
"transformers_version": "4.44.2",
|
79 |
+
"use_weighted_layer_sum": false,
|
80 |
+
"vocab_size": 32
|
81 |
+
}
|
distilhubert-finetuned-cry-detector/checkpoint-341/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7944ecc75fe28e156d4c1967e013e12ebf361ba4a1e84d569b5656c10cbbf99f
|
3 |
+
size 94763496
|
distilhubert-finetuned-cry-detector/checkpoint-341/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ea12d3536b65dc14e8f5d189dcebc6f55fd60a564653f1c462a9b8fd994950d
|
3 |
+
size 189552570
|
distilhubert-finetuned-cry-detector/checkpoint-341/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:536f0fc323ef01dfbff60019f8668ef49478dbb6c4c93f5f8458a58aa887a7ac
|
3 |
+
size 14308
|
distilhubert-finetuned-cry-detector/checkpoint-341/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:370ad1e402d1e5afefc57f92c683bc92a503cf91bcf53776012b25e1805f62fc
|
3 |
+
size 1064
|
distilhubert-finetuned-cry-detector/checkpoint-341/trainer_state.json
ADDED
@@ -0,0 +1,90 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": 0.991941391941392,
|
3 |
+
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
|
4 |
+
"epoch": 3.994143484626647,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 341,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 0.9956076134699854,
|
13 |
+
"eval_accuracy": 0.9597069597069597,
|
14 |
+
"eval_f1": 0.9599836188656065,
|
15 |
+
"eval_loss": 0.12706419825553894,
|
16 |
+
"eval_precision": 0.960694098126733,
|
17 |
+
"eval_recall": 0.9597069597069597,
|
18 |
+
"eval_runtime": 6.1839,
|
19 |
+
"eval_samples_per_second": 220.733,
|
20 |
+
"eval_steps_per_second": 27.652,
|
21 |
+
"step": 85
|
22 |
+
},
|
23 |
+
{
|
24 |
+
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9787545787545787,
|
26 |
+
"eval_f1": 0.9788099592207686,
|
27 |
+
"eval_loss": 0.07009062170982361,
|
28 |
+
"eval_precision": 0.9789268917610887,
|
29 |
+
"eval_recall": 0.9787545787545787,
|
30 |
+
"eval_runtime": 6.2624,
|
31 |
+
"eval_samples_per_second": 217.969,
|
32 |
+
"eval_steps_per_second": 27.306,
|
33 |
+
"step": 170
|
34 |
+
},
|
35 |
+
{
|
36 |
+
"epoch": 2.998535871156662,
|
37 |
+
"eval_accuracy": 0.9831501831501831,
|
38 |
+
"eval_f1": 0.9831941055888854,
|
39 |
+
"eval_loss": 0.06720960885286331,
|
40 |
+
"eval_precision": 0.9832999772248476,
|
41 |
+
"eval_recall": 0.9831501831501831,
|
42 |
+
"eval_runtime": 5.9845,
|
43 |
+
"eval_samples_per_second": 228.09,
|
44 |
+
"eval_steps_per_second": 28.574,
|
45 |
+
"step": 256
|
46 |
+
},
|
47 |
+
{
|
48 |
+
"epoch": 3.994143484626647,
|
49 |
+
"eval_accuracy": 0.991941391941392,
|
50 |
+
"eval_f1": 0.9919444380146174,
|
51 |
+
"eval_loss": 0.04145079106092453,
|
52 |
+
"eval_precision": 0.9919487758943655,
|
53 |
+
"eval_recall": 0.991941391941392,
|
54 |
+
"eval_runtime": 6.1222,
|
55 |
+
"eval_samples_per_second": 222.958,
|
56 |
+
"eval_steps_per_second": 27.931,
|
57 |
+
"step": 341
|
58 |
+
}
|
59 |
+
],
|
60 |
+
"logging_steps": 500,
|
61 |
+
"max_steps": 510,
|
62 |
+
"num_input_tokens_seen": 0,
|
63 |
+
"num_train_epochs": 6,
|
64 |
+
"save_steps": 500,
|
65 |
+
"stateful_callbacks": {
|
66 |
+
"EarlyStoppingCallback": {
|
67 |
+
"args": {
|
68 |
+
"early_stopping_patience": 3,
|
69 |
+
"early_stopping_threshold": 0.0
|
70 |
+
},
|
71 |
+
"attributes": {
|
72 |
+
"early_stopping_patience_counter": 0
|
73 |
+
}
|
74 |
+
},
|
75 |
+
"TrainerControl": {
|
76 |
+
"args": {
|
77 |
+
"should_epoch_stop": false,
|
78 |
+
"should_evaluate": false,
|
79 |
+
"should_log": false,
|
80 |
+
"should_save": true,
|
81 |
+
"should_training_stop": false
|
82 |
+
},
|
83 |
+
"attributes": {}
|
84 |
+
}
|
85 |
+
},
|
86 |
+
"total_flos": 4.966803039744e+16,
|
87 |
+
"train_batch_size": 8,
|
88 |
+
"trial_name": null,
|
89 |
+
"trial_params": null
|
90 |
+
}
|
distilhubert-finetuned-cry-detector/checkpoint-341/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0f29e363429f3041b65000237638d975c16df70ba592fd3c2ce610392338bd3
|
3 |
+
size 5240
|
distilhubert-finetuned-cry-detector/checkpoint-426/config.json
ADDED
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "ntu-spml/distilhubert",
|
3 |
+
"activation_dropout": 0.1,
|
4 |
+
"apply_spec_augment": false,
|
5 |
+
"architectures": [
|
6 |
+
"HubertForSequenceClassification"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.1,
|
9 |
+
"bos_token_id": 1,
|
10 |
+
"classifier_proj_size": 256,
|
11 |
+
"conv_bias": false,
|
12 |
+
"conv_dim": [
|
13 |
+
512,
|
14 |
+
512,
|
15 |
+
512,
|
16 |
+
512,
|
17 |
+
512,
|
18 |
+
512,
|
19 |
+
512
|
20 |
+
],
|
21 |
+
"conv_kernel": [
|
22 |
+
10,
|
23 |
+
3,
|
24 |
+
3,
|
25 |
+
3,
|
26 |
+
3,
|
27 |
+
2,
|
28 |
+
2
|
29 |
+
],
|
30 |
+
"conv_stride": [
|
31 |
+
5,
|
32 |
+
2,
|
33 |
+
2,
|
34 |
+
2,
|
35 |
+
2,
|
36 |
+
2,
|
37 |
+
2
|
38 |
+
],
|
39 |
+
"ctc_loss_reduction": "sum",
|
40 |
+
"ctc_zero_infinity": false,
|
41 |
+
"do_stable_layer_norm": false,
|
42 |
+
"eos_token_id": 2,
|
43 |
+
"feat_extract_activation": "gelu",
|
44 |
+
"feat_extract_norm": "group",
|
45 |
+
"feat_proj_dropout": 0.0,
|
46 |
+
"feat_proj_layer_norm": false,
|
47 |
+
"final_dropout": 0.0,
|
48 |
+
"finetuning_task": "audio-classification",
|
49 |
+
"hidden_act": "gelu",
|
50 |
+
"hidden_dropout": 0.1,
|
51 |
+
"hidden_size": 768,
|
52 |
+
"id2label": {
|
53 |
+
"0": "crying",
|
54 |
+
"1": "no_crying"
|
55 |
+
},
|
56 |
+
"initializer_range": 0.02,
|
57 |
+
"intermediate_size": 3072,
|
58 |
+
"label2id": {
|
59 |
+
"crying": 0,
|
60 |
+
"no_crying": 1
|
61 |
+
},
|
62 |
+
"layer_norm_eps": 1e-05,
|
63 |
+
"layerdrop": 0.0,
|
64 |
+
"mask_feature_length": 10,
|
65 |
+
"mask_feature_min_masks": 0,
|
66 |
+
"mask_feature_prob": 0.0,
|
67 |
+
"mask_time_length": 10,
|
68 |
+
"mask_time_min_masks": 2,
|
69 |
+
"mask_time_prob": 0.05,
|
70 |
+
"model_type": "hubert",
|
71 |
+
"num_attention_heads": 12,
|
72 |
+
"num_conv_pos_embedding_groups": 16,
|
73 |
+
"num_conv_pos_embeddings": 128,
|
74 |
+
"num_feat_extract_layers": 7,
|
75 |
+
"num_hidden_layers": 2,
|
76 |
+
"pad_token_id": 0,
|
77 |
+
"torch_dtype": "float32",
|
78 |
+
"transformers_version": "4.44.2",
|
79 |
+
"use_weighted_layer_sum": false,
|
80 |
+
"vocab_size": 32
|
81 |
+
}
|
distilhubert-finetuned-cry-detector/checkpoint-426/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ccd0853b18fcef29f6c50370c40938c3fc157e6d6ab4f5a8cc0ee4de4c2a330
|
3 |
+
size 94763496
|
distilhubert-finetuned-cry-detector/checkpoint-426/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58cf1896c9f8575d9e790921f864e581859c2dd6014460c20f2981f52787a4a4
|
3 |
+
size 189552570
|
distilhubert-finetuned-cry-detector/checkpoint-426/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67844b2b0357256b4d8649897b9ffa4d435413091b8757335f941cac6b60c370
|
3 |
+
size 14308
|
distilhubert-finetuned-cry-detector/checkpoint-426/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77da8d31fe5105cdaffd1de28e960ad7041d43ef167667465d3bd1e966ae27b0
|
3 |
+
size 1064
|
distilhubert-finetuned-cry-detector/checkpoint-426/trainer_state.json
ADDED
@@ -0,0 +1,102 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": 0.991941391941392,
|
3 |
+
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
|
4 |
+
"epoch": 4.989751098096632,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 426,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 0.9956076134699854,
|
13 |
+
"eval_accuracy": 0.9597069597069597,
|
14 |
+
"eval_f1": 0.9599836188656065,
|
15 |
+
"eval_loss": 0.12706419825553894,
|
16 |
+
"eval_precision": 0.960694098126733,
|
17 |
+
"eval_recall": 0.9597069597069597,
|
18 |
+
"eval_runtime": 6.1839,
|
19 |
+
"eval_samples_per_second": 220.733,
|
20 |
+
"eval_steps_per_second": 27.652,
|
21 |
+
"step": 85
|
22 |
+
},
|
23 |
+
{
|
24 |
+
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9787545787545787,
|
26 |
+
"eval_f1": 0.9788099592207686,
|
27 |
+
"eval_loss": 0.07009062170982361,
|
28 |
+
"eval_precision": 0.9789268917610887,
|
29 |
+
"eval_recall": 0.9787545787545787,
|
30 |
+
"eval_runtime": 6.2624,
|
31 |
+
"eval_samples_per_second": 217.969,
|
32 |
+
"eval_steps_per_second": 27.306,
|
33 |
+
"step": 170
|
34 |
+
},
|
35 |
+
{
|
36 |
+
"epoch": 2.998535871156662,
|
37 |
+
"eval_accuracy": 0.9831501831501831,
|
38 |
+
"eval_f1": 0.9831941055888854,
|
39 |
+
"eval_loss": 0.06720960885286331,
|
40 |
+
"eval_precision": 0.9832999772248476,
|
41 |
+
"eval_recall": 0.9831501831501831,
|
42 |
+
"eval_runtime": 5.9845,
|
43 |
+
"eval_samples_per_second": 228.09,
|
44 |
+
"eval_steps_per_second": 28.574,
|
45 |
+
"step": 256
|
46 |
+
},
|
47 |
+
{
|
48 |
+
"epoch": 3.994143484626647,
|
49 |
+
"eval_accuracy": 0.991941391941392,
|
50 |
+
"eval_f1": 0.9919444380146174,
|
51 |
+
"eval_loss": 0.04145079106092453,
|
52 |
+
"eval_precision": 0.9919487758943655,
|
53 |
+
"eval_recall": 0.991941391941392,
|
54 |
+
"eval_runtime": 6.1222,
|
55 |
+
"eval_samples_per_second": 222.958,
|
56 |
+
"eval_steps_per_second": 27.931,
|
57 |
+
"step": 341
|
58 |
+
},
|
59 |
+
{
|
60 |
+
"epoch": 4.989751098096632,
|
61 |
+
"eval_accuracy": 0.991941391941392,
|
62 |
+
"eval_f1": 0.9919444380146174,
|
63 |
+
"eval_loss": 0.037522196769714355,
|
64 |
+
"eval_precision": 0.9919487758943655,
|
65 |
+
"eval_recall": 0.991941391941392,
|
66 |
+
"eval_runtime": 6.1601,
|
67 |
+
"eval_samples_per_second": 221.586,
|
68 |
+
"eval_steps_per_second": 27.759,
|
69 |
+
"step": 426
|
70 |
+
}
|
71 |
+
],
|
72 |
+
"logging_steps": 500,
|
73 |
+
"max_steps": 510,
|
74 |
+
"num_input_tokens_seen": 0,
|
75 |
+
"num_train_epochs": 6,
|
76 |
+
"save_steps": 500,
|
77 |
+
"stateful_callbacks": {
|
78 |
+
"EarlyStoppingCallback": {
|
79 |
+
"args": {
|
80 |
+
"early_stopping_patience": 3,
|
81 |
+
"early_stopping_threshold": 0.0
|
82 |
+
},
|
83 |
+
"attributes": {
|
84 |
+
"early_stopping_patience_counter": 0
|
85 |
+
}
|
86 |
+
},
|
87 |
+
"TrainerControl": {
|
88 |
+
"args": {
|
89 |
+
"should_epoch_stop": false,
|
90 |
+
"should_evaluate": false,
|
91 |
+
"should_log": false,
|
92 |
+
"should_save": true,
|
93 |
+
"should_training_stop": false
|
94 |
+
},
|
95 |
+
"attributes": {}
|
96 |
+
}
|
97 |
+
},
|
98 |
+
"total_flos": 6.20850379968e+16,
|
99 |
+
"train_batch_size": 8,
|
100 |
+
"trial_name": null,
|
101 |
+
"trial_params": null
|
102 |
+
}
|
distilhubert-finetuned-cry-detector/checkpoint-426/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0f29e363429f3041b65000237638d975c16df70ba592fd3c2ce610392338bd3
|
3 |
+
size 5240
|
distilhubert-finetuned-cry-detector/checkpoint-510/config.json
ADDED
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "ntu-spml/distilhubert",
|
3 |
+
"activation_dropout": 0.1,
|
4 |
+
"apply_spec_augment": false,
|
5 |
+
"architectures": [
|
6 |
+
"HubertForSequenceClassification"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.1,
|
9 |
+
"bos_token_id": 1,
|
10 |
+
"classifier_proj_size": 256,
|
11 |
+
"conv_bias": false,
|
12 |
+
"conv_dim": [
|
13 |
+
512,
|
14 |
+
512,
|
15 |
+
512,
|
16 |
+
512,
|
17 |
+
512,
|
18 |
+
512,
|
19 |
+
512
|
20 |
+
],
|
21 |
+
"conv_kernel": [
|
22 |
+
10,
|
23 |
+
3,
|
24 |
+
3,
|
25 |
+
3,
|
26 |
+
3,
|
27 |
+
2,
|
28 |
+
2
|
29 |
+
],
|
30 |
+
"conv_stride": [
|
31 |
+
5,
|
32 |
+
2,
|
33 |
+
2,
|
34 |
+
2,
|
35 |
+
2,
|
36 |
+
2,
|
37 |
+
2
|
38 |
+
],
|
39 |
+
"ctc_loss_reduction": "sum",
|
40 |
+
"ctc_zero_infinity": false,
|
41 |
+
"do_stable_layer_norm": false,
|
42 |
+
"eos_token_id": 2,
|
43 |
+
"feat_extract_activation": "gelu",
|
44 |
+
"feat_extract_norm": "group",
|
45 |
+
"feat_proj_dropout": 0.0,
|
46 |
+
"feat_proj_layer_norm": false,
|
47 |
+
"final_dropout": 0.0,
|
48 |
+
"finetuning_task": "audio-classification",
|
49 |
+
"hidden_act": "gelu",
|
50 |
+
"hidden_dropout": 0.1,
|
51 |
+
"hidden_size": 768,
|
52 |
+
"id2label": {
|
53 |
+
"0": "crying",
|
54 |
+
"1": "no_crying"
|
55 |
+
},
|
56 |
+
"initializer_range": 0.02,
|
57 |
+
"intermediate_size": 3072,
|
58 |
+
"label2id": {
|
59 |
+
"crying": 0,
|
60 |
+
"no_crying": 1
|
61 |
+
},
|
62 |
+
"layer_norm_eps": 1e-05,
|
63 |
+
"layerdrop": 0.0,
|
64 |
+
"mask_feature_length": 10,
|
65 |
+
"mask_feature_min_masks": 0,
|
66 |
+
"mask_feature_prob": 0.0,
|
67 |
+
"mask_time_length": 10,
|
68 |
+
"mask_time_min_masks": 2,
|
69 |
+
"mask_time_prob": 0.05,
|
70 |
+
"model_type": "hubert",
|
71 |
+
"num_attention_heads": 12,
|
72 |
+
"num_conv_pos_embedding_groups": 16,
|
73 |
+
"num_conv_pos_embeddings": 128,
|
74 |
+
"num_feat_extract_layers": 7,
|
75 |
+
"num_hidden_layers": 2,
|
76 |
+
"pad_token_id": 0,
|
77 |
+
"torch_dtype": "float32",
|
78 |
+
"transformers_version": "4.44.2",
|
79 |
+
"use_weighted_layer_sum": false,
|
80 |
+
"vocab_size": 32
|
81 |
+
}
|
distilhubert-finetuned-cry-detector/checkpoint-510/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4372169de69c47d33397222523009d2fdeed9d3854c7375e8590a1241949291d
|
3 |
+
size 94763496
|
distilhubert-finetuned-cry-detector/checkpoint-510/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:294fd84ccb3eb4e7c39baaa641e3c8f3ea74bdf3b1a46a34208e1257b56d0054
|
3 |
+
size 189552570
|
distilhubert-finetuned-cry-detector/checkpoint-510/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cc7449d67ace31a2b3ec5d56092754753743418fdab51384b92915bdf832f21
|
3 |
+
size 14308
|
distilhubert-finetuned-cry-detector/checkpoint-510/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c10e0f825c3d4b6dffd76325c743990d99721ef8a75e18bb498ded17f46b6918
|
3 |
+
size 1064
|
distilhubert-finetuned-cry-detector/checkpoint-510/trainer_state.json
ADDED
@@ -0,0 +1,121 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": 0.991941391941392,
|
3 |
+
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
|
4 |
+
"epoch": 5.973645680819912,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 510,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 0.9956076134699854,
|
13 |
+
"eval_accuracy": 0.9597069597069597,
|
14 |
+
"eval_f1": 0.9599836188656065,
|
15 |
+
"eval_loss": 0.12706419825553894,
|
16 |
+
"eval_precision": 0.960694098126733,
|
17 |
+
"eval_recall": 0.9597069597069597,
|
18 |
+
"eval_runtime": 6.1839,
|
19 |
+
"eval_samples_per_second": 220.733,
|
20 |
+
"eval_steps_per_second": 27.652,
|
21 |
+
"step": 85
|
22 |
+
},
|
23 |
+
{
|
24 |
+
"epoch": 1.9912152269399708,
|
25 |
+
"eval_accuracy": 0.9787545787545787,
|
26 |
+
"eval_f1": 0.9788099592207686,
|
27 |
+
"eval_loss": 0.07009062170982361,
|
28 |
+
"eval_precision": 0.9789268917610887,
|
29 |
+
"eval_recall": 0.9787545787545787,
|
30 |
+
"eval_runtime": 6.2624,
|
31 |
+
"eval_samples_per_second": 217.969,
|
32 |
+
"eval_steps_per_second": 27.306,
|
33 |
+
"step": 170
|
34 |
+
},
|
35 |
+
{
|
36 |
+
"epoch": 2.998535871156662,
|
37 |
+
"eval_accuracy": 0.9831501831501831,
|
38 |
+
"eval_f1": 0.9831941055888854,
|
39 |
+
"eval_loss": 0.06720960885286331,
|
40 |
+
"eval_precision": 0.9832999772248476,
|
41 |
+
"eval_recall": 0.9831501831501831,
|
42 |
+
"eval_runtime": 5.9845,
|
43 |
+
"eval_samples_per_second": 228.09,
|
44 |
+
"eval_steps_per_second": 28.574,
|
45 |
+
"step": 256
|
46 |
+
},
|
47 |
+
{
|
48 |
+
"epoch": 3.994143484626647,
|
49 |
+
"eval_accuracy": 0.991941391941392,
|
50 |
+
"eval_f1": 0.9919444380146174,
|
51 |
+
"eval_loss": 0.04145079106092453,
|
52 |
+
"eval_precision": 0.9919487758943655,
|
53 |
+
"eval_recall": 0.991941391941392,
|
54 |
+
"eval_runtime": 6.1222,
|
55 |
+
"eval_samples_per_second": 222.958,
|
56 |
+
"eval_steps_per_second": 27.931,
|
57 |
+
"step": 341
|
58 |
+
},
|
59 |
+
{
|
60 |
+
"epoch": 4.989751098096632,
|
61 |
+
"eval_accuracy": 0.991941391941392,
|
62 |
+
"eval_f1": 0.9919444380146174,
|
63 |
+
"eval_loss": 0.037522196769714355,
|
64 |
+
"eval_precision": 0.9919487758943655,
|
65 |
+
"eval_recall": 0.991941391941392,
|
66 |
+
"eval_runtime": 6.1601,
|
67 |
+
"eval_samples_per_second": 221.586,
|
68 |
+
"eval_steps_per_second": 27.759,
|
69 |
+
"step": 426
|
70 |
+
},
|
71 |
+
{
|
72 |
+
"epoch": 5.856515373352855,
|
73 |
+
"grad_norm": 0.05031043663620949,
|
74 |
+
"learning_rate": 9.520643773712201e-08,
|
75 |
+
"loss": 0.056,
|
76 |
+
"step": 500
|
77 |
+
},
|
78 |
+
{
|
79 |
+
"epoch": 5.973645680819912,
|
80 |
+
"eval_accuracy": 0.991941391941392,
|
81 |
+
"eval_f1": 0.9919444380146174,
|
82 |
+
"eval_loss": 0.037607260048389435,
|
83 |
+
"eval_precision": 0.9919487758943655,
|
84 |
+
"eval_recall": 0.991941391941392,
|
85 |
+
"eval_runtime": 6.0461,
|
86 |
+
"eval_samples_per_second": 225.765,
|
87 |
+
"eval_steps_per_second": 28.283,
|
88 |
+
"step": 510
|
89 |
+
}
|
90 |
+
],
|
91 |
+
"logging_steps": 500,
|
92 |
+
"max_steps": 510,
|
93 |
+
"num_input_tokens_seen": 0,
|
94 |
+
"num_train_epochs": 6,
|
95 |
+
"save_steps": 500,
|
96 |
+
"stateful_callbacks": {
|
97 |
+
"EarlyStoppingCallback": {
|
98 |
+
"args": {
|
99 |
+
"early_stopping_patience": 3,
|
100 |
+
"early_stopping_threshold": 0.0
|
101 |
+
},
|
102 |
+
"attributes": {
|
103 |
+
"early_stopping_patience_counter": 0
|
104 |
+
}
|
105 |
+
},
|
106 |
+
"TrainerControl": {
|
107 |
+
"args": {
|
108 |
+
"should_epoch_stop": false,
|
109 |
+
"should_evaluate": false,
|
110 |
+
"should_log": false,
|
111 |
+
"should_save": true,
|
112 |
+
"should_training_stop": true
|
113 |
+
},
|
114 |
+
"attributes": {}
|
115 |
+
}
|
116 |
+
},
|
117 |
+
"total_flos": 7.418366078592e+16,
|
118 |
+
"train_batch_size": 8,
|
119 |
+
"trial_name": null,
|
120 |
+
"trial_params": null
|
121 |
+
}
|
distilhubert-finetuned-cry-detector/checkpoint-510/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0f29e363429f3041b65000237638d975c16df70ba592fd3c2ce610392338bd3
|
3 |
+
size 5240
|
distilhubert-finetuned-cry-detector/checkpoint-85/config.json
ADDED
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "ntu-spml/distilhubert",
|
3 |
+
"activation_dropout": 0.1,
|
4 |
+
"apply_spec_augment": false,
|
5 |
+
"architectures": [
|
6 |
+
"HubertForSequenceClassification"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.1,
|
9 |
+
"bos_token_id": 1,
|
10 |
+
"classifier_proj_size": 256,
|
11 |
+
"conv_bias": false,
|
12 |
+
"conv_dim": [
|
13 |
+
512,
|
14 |
+
512,
|
15 |
+
512,
|
16 |
+
512,
|
17 |
+
512,
|
18 |
+
512,
|
19 |
+
512
|
20 |
+
],
|
21 |
+
"conv_kernel": [
|
22 |
+
10,
|
23 |
+
3,
|
24 |
+
3,
|
25 |
+
3,
|
26 |
+
3,
|
27 |
+
2,
|
28 |
+
2
|
29 |
+
],
|
30 |
+
"conv_stride": [
|
31 |
+
5,
|
32 |
+
2,
|
33 |
+
2,
|
34 |
+
2,
|
35 |
+
2,
|
36 |
+
2,
|
37 |
+
2
|
38 |
+
],
|
39 |
+
"ctc_loss_reduction": "sum",
|
40 |
+
"ctc_zero_infinity": false,
|
41 |
+
"do_stable_layer_norm": false,
|
42 |
+
"eos_token_id": 2,
|
43 |
+
"feat_extract_activation": "gelu",
|
44 |
+
"feat_extract_norm": "group",
|
45 |
+
"feat_proj_dropout": 0.0,
|
46 |
+
"feat_proj_layer_norm": false,
|
47 |
+
"final_dropout": 0.0,
|
48 |
+
"finetuning_task": "audio-classification",
|
49 |
+
"hidden_act": "gelu",
|
50 |
+
"hidden_dropout": 0.1,
|
51 |
+
"hidden_size": 768,
|
52 |
+
"id2label": {
|
53 |
+
"0": "crying",
|
54 |
+
"1": "no_crying"
|
55 |
+
},
|
56 |
+
"initializer_range": 0.02,
|
57 |
+
"intermediate_size": 3072,
|
58 |
+
"label2id": {
|
59 |
+
"crying": 0,
|
60 |
+
"no_crying": 1
|
61 |
+
},
|
62 |
+
"layer_norm_eps": 1e-05,
|
63 |
+
"layerdrop": 0.0,
|
64 |
+
"mask_feature_length": 10,
|
65 |
+
"mask_feature_min_masks": 0,
|
66 |
+
"mask_feature_prob": 0.0,
|
67 |
+
"mask_time_length": 10,
|
68 |
+
"mask_time_min_masks": 2,
|
69 |
+
"mask_time_prob": 0.05,
|
70 |
+
"model_type": "hubert",
|
71 |
+
"num_attention_heads": 12,
|
72 |
+
"num_conv_pos_embedding_groups": 16,
|
73 |
+
"num_conv_pos_embeddings": 128,
|
74 |
+
"num_feat_extract_layers": 7,
|
75 |
+
"num_hidden_layers": 2,
|
76 |
+
"pad_token_id": 0,
|
77 |
+
"torch_dtype": "float32",
|
78 |
+
"transformers_version": "4.44.2",
|
79 |
+
"use_weighted_layer_sum": false,
|
80 |
+
"vocab_size": 32
|
81 |
+
}
|
distilhubert-finetuned-cry-detector/checkpoint-85/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25b5dedf2a772cebe9534bac9b4f4b2cae3c78d018c5e1a5a81305bf2945ebd1
|
3 |
+
size 94763496
|
distilhubert-finetuned-cry-detector/checkpoint-85/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c71f3df5c54a5867dc09782b6116eb9a8f338591753dc3c3c099a4abc235053a
|
3 |
+
size 189552570
|
distilhubert-finetuned-cry-detector/checkpoint-85/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74e1c11b94b090a41a3c1ccee3afde4077ab65e935c7dfa8559b5a7860ed3169
|
3 |
+
size 14308
|
distilhubert-finetuned-cry-detector/checkpoint-85/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33e2a8e76399fe02fb40c65ecf028aa55e02ca8e63c8cb6c0fbb6115c6f4d731
|
3 |
+
size 1064
|
distilhubert-finetuned-cry-detector/checkpoint-85/trainer_state.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": 0.9597069597069597,
|
3 |
+
"best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-85",
|
4 |
+
"epoch": 0.9956076134699854,
|
5 |
+
"eval_steps": 500,
|
6 |
+
"global_step": 85,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 0.9956076134699854,
|
13 |
+
"eval_accuracy": 0.9597069597069597,
|
14 |
+
"eval_f1": 0.9599836188656065,
|
15 |
+
"eval_loss": 0.12706419825553894,
|
16 |
+
"eval_precision": 0.960694098126733,
|
17 |
+
"eval_recall": 0.9597069597069597,
|
18 |
+
"eval_runtime": 6.1839,
|
19 |
+
"eval_samples_per_second": 220.733,
|
20 |
+
"eval_steps_per_second": 27.652,
|
21 |
+
"step": 85
|
22 |
+
}
|
23 |
+
],
|
24 |
+
"logging_steps": 500,
|
25 |
+
"max_steps": 510,
|
26 |
+
"num_input_tokens_seen": 0,
|
27 |
+
"num_train_epochs": 6,
|
28 |
+
"save_steps": 500,
|
29 |
+
"stateful_callbacks": {
|
30 |
+
"EarlyStoppingCallback": {
|
31 |
+
"args": {
|
32 |
+
"early_stopping_patience": 3,
|
33 |
+
"early_stopping_threshold": 0.0
|
34 |
+
},
|
35 |
+
"attributes": {
|
36 |
+
"early_stopping_patience_counter": 0
|
37 |
+
}
|
38 |
+
},
|
39 |
+
"TrainerControl": {
|
40 |
+
"args": {
|
41 |
+
"should_epoch_stop": false,
|
42 |
+
"should_evaluate": false,
|
43 |
+
"should_log": false,
|
44 |
+
"should_save": true,
|
45 |
+
"should_training_stop": false
|
46 |
+
},
|
47 |
+
"attributes": {}
|
48 |
+
}
|
49 |
+
},
|
50 |
+
"total_flos": 1.241700759936e+16,
|
51 |
+
"train_batch_size": 8,
|
52 |
+
"trial_name": null,
|
53 |
+
"trial_params": null
|
54 |
+
}
|
distilhubert-finetuned-cry-detector/checkpoint-85/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0f29e363429f3041b65000237638d975c16df70ba592fd3c2ce610392338bd3
|
3 |
+
size 5240
|
distilhubert-finetuned-cry-detector/config.json
ADDED
@@ -0,0 +1,81 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "ntu-spml/distilhubert",
|
3 |
+
"activation_dropout": 0.1,
|
4 |
+
"apply_spec_augment": false,
|
5 |
+
"architectures": [
|
6 |
+
"HubertForSequenceClassification"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.1,
|
9 |
+
"bos_token_id": 1,
|
10 |
+
"classifier_proj_size": 256,
|
11 |
+
"conv_bias": false,
|
12 |
+
"conv_dim": [
|
13 |
+
512,
|
14 |
+
512,
|
15 |
+
512,
|
16 |
+
512,
|
17 |
+
512,
|
18 |
+
512,
|
19 |
+
512
|
20 |
+
],
|
21 |
+
"conv_kernel": [
|
22 |
+
10,
|
23 |
+
3,
|
24 |
+
3,
|
25 |
+
3,
|
26 |
+
3,
|
27 |
+
2,
|
28 |
+
2
|
29 |
+
],
|
30 |
+
"conv_stride": [
|
31 |
+
5,
|
32 |
+
2,
|
33 |
+
2,
|
34 |
+
2,
|
35 |
+
2,
|
36 |
+
2,
|
37 |
+
2
|
38 |
+
],
|
39 |
+
"ctc_loss_reduction": "sum",
|
40 |
+
"ctc_zero_infinity": false,
|
41 |
+
"do_stable_layer_norm": false,
|
42 |
+
"eos_token_id": 2,
|
43 |
+
"feat_extract_activation": "gelu",
|
44 |
+
"feat_extract_norm": "group",
|
45 |
+
"feat_proj_dropout": 0.0,
|
46 |
+
"feat_proj_layer_norm": false,
|
47 |
+
"final_dropout": 0.0,
|
48 |
+
"finetuning_task": "audio-classification",
|
49 |
+
"hidden_act": "gelu",
|
50 |
+
"hidden_dropout": 0.1,
|
51 |
+
"hidden_size": 768,
|
52 |
+
"id2label": {
|
53 |
+
"0": "crying",
|
54 |
+
"1": "no_crying"
|
55 |
+
},
|
56 |
+
"initializer_range": 0.02,
|
57 |
+
"intermediate_size": 3072,
|
58 |
+
"label2id": {
|
59 |
+
"crying": 0,
|
60 |
+
"no_crying": 1
|
61 |
+
},
|
62 |
+
"layer_norm_eps": 1e-05,
|
63 |
+
"layerdrop": 0.0,
|
64 |
+
"mask_feature_length": 10,
|
65 |
+
"mask_feature_min_masks": 0,
|
66 |
+
"mask_feature_prob": 0.0,
|
67 |
+
"mask_time_length": 10,
|
68 |
+
"mask_time_min_masks": 2,
|
69 |
+
"mask_time_prob": 0.05,
|
70 |
+
"model_type": "hubert",
|
71 |
+
"num_attention_heads": 12,
|
72 |
+
"num_conv_pos_embedding_groups": 16,
|
73 |
+
"num_conv_pos_embeddings": 128,
|
74 |
+
"num_feat_extract_layers": 7,
|
75 |
+
"num_hidden_layers": 2,
|
76 |
+
"pad_token_id": 0,
|
77 |
+
"torch_dtype": "float32",
|
78 |
+
"transformers_version": "4.44.2",
|
79 |
+
"use_weighted_layer_sum": false,
|
80 |
+
"vocab_size": 32
|
81 |
+
}
|
distilhubert-finetuned-cry-detector/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7944ecc75fe28e156d4c1967e013e12ebf361ba4a1e84d569b5656c10cbbf99f
|
3 |
+
size 94763496
|
distilhubert-finetuned-cry-detector/runs/Sep06_15-54-59_ubumarcos/events.out.tfevents.1725630900.ubumarcos
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1acef9821029fd1212d748efd26c746ef609728916bb04756b301a4027aed9d7
|
3 |
+
size 5850
|
distilhubert-finetuned-cry-detector/runs/Sep06_17-32-26_ubumarcos/events.out.tfevents.1725636747.ubumarcos
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89395943d8de67b3553472ad01aa836188c676359cc9b10e225dd488dbb1d7ac
|
3 |
+
size 9238
|
distilhubert-finetuned-cry-detector/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0f29e363429f3041b65000237638d975c16df70ba592fd3c2ce610392338bd3
|
3 |
+
size 5240
|
distilhubert-finetuned-mixed-data/checkpoint-121/config.json
ADDED
@@ -0,0 +1,85 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "ntu-spml/distilhubert",
|
3 |
+
"activation_dropout": 0.1,
|
4 |
+
"apply_spec_augment": false,
|
5 |
+
"architectures": [
|
6 |
+
"HubertForSequenceClassification"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.1,
|
9 |
+
"bos_token_id": 1,
|
10 |
+
"classifier_proj_size": 256,
|
11 |
+
"conv_bias": false,
|
12 |
+
"conv_dim": [
|
13 |
+
512,
|
14 |
+
512,
|
15 |
+
512,
|
16 |
+
512,
|
17 |
+
512,
|
18 |
+
512,
|
19 |
+
512
|
20 |
+
],
|
21 |
+
"conv_kernel": [
|
22 |
+
10,
|
23 |
+
3,
|
24 |
+
3,
|
25 |
+
3,
|
26 |
+
3,
|
27 |
+
2,
|
28 |
+
2
|
29 |
+
],
|
30 |
+
"conv_stride": [
|
31 |
+
5,
|
32 |
+
2,
|
33 |
+
2,
|
34 |
+
2,
|
35 |
+
2,
|
36 |
+
2,
|
37 |
+
2
|
38 |
+
],
|
39 |
+
"ctc_loss_reduction": "sum",
|
40 |
+
"ctc_zero_infinity": false,
|
41 |
+
"do_stable_layer_norm": false,
|
42 |
+
"eos_token_id": 2,
|
43 |
+
"feat_extract_activation": "gelu",
|
44 |
+
"feat_extract_norm": "group",
|
45 |
+
"feat_proj_dropout": 0.0,
|
46 |
+
"feat_proj_layer_norm": false,
|
47 |
+
"final_dropout": 0.0,
|
48 |
+
"finetuning_task": "audio-classification",
|
49 |
+
"hidden_act": "gelu",
|
50 |
+
"hidden_dropout": 0.1,
|
51 |
+
"hidden_size": 768,
|
52 |
+
"id2label": {
|
53 |
+
"0": "1s_normal",
|
54 |
+
"1": "1s_pain",
|
55 |
+
"2": "1s_hunger",
|
56 |
+
"3": "1s_asphyxia"
|
57 |
+
},
|
58 |
+
"initializer_range": 0.02,
|
59 |
+
"intermediate_size": 3072,
|
60 |
+
"label2id": {
|
61 |
+
"1s_asphyxia": 3,
|
62 |
+
"1s_hunger": 2,
|
63 |
+
"1s_normal": 0,
|
64 |
+
"1s_pain": 1
|
65 |
+
},
|
66 |
+
"layer_norm_eps": 1e-05,
|
67 |
+
"layerdrop": 0.0,
|
68 |
+
"mask_feature_length": 10,
|
69 |
+
"mask_feature_min_masks": 0,
|
70 |
+
"mask_feature_prob": 0.0,
|
71 |
+
"mask_time_length": 10,
|
72 |
+
"mask_time_min_masks": 2,
|
73 |
+
"mask_time_prob": 0.05,
|
74 |
+
"model_type": "hubert",
|
75 |
+
"num_attention_heads": 12,
|
76 |
+
"num_conv_pos_embedding_groups": 16,
|
77 |
+
"num_conv_pos_embeddings": 128,
|
78 |
+
"num_feat_extract_layers": 7,
|
79 |
+
"num_hidden_layers": 2,
|
80 |
+
"pad_token_id": 0,
|
81 |
+
"torch_dtype": "float32",
|
82 |
+
"transformers_version": "4.44.2",
|
83 |
+
"use_weighted_layer_sum": false,
|
84 |
+
"vocab_size": 32
|
85 |
+
}
|
distilhubert-finetuned-mixed-data/checkpoint-121/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:812ef836989997aee1750c6a31d13aded72b6dae0ab04fd01133347e51bda632
|
3 |
+
size 94765560
|