Marcos12886 committed on Sep 1

Commit

925fa09

•

1 Parent(s): 6e73b9f

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

README.md +61 -3
checkpoint-11/config.json +80 -0
checkpoint-11/model.safetensors +3 -0
checkpoint-11/optimizer.pt +3 -0
checkpoint-11/preprocessor_config.json +9 -0
checkpoint-11/rng_state.pth +3 -0
checkpoint-11/scheduler.pt +3 -0
checkpoint-11/trainer_state.json +54 -0
checkpoint-11/training_args.bin +3 -0
checkpoint-12/config.json +80 -0
checkpoint-12/model.safetensors +3 -0
checkpoint-12/optimizer.pt +3 -0
checkpoint-12/preprocessor_config.json +9 -0
checkpoint-12/rng_state.pth +3 -0
checkpoint-12/scheduler.pt +3 -0
checkpoint-12/trainer_state.json +54 -0
checkpoint-12/training_args.bin +3 -0
checkpoint-23/config.json +80 -0
checkpoint-23/model.safetensors +3 -0
checkpoint-23/optimizer.pt +3 -0
checkpoint-23/preprocessor_config.json +9 -0
checkpoint-23/rng_state.pth +3 -0
checkpoint-23/scheduler.pt +3 -0
checkpoint-23/trainer_state.json +66 -0
checkpoint-23/training_args.bin +3 -0
checkpoint-25/config.json +80 -0
checkpoint-25/model.safetensors +3 -0
checkpoint-25/optimizer.pt +3 -0
checkpoint-25/preprocessor_config.json +9 -0
checkpoint-25/rng_state.pth +3 -0
checkpoint-25/scheduler.pt +3 -0
checkpoint-25/trainer_state.json +66 -0
checkpoint-25/training_args.bin +3 -0
checkpoint-35/config.json +80 -0
checkpoint-35/model.safetensors +3 -0
checkpoint-35/optimizer.pt +3 -0
checkpoint-35/preprocessor_config.json +9 -0
checkpoint-35/rng_state.pth +3 -0
checkpoint-35/scheduler.pt +3 -0
checkpoint-35/trainer_state.json +78 -0
checkpoint-35/training_args.bin +3 -0
checkpoint-38/config.json +80 -0
checkpoint-38/model.safetensors +3 -0
checkpoint-38/optimizer.pt +3 -0
checkpoint-38/preprocessor_config.json +9 -0
checkpoint-38/rng_state.pth +3 -0
checkpoint-38/scheduler.pt +3 -0
checkpoint-38/trainer_state.json +78 -0
checkpoint-38/training_args.bin +3 -0
checkpoint-47/config.json +80 -0

README.md CHANGED Viewed

@@ -1,3 +1,61 @@
----
-license: apache-2.0
----

+---
+library_name: transformers
+license: apache-2.0
+base_model: ntu-spml/distilhubert
+tags:
+- generated_from_trainer
+datasets:
+- audiofolder
+model-index:
+- name: distilhubert-finetuned-cry-detector
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# distilhubert-finetuned-cry-detector
+This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on the audiofolder dataset.
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 0.0001
+- train_batch_size: 8
+- eval_batch_size: 8
+- seed: 42
+- gradient_accumulation_steps: 8
+- total_train_batch_size: 64
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: cosine
+- lr_scheduler_warmup_ratio: 0.001
+- num_epochs: 1
+### Training results
+| Training Loss | Epoch  | Step | Validation Loss | Accuracy | F1     | Precision | Recall |
+|:-------------:|:------:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|
+| No log        | 0.9412 | 12   | 0.3494          | 0.9559   | 0.9555 | 0.9564    | 0.9559 |
+### Framework versions
+- Transformers 4.44.2
+- Pytorch 2.4.0+cu121
+- Datasets 2.21.0
+- Tokenizers 0.19.1

checkpoint-11/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-11/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:587ded30bd6f5b2016dddc435305926663e21b45f69b6624b780f4463d828358
+size 94763496

checkpoint-11/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:75ac2969c72bfbf4d666e562f2cf544a17e201d5d9ab77d34a6a987ad3b8a166
+size 189552570

checkpoint-11/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-11/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3ed664212b7cd99a57c71d748ab059acd10207cf6e9c571c8704e3e414764217
+size 14244

checkpoint-11/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f6491db7666ee7abd7f00b7daf389f37f42623e77d2190d7cedb399d4309fda5
+size 1064

checkpoint-11/trainer_state.json ADDED Viewed

	@@ -0,0 +1,54 @@

+{
+  "best_metric": 0.9411764705882353,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-11",
+  "epoch": 0.9361702127659575,
+  "eval_steps": 500,
+  "global_step": 11,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9361702127659575,
+      "eval_accuracy": 0.9411764705882353,
+      "eval_f1": 0.9415646417647925,
+      "eval_loss": 0.2156958132982254,
+      "eval_precision": 0.9446294240966827,
+      "eval_recall": 0.9411764705882353,
+      "eval_runtime": 3.0828,
+      "eval_samples_per_second": 60.66,
+      "eval_steps_per_second": 7.785,
+      "step": 11
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 55,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.1981257051356672e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-11/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba58ce355cad2f4a942fe159c5c029d2f1af4a92781bdfa4ca805848d823376f
+size 5240

checkpoint-12/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-12/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3667c942b60fb4aaa6da75bdc8c45dda9b2120a968bd96844eff1c2eeb6569d6
+size 94763496

checkpoint-12/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aaaabc411e12db72e6080d520aaf489915b57b63ecf13116359246428ab28a0d
+size 189552570

checkpoint-12/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-12/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4e214e6365eb6a4284a4e8e647133f419a1798d93f9dd2f8d941c02dcdc8922a
+size 14244

checkpoint-12/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:00ac470d61d5b4613444f686474fe5bf71dbe645a07555e3c0011199a78b17ab
+size 1064

checkpoint-12/trainer_state.json ADDED Viewed

	@@ -0,0 +1,54 @@

+{
+  "best_metric": 0.9558823529411765,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-12",
+  "epoch": 0.9411764705882353,
+  "eval_steps": 500,
+  "global_step": 12,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9411764705882353,
+      "eval_accuracy": 0.9558823529411765,
+      "eval_f1": 0.9555272696227192,
+      "eval_loss": 0.3494149148464203,
+      "eval_precision": 0.9564428025638596,
+      "eval_recall": 0.9558823529411765,
+      "eval_runtime": 2.8857,
+      "eval_samples_per_second": 70.694,
+      "eval_steps_per_second": 9.01,
+      "step": 12
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 12,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.2382512879347712e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-12/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3105fda5f2c454de8afa76f767893fbe3ebf0bc8395507bd768109ec948f149d
+size 5240

checkpoint-23/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-23/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:abcb331765a018ac29ea85db630ddaf1074010344d78be5475cd1aad2e9d9cc2
+size 94763496

checkpoint-23/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:869c3a62cf0034a6126c18ad904e2e7854bbb38aef9b494fa53842ef1e414046
+size 189552570

checkpoint-23/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-23/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3e5afa942f0cac1d664ff6ebdf17eca5a923a087ce434e17a231d65b71899089
+size 14244

checkpoint-23/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:747167933fffcfb0c95ca8e0a62d67e7d36cf718d4a70e795658ad992dc31698
+size 1064

checkpoint-23/trainer_state.json ADDED Viewed

	@@ -0,0 +1,66 @@

+{
+  "best_metric": 0.9572192513368984,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-23",
+  "epoch": 1.9574468085106385,
+  "eval_steps": 500,
+  "global_step": 23,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9361702127659575,
+      "eval_accuracy": 0.9411764705882353,
+      "eval_f1": 0.9415646417647925,
+      "eval_loss": 0.2156958132982254,
+      "eval_precision": 0.9446294240966827,
+      "eval_recall": 0.9411764705882353,
+      "eval_runtime": 3.0828,
+      "eval_samples_per_second": 60.66,
+      "eval_steps_per_second": 7.785,
+      "step": 11
+    },
+    {
+      "epoch": 1.9574468085106385,
+      "eval_accuracy": 0.9572192513368984,
+      "eval_f1": 0.9573134708428827,
+      "eval_loss": 0.12373537570238113,
+      "eval_precision": 0.9576338229589004,
+      "eval_recall": 0.9572192513368984,
+      "eval_runtime": 2.9612,
+      "eval_samples_per_second": 63.15,
+      "eval_steps_per_second": 8.105,
+      "step": 23
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 55,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.3947368082454784e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-23/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba58ce355cad2f4a942fe159c5c029d2f1af4a92781bdfa4ca805848d823376f
+size 5240

checkpoint-25/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-25/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:457aaf1ca73f2bd8fdf652ff897b1db85473a23401cdea192ccda04c31e902f9
+size 94763496

checkpoint-25/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0f78eeb88abcee76fe1f3cb427847a3366d60d465ad4933bdf631baef11c677d
+size 189552570

checkpoint-25/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-25/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e5c954d42fa0d2b945cf8a644f5bb95c0ecae8f78ef6f89815808920b5b330c
+size 14244

checkpoint-25/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91532783b102a4c8ff5ee86df37d3662ca7a62e198729a349c132e2c9a68d5d0
+size 1064

checkpoint-25/trainer_state.json ADDED Viewed

	@@ -0,0 +1,66 @@

+{
+  "best_metric": 0.9558823529411765,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-25",
+  "epoch": 1.9607843137254903,
+  "eval_steps": 500,
+  "global_step": 25,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9411764705882353,
+      "eval_accuracy": 0.9509803921568627,
+      "eval_f1": 0.9509803921568627,
+      "eval_loss": 0.19337645173072815,
+      "eval_precision": 0.9509803921568627,
+      "eval_recall": 0.9509803921568627,
+      "eval_runtime": 2.9937,
+      "eval_samples_per_second": 68.144,
+      "eval_steps_per_second": 8.685,
+      "step": 12
+    },
+    {
+      "epoch": 1.9607843137254903,
+      "eval_accuracy": 0.9558823529411765,
+      "eval_f1": 0.9558168094824137,
+      "eval_loss": 0.11207430809736252,
+      "eval_precision": 0.9558008500901145,
+      "eval_recall": 0.9558823529411765,
+      "eval_runtime": 2.9789,
+      "eval_samples_per_second": 68.481,
+      "eval_steps_per_second": 8.728,
+      "step": 25
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 48,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.632285534507315e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-25/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b08c1ef2199623b781e926f1d827964186fca47326620731302bfe37c5d058b9
+size 5240

checkpoint-35/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-35/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:45ac590ecbfe521110ab81f16af790aa2a6f1cb4ab70317973e13165d0709582
+size 94763496

checkpoint-35/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5616c1cbc4a632a4500d7065ca4131e413c67941e4f867d528e017d8f4114178
+size 189552570

checkpoint-35/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-35/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f40c7263da12c8166f64ce9b0988018ca7ba311284f65e80ebcaa3856ca7de3f
+size 14244

checkpoint-35/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:928490201c93ddf3bddd80ff74fac96f745a82dfb6404304be920725c0a03457
+size 1064

checkpoint-35/trainer_state.json ADDED Viewed

	@@ -0,0 +1,78 @@

+{
+  "best_metric": 0.9572192513368984,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-23",
+  "epoch": 2.978723404255319,
+  "eval_steps": 500,
+  "global_step": 35,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9361702127659575,
+      "eval_accuracy": 0.9411764705882353,
+      "eval_f1": 0.9415646417647925,
+      "eval_loss": 0.2156958132982254,
+      "eval_precision": 0.9446294240966827,
+      "eval_recall": 0.9411764705882353,
+      "eval_runtime": 3.0828,
+      "eval_samples_per_second": 60.66,
+      "eval_steps_per_second": 7.785,
+      "step": 11
+    },
+    {
+      "epoch": 1.9574468085106385,
+      "eval_accuracy": 0.9572192513368984,
+      "eval_f1": 0.9573134708428827,
+      "eval_loss": 0.12373537570238113,
+      "eval_precision": 0.9576338229589004,
+      "eval_recall": 0.9572192513368984,
+      "eval_runtime": 2.9612,
+      "eval_samples_per_second": 63.15,
+      "eval_steps_per_second": 8.105,
+      "step": 23
+    },
+    {
+      "epoch": 2.978723404255319,
+      "eval_accuracy": 0.9518716577540107,
+      "eval_f1": 0.9521892523530119,
+      "eval_loss": 0.1370447278022766,
+      "eval_precision": 0.9552156165178733,
+      "eval_recall": 0.9518716577540107,
+      "eval_runtime": 2.9378,
+      "eval_samples_per_second": 63.653,
+      "eval_steps_per_second": 8.169,
+      "step": 35
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 55,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 3.5925100159126656e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-35/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba58ce355cad2f4a942fe159c5c029d2f1af4a92781bdfa4ca805848d823376f
+size 5240

checkpoint-38/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-38/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:365a9fb794f55008ff39b21086b11700c109a194efb2127a6db2145604a614b6
+size 94763496

checkpoint-38/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:198372300c7cb71ea5cd197e4b8f17970da74cfc971f4a284751e8c5c2fe5397
+size 189552570

checkpoint-38/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-38/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:780c51c50482e6e8f628b4687957abc3bb4ff7f96b977c02d8538cf6f0d2d494
+size 14244

checkpoint-38/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:96ddec5715a7e2a3cc7175b7f159a7e1fd2303094015b4bffdae6a236e889974
+size 1064

checkpoint-38/trainer_state.json ADDED Viewed

	@@ -0,0 +1,78 @@

+{
+  "best_metric": 0.9607843137254902,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-38",
+  "epoch": 2.980392156862745,
+  "eval_steps": 500,
+  "global_step": 38,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9411764705882353,
+      "eval_accuracy": 0.9509803921568627,
+      "eval_f1": 0.9509803921568627,
+      "eval_loss": 0.19337645173072815,
+      "eval_precision": 0.9509803921568627,
+      "eval_recall": 0.9509803921568627,
+      "eval_runtime": 2.9937,
+      "eval_samples_per_second": 68.144,
+      "eval_steps_per_second": 8.685,
+      "step": 12
+    },
+    {
+      "epoch": 1.9607843137254903,
+      "eval_accuracy": 0.9558823529411765,
+      "eval_f1": 0.9558168094824137,
+      "eval_loss": 0.11207430809736252,
+      "eval_precision": 0.9558008500901145,
+      "eval_recall": 0.9558823529411765,
+      "eval_runtime": 2.9789,
+      "eval_samples_per_second": 68.481,
+      "eval_steps_per_second": 8.728,
+      "step": 25
+    },
+    {
+      "epoch": 2.980392156862745,
+      "eval_accuracy": 0.9607843137254902,
+      "eval_f1": 0.9608937528499771,
+      "eval_loss": 0.08983828127384186,
+      "eval_precision": 0.9611995291537668,
+      "eval_recall": 0.9607843137254902,
+      "eval_runtime": 2.927,
+      "eval_samples_per_second": 69.695,
+      "eval_steps_per_second": 8.883,
+      "step": 38
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 48,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 3.947040143988326e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-38/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b08c1ef2199623b781e926f1d827964186fca47326620731302bfe37c5d058b9
+size 5240

checkpoint-47/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}