Marcos12886 committed on 20 days ago

Commit

5c2a1eb

•

1 Parent(s): ee61ac2

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

README.md +17 -20
checkpoint-170/config.json +80 -0
checkpoint-170/model.safetensors +3 -0
checkpoint-170/optimizer.pt +3 -0
checkpoint-170/preprocessor_config.json +9 -0
checkpoint-170/rng_state.pth +3 -0
checkpoint-170/scheduler.pt +3 -0
checkpoint-170/trainer_state.json +66 -0
checkpoint-170/training_args.bin +3 -0
checkpoint-255/config.json +80 -0
checkpoint-255/model.safetensors +3 -0
checkpoint-255/optimizer.pt +3 -0
checkpoint-255/preprocessor_config.json +9 -0
checkpoint-255/rng_state.pth +3 -0
checkpoint-255/scheduler.pt +3 -0
checkpoint-255/trainer_state.json +78 -0
checkpoint-255/training_args.bin +3 -0
checkpoint-256/config.json +80 -0
checkpoint-256/model.safetensors +3 -0
checkpoint-256/optimizer.pt +3 -0
checkpoint-256/preprocessor_config.json +9 -0
checkpoint-256/rng_state.pth +3 -0
checkpoint-256/scheduler.pt +3 -0
checkpoint-256/trainer_state.json +78 -0
checkpoint-256/training_args.bin +3 -0
checkpoint-341/config.json +80 -0
checkpoint-341/model.safetensors +3 -0
checkpoint-341/optimizer.pt +3 -0
checkpoint-341/preprocessor_config.json +9 -0
checkpoint-341/rng_state.pth +3 -0
checkpoint-341/scheduler.pt +3 -0
checkpoint-341/trainer_state.json +90 -0
checkpoint-341/training_args.bin +3 -0
checkpoint-426/config.json +80 -0
checkpoint-426/model.safetensors +3 -0
checkpoint-426/optimizer.pt +3 -0
checkpoint-426/preprocessor_config.json +9 -0
checkpoint-426/rng_state.pth +3 -0
checkpoint-426/scheduler.pt +3 -0
checkpoint-426/trainer_state.json +102 -0
checkpoint-426/training_args.bin +3 -0
checkpoint-512/config.json +80 -0
checkpoint-512/model.safetensors +3 -0
checkpoint-512/optimizer.pt +3 -0
checkpoint-512/preprocessor_config.json +9 -0
checkpoint-512/rng_state.pth +3 -0
checkpoint-512/scheduler.pt +3 -0
checkpoint-512/trainer_state.json +121 -0
checkpoint-512/training_args.bin +3 -0
checkpoint-595/config.json +80 -0

README.md CHANGED Viewed

@@ -26,16 +26,16 @@ model-index:
     metrics:
     - name: Accuracy
       type: accuracy
-      value: 0.9852941176470589
     - name: F1
       type: f1
-      value: 0.9853150765112866
     - name: Precision
       type: precision
-      value: 0.9853868369053048
     - name: Recall
       type: recall
-      value: 0.9852941176470589
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -45,11 +45,11 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on the audiofolder dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.0332
-- Accuracy: 0.9853
-- F1: 0.9853
-- Precision: 0.9854
-- Recall: 0.9853
 ## Model description
@@ -77,22 +77,19 @@ The following hyperparameters were used during training:
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - lr_scheduler_warmup_ratio: 0.001
-- num_epochs: 10
 ### Training results
 | Training Loss | Epoch  | Step | Validation Loss | Accuracy | F1     | Precision | Recall |
 |:-------------:|:------:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|
-| No log        | 0.9412 | 12   | 0.1931          | 0.9363   | 0.9365 | 0.9372    | 0.9363 |
-| No log        | 1.9608 | 25   | 0.0950          | 0.9706   | 0.9704 | 0.9710    | 0.9706 |
-| No log        | 2.9804 | 38   | 0.0611          | 0.9804   | 0.9804 | 0.9804    | 0.9804 |
-| No log        | 4.0    | 51   | 0.0492          | 0.9853   | 0.9853 | 0.9853    | 0.9853 |
-| No log        | 4.9412 | 63   | 0.0588          | 0.9804   | 0.9805 | 0.9814    | 0.9804 |
-| No log        | 5.9608 | 76   | 0.0368          | 0.9853   | 0.9853 | 0.9854    | 0.9853 |
-| No log        | 6.9804 | 89   | 0.0382          | 0.9902   | 0.9902 | 0.9903    | 0.9902 |
-| No log        | 8.0    | 102  | 0.0318          | 0.9951   | 0.9951 | 0.9951    | 0.9951 |
-| No log        | 8.9412 | 114  | 0.0331          | 0.9853   | 0.9853 | 0.9854    | 0.9853 |
-| No log        | 9.4118 | 120  | 0.0332          | 0.9853   | 0.9853 | 0.9854    | 0.9853 |
 ### Framework versions

     metrics:
     - name: Accuracy
       type: accuracy
+      value: 0.991941391941392
     - name: F1
       type: f1
+      value: 0.9919569277165429
     - name: Precision
       type: precision
+      value: 0.9920048531706146
     - name: Recall
       type: recall
+      value: 0.991941391941392
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on the audiofolder dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.0408
+- Accuracy: 0.9919
+- F1: 0.9920
+- Precision: 0.9920
+- Recall: 0.9919
 ## Model description
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - lr_scheduler_warmup_ratio: 0.001
+- num_epochs: 7
 ### Training results
 | Training Loss | Epoch  | Step | Validation Loss | Accuracy | F1     | Precision | Recall |
 |:-------------:|:------:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|
+| No log        | 0.9956 | 85   | 0.0736          | 0.9788   | 0.9788 | 0.9790    | 0.9788 |
+| No log        | 1.9912 | 170  | 0.0680          | 0.9758   | 0.9760 | 0.9770    | 0.9758 |
+| No log        | 2.9985 | 256  | 0.0447          | 0.9875   | 0.9876 | 0.9876    | 0.9875 |
+| No log        | 3.9941 | 341  | 0.0452          | 0.9905   | 0.9905 | 0.9905    | 0.9905 |
+| No log        | 4.9898 | 426  | 0.0439          | 0.9919   | 0.9920 | 0.9920    | 0.9919 |
+| 0.053         | 5.9971 | 512  | 0.0401          | 0.9919   | 0.9920 | 0.9920    | 0.9919 |
+| 0.053         | 6.9693 | 595  | 0.0408          | 0.9919   | 0.9920 | 0.9920    | 0.9919 |
 ### Framework versions

checkpoint-170/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-170/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:14ad2529c107706df5e38d4e839c5fe54bbd3638840f1b016ba56f9e40cfd45a
+size 94763496

checkpoint-170/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:feca43a53b1ea22e785cf6aebc67731d4d759491623447479b488904538b9c5d
+size 189552570

checkpoint-170/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-170/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:309f3425e8cb713e30160da01fdcf088ad760dfa7761c7bd73a907a4115b0ee0
+size 14308

checkpoint-170/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e9632dd1819b93de48e3bbe467fe0d96e895179dd60318df68d501d078c6ed9
+size 1064

checkpoint-170/trainer_state.json ADDED Viewed

	@@ -0,0 +1,66 @@

+{
+  "best_metric": 0.9787545787545787,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-85",
+  "epoch": 1.9912152269399708,
+  "eval_steps": 500,
+  "global_step": 170,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9956076134699854,
+      "eval_accuracy": 0.9787545787545787,
+      "eval_f1": 0.9788275754377449,
+      "eval_loss": 0.07363971322774887,
+      "eval_precision": 0.9790028856592324,
+      "eval_recall": 0.9787545787545787,
+      "eval_runtime": 4.1234,
+      "eval_samples_per_second": 331.041,
+      "eval_steps_per_second": 41.471,
+      "step": 85
+    },
+    {
+      "epoch": 1.9912152269399708,
+      "eval_accuracy": 0.9758241758241758,
+      "eval_f1": 0.9760458977669253,
+      "eval_loss": 0.0680176243185997,
+      "eval_precision": 0.9770364666252971,
+      "eval_recall": 0.9758241758241758,
+      "eval_runtime": 3.9805,
+      "eval_samples_per_second": 342.924,
+      "eval_steps_per_second": 42.96,
+      "step": 170
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 595,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 7,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2.483401519872e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-170/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:caa3df7f2810faa9c35a46d178b12337edb0b134aa27dc1689b302d9bcc9d3d0
+size 5240

checkpoint-255/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-255/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9f4d1bcece15f285a46eb855f203bd43924522bb36fe48d2d6c26990580d046d
+size 94763496

checkpoint-255/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:55c75ae0d01ca9c0fa93dadeceec95f962b2525037b69dc1a327f1b6c3c0ad59
+size 189552570

checkpoint-255/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-255/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:32bb7f9c3cdfdb4246f58a8319fd0b86a841985e3d321ecf44d228390d31634d
+size 14308

checkpoint-255/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7859ab68e5739b704ca9ce13610ef11b9b1125824d2905d10d4a9ea15d8739ea
+size 1064

checkpoint-255/trainer_state.json ADDED Viewed

	@@ -0,0 +1,78 @@

+{
+  "best_metric": 0.989010989010989,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-255",
+  "epoch": 2.986822840409956,
+  "eval_steps": 500,
+  "global_step": 255,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9956076134699854,
+      "eval_accuracy": 0.9758241758241758,
+      "eval_f1": 0.9759605689530879,
+      "eval_loss": 0.07685838639736176,
+      "eval_precision": 0.9763775351444481,
+      "eval_recall": 0.9758241758241758,
+      "eval_runtime": 3.9273,
+      "eval_samples_per_second": 347.571,
+      "eval_steps_per_second": 43.542,
+      "step": 85
+    },
+    {
+      "epoch": 1.9912152269399708,
+      "eval_accuracy": 0.9875457875457876,
+      "eval_f1": 0.9875697973801115,
+      "eval_loss": 0.04443557932972908,
+      "eval_precision": 0.9876259880187351,
+      "eval_recall": 0.9875457875457876,
+      "eval_runtime": 3.9441,
+      "eval_samples_per_second": 346.088,
+      "eval_steps_per_second": 43.356,
+      "step": 170
+    },
+    {
+      "epoch": 2.986822840409956,
+      "eval_accuracy": 0.989010989010989,
+      "eval_f1": 0.9890405015532383,
+      "eval_loss": 0.03978995233774185,
+      "eval_precision": 0.9891330367917903,
+      "eval_recall": 0.989010989010989,
+      "eval_runtime": 3.9868,
+      "eval_samples_per_second": 342.378,
+      "eval_steps_per_second": 42.891,
+      "step": 255
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 255,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 3.7096378747392e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-255/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:37edd9986d3659d5cfeb9aa8cfbe6429149a6cd74482bcfbbbae5877c8eae7df
+size 5240

checkpoint-256/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-256/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a88f787681237fee33b288f12593aacb934387bd6da2bb8ff790e9b5a05f9556
+size 94763496

checkpoint-256/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:346b3d592afd4162ca6d18904ccc574e4d170d2fe28c5c444a687f9850fd23b6
+size 189552570

checkpoint-256/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-256/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:681b1a6a4f0a991d47831ff66346aef2bdf16d4f5cc0b1dfbedc7d47e4c328a1
+size 14308

checkpoint-256/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:93dfa4ba2e0507f7a6d68626387a161a1bbe6b94f9a9daf967637af5f5748293
+size 1064

checkpoint-256/trainer_state.json ADDED Viewed

	@@ -0,0 +1,78 @@

+{
+  "best_metric": 0.9875457875457876,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-256",
+  "epoch": 2.998535871156662,
+  "eval_steps": 500,
+  "global_step": 256,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9956076134699854,
+      "eval_accuracy": 0.9787545787545787,
+      "eval_f1": 0.9788275754377449,
+      "eval_loss": 0.07363971322774887,
+      "eval_precision": 0.9790028856592324,
+      "eval_recall": 0.9787545787545787,
+      "eval_runtime": 4.1234,
+      "eval_samples_per_second": 331.041,
+      "eval_steps_per_second": 41.471,
+      "step": 85
+    },
+    {
+      "epoch": 1.9912152269399708,
+      "eval_accuracy": 0.9758241758241758,
+      "eval_f1": 0.9760458977669253,
+      "eval_loss": 0.0680176243185997,
+      "eval_precision": 0.9770364666252971,
+      "eval_recall": 0.9758241758241758,
+      "eval_runtime": 3.9805,
+      "eval_samples_per_second": 342.924,
+      "eval_steps_per_second": 42.96,
+      "step": 170
+    },
+    {
+      "epoch": 2.998535871156662,
+      "eval_accuracy": 0.9875457875457876,
+      "eval_f1": 0.987550637300988,
+      "eval_loss": 0.044689420610666275,
+      "eval_precision": 0.9875567820840008,
+      "eval_recall": 0.9875457875457876,
+      "eval_runtime": 4.1011,
+      "eval_samples_per_second": 332.839,
+      "eval_steps_per_second": 41.696,
+      "step": 256
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 595,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 7,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 3.725102279808e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-256/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:caa3df7f2810faa9c35a46d178b12337edb0b134aa27dc1689b302d9bcc9d3d0
+size 5240

checkpoint-341/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-341/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d274d762a507f6e75c1d2a58abb70f2a03423ada1370bde55f03f89babb022da
+size 94763496

checkpoint-341/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ab5a9612889baf3497db6846ceb8c24a7fa052bc1a8f788d7b5b366a70c8d5b9
+size 189552570

checkpoint-341/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-341/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8c14b301b5ea3ffdd05cbe8ff85a0d16fa4c4467786db8506b5bdcb5af8a9a2d
+size 14308

checkpoint-341/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:db61ebcfff67389442b8098d4cae839f684a87068fe21401504beb7ddd27d04d
+size 1064

checkpoint-341/trainer_state.json ADDED Viewed

	@@ -0,0 +1,90 @@

+{
+  "best_metric": 0.9904761904761905,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341",
+  "epoch": 3.994143484626647,
+  "eval_steps": 500,
+  "global_step": 341,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9956076134699854,
+      "eval_accuracy": 0.9787545787545787,
+      "eval_f1": 0.9788275754377449,
+      "eval_loss": 0.07363971322774887,
+      "eval_precision": 0.9790028856592324,
+      "eval_recall": 0.9787545787545787,
+      "eval_runtime": 4.1234,
+      "eval_samples_per_second": 331.041,
+      "eval_steps_per_second": 41.471,
+      "step": 85
+    },
+    {
+      "epoch": 1.9912152269399708,
+      "eval_accuracy": 0.9758241758241758,
+      "eval_f1": 0.9760458977669253,
+      "eval_loss": 0.0680176243185997,
+      "eval_precision": 0.9770364666252971,
+      "eval_recall": 0.9758241758241758,
+      "eval_runtime": 3.9805,
+      "eval_samples_per_second": 342.924,
+      "eval_steps_per_second": 42.96,
+      "step": 170
+    },
+    {
+      "epoch": 2.998535871156662,
+      "eval_accuracy": 0.9875457875457876,
+      "eval_f1": 0.987550637300988,
+      "eval_loss": 0.044689420610666275,
+      "eval_precision": 0.9875567820840008,
+      "eval_recall": 0.9875457875457876,
+      "eval_runtime": 4.1011,
+      "eval_samples_per_second": 332.839,
+      "eval_steps_per_second": 41.696,
+      "step": 256
+    },
+    {
+      "epoch": 3.994143484626647,
+      "eval_accuracy": 0.9904761904761905,
+      "eval_f1": 0.9904945509377323,
+      "eval_loss": 0.045228052884340286,
+      "eval_precision": 0.9905452314533213,
+      "eval_recall": 0.9904761904761905,
+      "eval_runtime": 3.9393,
+      "eval_samples_per_second": 346.509,
+      "eval_steps_per_second": 43.409,
+      "step": 341
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 595,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 7,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 4.966803039744e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-341/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:caa3df7f2810faa9c35a46d178b12337edb0b134aa27dc1689b302d9bcc9d3d0
+size 5240

checkpoint-426/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-426/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:94760f7df9dc2c6bad702593ec0871720fa6ae352e88f79c71bcfccc8fab1a09
+size 94763496

checkpoint-426/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b6550e976738f22f913650571284f8eb12dea30c8877134bbe84a1ebd7a73b5e
+size 189552570

checkpoint-426/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-426/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c2a1aad7f62f9d383e6bd694b87da317b54d942be2b578a455bcdaaf3258d46a
+size 14308

checkpoint-426/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1894ac3a34350cc065802675cae4d32438918a7d772edc033390240aaf5d8841
+size 1064

checkpoint-426/trainer_state.json ADDED Viewed

	@@ -0,0 +1,102 @@

+{
+  "best_metric": 0.991941391941392,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-426",
+  "epoch": 4.989751098096632,
+  "eval_steps": 500,
+  "global_step": 426,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9956076134699854,
+      "eval_accuracy": 0.9787545787545787,
+      "eval_f1": 0.9788275754377449,
+      "eval_loss": 0.07363971322774887,
+      "eval_precision": 0.9790028856592324,
+      "eval_recall": 0.9787545787545787,
+      "eval_runtime": 4.1234,
+      "eval_samples_per_second": 331.041,
+      "eval_steps_per_second": 41.471,
+      "step": 85
+    },
+    {
+      "epoch": 1.9912152269399708,
+      "eval_accuracy": 0.9758241758241758,
+      "eval_f1": 0.9760458977669253,
+      "eval_loss": 0.0680176243185997,
+      "eval_precision": 0.9770364666252971,
+      "eval_recall": 0.9758241758241758,
+      "eval_runtime": 3.9805,
+      "eval_samples_per_second": 342.924,
+      "eval_steps_per_second": 42.96,
+      "step": 170
+    },
+    {
+      "epoch": 2.998535871156662,
+      "eval_accuracy": 0.9875457875457876,
+      "eval_f1": 0.987550637300988,
+      "eval_loss": 0.044689420610666275,
+      "eval_precision": 0.9875567820840008,
+      "eval_recall": 0.9875457875457876,
+      "eval_runtime": 4.1011,
+      "eval_samples_per_second": 332.839,
+      "eval_steps_per_second": 41.696,
+      "step": 256
+    },
+    {
+      "epoch": 3.994143484626647,
+      "eval_accuracy": 0.9904761904761905,
+      "eval_f1": 0.9904945509377323,
+      "eval_loss": 0.045228052884340286,
+      "eval_precision": 0.9905452314533213,
+      "eval_recall": 0.9904761904761905,
+      "eval_runtime": 3.9393,
+      "eval_samples_per_second": 346.509,
+      "eval_steps_per_second": 43.409,
+      "step": 341
+    },
+    {
+      "epoch": 4.989751098096632,
+      "eval_accuracy": 0.991941391941392,
+      "eval_f1": 0.9919569277165429,
+      "eval_loss": 0.04387320205569267,
+      "eval_precision": 0.9920048531706146,
+      "eval_recall": 0.991941391941392,
+      "eval_runtime": 4.0115,
+      "eval_samples_per_second": 340.268,
+      "eval_steps_per_second": 42.627,
+      "step": 426
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 595,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 7,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 6.20850379968e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-426/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:caa3df7f2810faa9c35a46d178b12337edb0b134aa27dc1689b302d9bcc9d3d0
+size 5240

checkpoint-512/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-512/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6beddb5fef4d20200cfcf763c9460267deb7ad4514b1fa760fa4f89d398502cf
+size 94763496

checkpoint-512/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2cfb7299eb13d9980cb44dcbfcf90cc3e4a95d2c84fd840b959005ca0b7566d6
+size 189552570

checkpoint-512/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-512/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:863dd8c5b813736d29c00a5bac8fd9a20f38b88a7fb576cceea0cc85f0cbd789
+size 14308

checkpoint-512/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7900f26d6583fa63e5c081f39e0457bc3033e9e087a3f2085f881f9fac700fb3
+size 1064

checkpoint-512/trainer_state.json ADDED Viewed

	@@ -0,0 +1,121 @@

+{
+  "best_metric": 0.991941391941392,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-426",
+  "epoch": 5.997071742313324,
+  "eval_steps": 500,
+  "global_step": 512,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9956076134699854,
+      "eval_accuracy": 0.9787545787545787,
+      "eval_f1": 0.9788275754377449,
+      "eval_loss": 0.07363971322774887,
+      "eval_precision": 0.9790028856592324,
+      "eval_recall": 0.9787545787545787,
+      "eval_runtime": 4.1234,
+      "eval_samples_per_second": 331.041,
+      "eval_steps_per_second": 41.471,
+      "step": 85
+    },
+    {
+      "epoch": 1.9912152269399708,
+      "eval_accuracy": 0.9758241758241758,
+      "eval_f1": 0.9760458977669253,
+      "eval_loss": 0.0680176243185997,
+      "eval_precision": 0.9770364666252971,
+      "eval_recall": 0.9758241758241758,
+      "eval_runtime": 3.9805,
+      "eval_samples_per_second": 342.924,
+      "eval_steps_per_second": 42.96,
+      "step": 170
+    },
+    {
+      "epoch": 2.998535871156662,
+      "eval_accuracy": 0.9875457875457876,
+      "eval_f1": 0.987550637300988,
+      "eval_loss": 0.044689420610666275,
+      "eval_precision": 0.9875567820840008,
+      "eval_recall": 0.9875457875457876,
+      "eval_runtime": 4.1011,
+      "eval_samples_per_second": 332.839,
+      "eval_steps_per_second": 41.696,
+      "step": 256
+    },
+    {
+      "epoch": 3.994143484626647,
+      "eval_accuracy": 0.9904761904761905,
+      "eval_f1": 0.9904945509377323,
+      "eval_loss": 0.045228052884340286,
+      "eval_precision": 0.9905452314533213,
+      "eval_recall": 0.9904761904761905,
+      "eval_runtime": 3.9393,
+      "eval_samples_per_second": 346.509,
+      "eval_steps_per_second": 43.409,
+      "step": 341
+    },
+    {
+      "epoch": 4.989751098096632,
+      "eval_accuracy": 0.991941391941392,
+      "eval_f1": 0.9919569277165429,
+      "eval_loss": 0.04387320205569267,
+      "eval_precision": 0.9920048531706146,
+      "eval_recall": 0.991941391941392,
+      "eval_runtime": 4.0115,
+      "eval_samples_per_second": 340.268,
+      "eval_steps_per_second": 42.627,
+      "step": 426
+    },
+    {
+      "epoch": 5.856515373352855,
+      "grad_norm": 0.01621050015091896,
+      "learning_rate": 6.1795711069424666e-06,
+      "loss": 0.053,
+      "step": 500
+    },
+    {
+      "epoch": 5.997071742313324,
+      "eval_accuracy": 0.991941391941392,
+      "eval_f1": 0.9919507596926951,
+      "eval_loss": 0.04010434448719025,
+      "eval_precision": 0.991971823048746,
+      "eval_recall": 0.991941391941392,
+      "eval_runtime": 4.1768,
+      "eval_samples_per_second": 326.803,
+      "eval_steps_per_second": 40.94,
+      "step": 512
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 595,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 7,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 7.450204559616e+16,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-512/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:caa3df7f2810faa9c35a46d178b12337edb0b134aa27dc1689b302d9bcc9d3d0
+size 5240

checkpoint-595/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}