Marcos12886 commited on 21 days ago

Commit

ee61ac2

•

1 Parent(s): 119c958

Upload folder using huggingface_hub

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

README.md +45 -3
checkpoint-102/config.json +80 -0
checkpoint-102/model.safetensors +3 -0
checkpoint-102/optimizer.pt +3 -0
checkpoint-102/preprocessor_config.json +9 -0
checkpoint-102/rng_state.pth +3 -0
checkpoint-102/scheduler.pt +3 -0
checkpoint-102/trainer_state.json +138 -0
checkpoint-102/training_args.bin +3 -0
checkpoint-114/config.json +80 -0
checkpoint-114/model.safetensors +3 -0
checkpoint-114/optimizer.pt +3 -0
checkpoint-114/preprocessor_config.json +9 -0
checkpoint-114/rng_state.pth +3 -0
checkpoint-114/scheduler.pt +3 -0
checkpoint-114/trainer_state.json +150 -0
checkpoint-114/training_args.bin +3 -0
checkpoint-12/model.safetensors +1 -1
checkpoint-12/optimizer.pt +1 -1
checkpoint-12/rng_state.pth +1 -1
checkpoint-12/scheduler.pt +1 -1
checkpoint-12/trainer_state.json +13 -13
checkpoint-12/training_args.bin +1 -1
checkpoint-120/config.json +80 -0
checkpoint-120/model.safetensors +3 -0
checkpoint-120/optimizer.pt +3 -0
checkpoint-120/preprocessor_config.json +9 -0
checkpoint-120/rng_state.pth +3 -0
checkpoint-120/scheduler.pt +3 -0
checkpoint-120/trainer_state.json +162 -0
checkpoint-120/training_args.bin +3 -0
checkpoint-25/model.safetensors +1 -1
checkpoint-25/optimizer.pt +1 -1
checkpoint-25/rng_state.pth +2 -2
checkpoint-25/scheduler.pt +1 -1
checkpoint-25/trainer_state.json +20 -20
checkpoint-25/training_args.bin +1 -1
checkpoint-38/model.safetensors +1 -1
checkpoint-38/optimizer.pt +1 -1
checkpoint-38/rng_state.pth +2 -2
checkpoint-38/scheduler.pt +1 -1
checkpoint-38/trainer_state.json +28 -28
checkpoint-38/training_args.bin +1 -1
checkpoint-51/model.safetensors +1 -1
checkpoint-51/optimizer.pt +1 -1
checkpoint-51/rng_state.pth +2 -2
checkpoint-51/scheduler.pt +1 -1
checkpoint-51/trainer_state.json +36 -36
checkpoint-51/training_args.bin +1 -1
checkpoint-63/model.safetensors +1 -1

README.md CHANGED Viewed

@@ -6,9 +6,36 @@ tags:
 - generated_from_trainer
 datasets:
 - audiofolder
 model-index:
 - name: distilhubert-finetuned-cry-detector
-  results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -17,6 +44,12 @@ should probably proofread and complete it, then remove this comment. -->
 # distilhubert-finetuned-cry-detector
 This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on the audiofolder dataset.
 ## Model description
@@ -44,13 +77,22 @@ The following hyperparameters were used during training:
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - lr_scheduler_warmup_ratio: 0.001
-- num_epochs: 1
 ### Training results
 | Training Loss | Epoch  | Step | Validation Loss | Accuracy | F1     | Precision | Recall |
 |:-------------:|:------:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|
-| No log        | 0.9412 | 12   | 0.3379          | 0.9559   | 0.9555 | 0.9564    | 0.9559 |
 ### Framework versions

 - generated_from_trainer
 datasets:
 - audiofolder
+metrics:
+- accuracy
+- f1
+- precision
+- recall
 model-index:
 - name: distilhubert-finetuned-cry-detector
+  results:
+  - task:
+      name: Audio Classification
+      type: audio-classification
+    dataset:
+      name: audiofolder
+      type: audiofolder
+      config: default
+      split: train
+      args: default
+    metrics:
+    - name: Accuracy
+      type: accuracy
+      value: 0.9852941176470589
+    - name: F1
+      type: f1
+      value: 0.9853150765112866
+    - name: Precision
+      type: precision
+      value: 0.9853868369053048
+    - name: Recall
+      type: recall
+      value: 0.9852941176470589
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 # distilhubert-finetuned-cry-detector
 This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on the audiofolder dataset.
+It achieves the following results on the evaluation set:
+- Loss: 0.0332
+- Accuracy: 0.9853
+- F1: 0.9853
+- Precision: 0.9854
+- Recall: 0.9853
 ## Model description
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: cosine
 - lr_scheduler_warmup_ratio: 0.001
+- num_epochs: 10
 ### Training results
 | Training Loss | Epoch  | Step | Validation Loss | Accuracy | F1     | Precision | Recall |
 |:-------------:|:------:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|
+| No log        | 0.9412 | 12   | 0.1931          | 0.9363   | 0.9365 | 0.9372    | 0.9363 |
+| No log        | 1.9608 | 25   | 0.0950          | 0.9706   | 0.9704 | 0.9710    | 0.9706 |
+| No log        | 2.9804 | 38   | 0.0611          | 0.9804   | 0.9804 | 0.9804    | 0.9804 |
+| No log        | 4.0    | 51   | 0.0492          | 0.9853   | 0.9853 | 0.9853    | 0.9853 |
+| No log        | 4.9412 | 63   | 0.0588          | 0.9804   | 0.9805 | 0.9814    | 0.9804 |
+| No log        | 5.9608 | 76   | 0.0368          | 0.9853   | 0.9853 | 0.9854    | 0.9853 |
+| No log        | 6.9804 | 89   | 0.0382          | 0.9902   | 0.9902 | 0.9903    | 0.9902 |
+| No log        | 8.0    | 102  | 0.0318          | 0.9951   | 0.9951 | 0.9951    | 0.9951 |
+| No log        | 8.9412 | 114  | 0.0331          | 0.9853   | 0.9853 | 0.9854    | 0.9853 |
+| No log        | 9.4118 | 120  | 0.0332          | 0.9853   | 0.9853 | 0.9854    | 0.9853 |
 ### Framework versions

checkpoint-102/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-102/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:098c90d2cba195ac20033090c5954f7ef596abcdeebba724cb1365151033b05e
+size 94763496

checkpoint-102/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6038d1ad5c694fa39b163e31b2ae8b290c47bf72179e6f7edebc2516088a6742
+size 189552570

checkpoint-102/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-102/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e516bd48eedd1efdcdab1bc63eb245ee5f25372c9b0345efbc5ed2cd8b1b542
+size 14308

checkpoint-102/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2b0f7d0de8839ca69a8acf7eae5d4a6ab5235d97ffbdfee2586222c3a1d5f473
+size 1064

checkpoint-102/trainer_state.json ADDED Viewed

	@@ -0,0 +1,138 @@

+{
+  "best_metric": 0.9950980392156863,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-102",
+  "epoch": 8.0,
+  "eval_steps": 500,
+  "global_step": 102,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9411764705882353,
+      "eval_accuracy": 0.9362745098039216,
+      "eval_f1": 0.9365356058160116,
+      "eval_loss": 0.19313116371631622,
+      "eval_precision": 0.9372234219385678,
+      "eval_recall": 0.9362745098039216,
+      "eval_runtime": 3.0986,
+      "eval_samples_per_second": 65.836,
+      "eval_steps_per_second": 8.391,
+      "step": 12
+    },
+    {
+      "epoch": 1.9607843137254903,
+      "eval_accuracy": 0.9705882352941176,
+      "eval_f1": 0.9704025549613785,
+      "eval_loss": 0.09495726972818375,
+      "eval_precision": 0.971039759187257,
+      "eval_recall": 0.9705882352941176,
+      "eval_runtime": 3.1171,
+      "eval_samples_per_second": 65.446,
+      "eval_steps_per_second": 8.341,
+      "step": 25
+    },
+    {
+      "epoch": 2.980392156862745,
+      "eval_accuracy": 0.9803921568627451,
+      "eval_f1": 0.9803921568627451,
+      "eval_loss": 0.06114682927727699,
+      "eval_precision": 0.9803921568627451,
+      "eval_recall": 0.9803921568627451,
+      "eval_runtime": 3.2163,
+      "eval_samples_per_second": 63.428,
+      "eval_steps_per_second": 8.084,
+      "step": 38
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.9852941176470589,
+      "eval_f1": 0.9852722698274712,
+      "eval_loss": 0.049169763922691345,
+      "eval_precision": 0.9853018065952722,
+      "eval_recall": 0.9852941176470589,
+      "eval_runtime": 3.1223,
+      "eval_samples_per_second": 65.336,
+      "eval_steps_per_second": 8.327,
+      "step": 51
+    },
+    {
+      "epoch": 4.9411764705882355,
+      "eval_accuracy": 0.9803921568627451,
+      "eval_f1": 0.9804969685242518,
+      "eval_loss": 0.05879249796271324,
+      "eval_precision": 0.9813976872800402,
+      "eval_recall": 0.9803921568627451,
+      "eval_runtime": 3.1449,
+      "eval_samples_per_second": 64.868,
+      "eval_steps_per_second": 8.267,
+      "step": 63
+    },
+    {
+      "epoch": 5.96078431372549,
+      "eval_accuracy": 0.9852941176470589,
+      "eval_f1": 0.9853150765112866,
+      "eval_loss": 0.03680075705051422,
+      "eval_precision": 0.9853868369053048,
+      "eval_recall": 0.9852941176470589,
+      "eval_runtime": 3.1698,
+      "eval_samples_per_second": 64.358,
+      "eval_steps_per_second": 8.203,
+      "step": 76
+    },
+    {
+      "epoch": 6.980392156862745,
+      "eval_accuracy": 0.9901960784313726,
+      "eval_f1": 0.9901663478316141,
+      "eval_loss": 0.0382298119366169,
+      "eval_precision": 0.9903446226975638,
+      "eval_recall": 0.9901960784313726,
+      "eval_runtime": 3.1376,
+      "eval_samples_per_second": 65.019,
+      "eval_steps_per_second": 8.287,
+      "step": 89
+    },
+    {
+      "epoch": 8.0,
+      "eval_accuracy": 0.9950980392156863,
+      "eval_f1": 0.995090756609157,
+      "eval_loss": 0.03175761550664902,
+      "eval_precision": 0.995135458763658,
+      "eval_recall": 0.9950980392156863,
+      "eval_runtime": 2.949,
+      "eval_samples_per_second": 69.175,
+      "eval_steps_per_second": 8.816,
+      "step": 102
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 120,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 10,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.052064945063383e+17,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-102/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3b77b2a33ca88330b7909aacab81332695e9c9dcf797e7a7757ca31ffcde6f31
+size 5240

checkpoint-114/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-114/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b910bf6b8ec6e19d58a4b52c50de712e949fcdaeece42948112d2e5d95e8f47c
+size 94763496

checkpoint-114/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:85b95917e0620b5556323a8c02ab048666c97ab19fb25f8fa5f1554c0bfc225f
+size 189552570

checkpoint-114/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-114/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:636081736c072d4bb3052b5541d861668c6c103f9a3ad62f001239e9a3a36fb1
+size 14308

checkpoint-114/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3fde2346e00a3c4644832268d0eaddcd20d8548145016394246c018bb8a28ba1
+size 1064

checkpoint-114/trainer_state.json ADDED Viewed

	@@ -0,0 +1,150 @@

+{
+  "best_metric": 0.9950980392156863,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-102",
+  "epoch": 8.941176470588236,
+  "eval_steps": 500,
+  "global_step": 114,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9411764705882353,
+      "eval_accuracy": 0.9362745098039216,
+      "eval_f1": 0.9365356058160116,
+      "eval_loss": 0.19313116371631622,
+      "eval_precision": 0.9372234219385678,
+      "eval_recall": 0.9362745098039216,
+      "eval_runtime": 3.0986,
+      "eval_samples_per_second": 65.836,
+      "eval_steps_per_second": 8.391,
+      "step": 12
+    },
+    {
+      "epoch": 1.9607843137254903,
+      "eval_accuracy": 0.9705882352941176,
+      "eval_f1": 0.9704025549613785,
+      "eval_loss": 0.09495726972818375,
+      "eval_precision": 0.971039759187257,
+      "eval_recall": 0.9705882352941176,
+      "eval_runtime": 3.1171,
+      "eval_samples_per_second": 65.446,
+      "eval_steps_per_second": 8.341,
+      "step": 25
+    },
+    {
+      "epoch": 2.980392156862745,
+      "eval_accuracy": 0.9803921568627451,
+      "eval_f1": 0.9803921568627451,
+      "eval_loss": 0.06114682927727699,
+      "eval_precision": 0.9803921568627451,
+      "eval_recall": 0.9803921568627451,
+      "eval_runtime": 3.2163,
+      "eval_samples_per_second": 63.428,
+      "eval_steps_per_second": 8.084,
+      "step": 38
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.9852941176470589,
+      "eval_f1": 0.9852722698274712,
+      "eval_loss": 0.049169763922691345,
+      "eval_precision": 0.9853018065952722,
+      "eval_recall": 0.9852941176470589,
+      "eval_runtime": 3.1223,
+      "eval_samples_per_second": 65.336,
+      "eval_steps_per_second": 8.327,
+      "step": 51
+    },
+    {
+      "epoch": 4.9411764705882355,
+      "eval_accuracy": 0.9803921568627451,
+      "eval_f1": 0.9804969685242518,
+      "eval_loss": 0.05879249796271324,
+      "eval_precision": 0.9813976872800402,
+      "eval_recall": 0.9803921568627451,
+      "eval_runtime": 3.1449,
+      "eval_samples_per_second": 64.868,
+      "eval_steps_per_second": 8.267,
+      "step": 63
+    },
+    {
+      "epoch": 5.96078431372549,
+      "eval_accuracy": 0.9852941176470589,
+      "eval_f1": 0.9853150765112866,
+      "eval_loss": 0.03680075705051422,
+      "eval_precision": 0.9853868369053048,
+      "eval_recall": 0.9852941176470589,
+      "eval_runtime": 3.1698,
+      "eval_samples_per_second": 64.358,
+      "eval_steps_per_second": 8.203,
+      "step": 76
+    },
+    {
+      "epoch": 6.980392156862745,
+      "eval_accuracy": 0.9901960784313726,
+      "eval_f1": 0.9901663478316141,
+      "eval_loss": 0.0382298119366169,
+      "eval_precision": 0.9903446226975638,
+      "eval_recall": 0.9901960784313726,
+      "eval_runtime": 3.1376,
+      "eval_samples_per_second": 65.019,
+      "eval_steps_per_second": 8.287,
+      "step": 89
+    },
+    {
+      "epoch": 8.0,
+      "eval_accuracy": 0.9950980392156863,
+      "eval_f1": 0.995090756609157,
+      "eval_loss": 0.03175761550664902,
+      "eval_precision": 0.995135458763658,
+      "eval_recall": 0.9950980392156863,
+      "eval_runtime": 2.949,
+      "eval_samples_per_second": 69.175,
+      "eval_steps_per_second": 8.816,
+      "step": 102
+    },
+    {
+      "epoch": 8.941176470588236,
+      "eval_accuracy": 0.9852941176470589,
+      "eval_f1": 0.9853150765112866,
+      "eval_loss": 0.033123087137937546,
+      "eval_precision": 0.9853868369053048,
+      "eval_recall": 0.9852941176470589,
+      "eval_runtime": 2.9458,
+      "eval_samples_per_second": 69.251,
+      "eval_steps_per_second": 8.826,
+      "step": 114
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 120,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 10,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.1834894644418458e+17,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-114/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3b77b2a33ca88330b7909aacab81332695e9c9dcf797e7a7757ca31ffcde6f31
+size 5240

checkpoint-12/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ed24ddc80fbfa0595409861cddf08e518561fbdd7c4461e5edac2ef1da033508
 size 94763496

 version https://git-lfs.github.com/spec/v1
+oid sha256:7ac774d14fe5167fbe1adddc20941f151440dc32f43d6762bbe9d60a26726e8e
 size 94763496

checkpoint-12/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cf1fd2bcc1d5386abd738663f70a4cfa450e0389d1bb46d5ebbd8d22ee0082c5
 size 189552570

 version https://git-lfs.github.com/spec/v1
+oid sha256:56315b610ef113026417660dc64000a73d31bcdf367d4ade81935feefcbbb425
 size 189552570

checkpoint-12/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0dd5e5067cb0b69c310c1cb6eb41548b436585db6c11789bed910bb1926cd7c4
 size 14308

 version https://git-lfs.github.com/spec/v1
+oid sha256:caebb0abc1e3f29ed8c6d6714ac9331ab5a6b59efbd9b310598bb00f5bca4c19
 size 14308

checkpoint-12/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:00ac470d61d5b4613444f686474fe5bf71dbe645a07555e3c0011199a78b17ab
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:4ca0321d043e24273cc9815784db5e90a317cada9c48cd156d448ab1591d936c
 size 1064

checkpoint-12/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.9558823529411765,
   "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-12",
   "epoch": 0.9411764705882353,
   "eval_steps": 500,
@@ -10,21 +10,21 @@
   "log_history": [
     {
       "epoch": 0.9411764705882353,
-      "eval_accuracy": 0.9558823529411765,
-      "eval_f1": 0.9555272696227192,
-      "eval_loss": 0.33786964416503906,
-      "eval_precision": 0.9564428025638596,
-      "eval_recall": 0.9558823529411765,
-      "eval_runtime": 3.0231,
-      "eval_samples_per_second": 67.479,
-      "eval_steps_per_second": 8.6,
       "step": 12
     }
   ],
   "logging_steps": 500,
-  "max_steps": 12,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 1,
   "save_steps": 500,
   "stateful_callbacks": {
     "EarlyStoppingCallback": {
@@ -42,12 +42,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": true
       },
       "attributes": {}
     }
   },
-  "total_flos": 1.238025689554944e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
+  "best_metric": 0.9362745098039216,
   "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-12",
   "epoch": 0.9411764705882353,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 0.9411764705882353,
+      "eval_accuracy": 0.9362745098039216,
+      "eval_f1": 0.9365356058160116,
+      "eval_loss": 0.19313116371631622,
+      "eval_precision": 0.9372234219385678,
+      "eval_recall": 0.9362745098039216,
+      "eval_runtime": 3.0986,
+      "eval_samples_per_second": 65.836,
+      "eval_steps_per_second": 8.391,
       "step": 12
     }
   ],
   "logging_steps": 500,
+  "max_steps": 120,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 10,
   "save_steps": 500,
   "stateful_callbacks": {
     "EarlyStoppingCallback": {
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": false
       },
       "attributes": {}
     }
   },
+  "total_flos": 1.315729776671232e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

checkpoint-12/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a1c27b4ecab2c1ddc610f4ce2ead133759bcabe788a27ce90b2b23560c4e6ad3
 size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:3b77b2a33ca88330b7909aacab81332695e9c9dcf797e7a7757ca31ffcde6f31
 size 5240

checkpoint-120/config.json ADDED Viewed

	@@ -0,0 +1,80 @@

+{
+  "_name_or_path": "ntu-spml/distilhubert",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": false,
+  "architectures": [
+    "HubertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 1,
+  "classifier_proj_size": 256,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "ctc_loss_reduction": "sum",
+  "ctc_zero_infinity": false,
+  "do_stable_layer_norm": false,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "feat_proj_layer_norm": false,
+  "final_dropout": 0.0,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "crying",
+    "1": "no_crying"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "crying": "0",
+    "no_crying": "1"
+  },
+  "layer_norm_eps": 1e-05,
+  "layerdrop": 0.0,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "model_type": "hubert",
+  "num_attention_heads": 12,
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_hidden_layers": 2,
+  "pad_token_id": 0,
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.2",
+  "use_weighted_layer_sum": false,
+  "vocab_size": 32
+}

checkpoint-120/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3258e17c3151e1d9899b5ecaa38ee7208137f2c975f17a7f66834494fb6f1ddb
+size 94763496

checkpoint-120/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d67e947c82c7eff62fe82e2161b429d0f674dcb710ae9e066c9aaeaa53719096
+size 189552570

checkpoint-120/preprocessor_config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "do_normalize": false,
+  "feature_extractor_type": "Wav2Vec2FeatureExtractor",
+  "feature_size": 1,
+  "padding_side": "right",
+  "padding_value": 0,
+  "return_attention_mask": false,
+  "sampling_rate": 16000
+}

checkpoint-120/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:286671099adfaa4371e8fead24d8a5f622004012b7f075f68979922946bd3511
+size 14308

checkpoint-120/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e2409fb1c3fd1c2de2c63b5459c49a97abc9a50084af4337cc5090c00ef975a6
+size 1064

checkpoint-120/trainer_state.json ADDED Viewed

	@@ -0,0 +1,162 @@

+{
+  "best_metric": 0.9950980392156863,
+  "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-102",
+  "epoch": 9.411764705882353,
+  "eval_steps": 500,
+  "global_step": 120,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9411764705882353,
+      "eval_accuracy": 0.9362745098039216,
+      "eval_f1": 0.9365356058160116,
+      "eval_loss": 0.19313116371631622,
+      "eval_precision": 0.9372234219385678,
+      "eval_recall": 0.9362745098039216,
+      "eval_runtime": 3.0986,
+      "eval_samples_per_second": 65.836,
+      "eval_steps_per_second": 8.391,
+      "step": 12
+    },
+    {
+      "epoch": 1.9607843137254903,
+      "eval_accuracy": 0.9705882352941176,
+      "eval_f1": 0.9704025549613785,
+      "eval_loss": 0.09495726972818375,
+      "eval_precision": 0.971039759187257,
+      "eval_recall": 0.9705882352941176,
+      "eval_runtime": 3.1171,
+      "eval_samples_per_second": 65.446,
+      "eval_steps_per_second": 8.341,
+      "step": 25
+    },
+    {
+      "epoch": 2.980392156862745,
+      "eval_accuracy": 0.9803921568627451,
+      "eval_f1": 0.9803921568627451,
+      "eval_loss": 0.06114682927727699,
+      "eval_precision": 0.9803921568627451,
+      "eval_recall": 0.9803921568627451,
+      "eval_runtime": 3.2163,
+      "eval_samples_per_second": 63.428,
+      "eval_steps_per_second": 8.084,
+      "step": 38
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.9852941176470589,
+      "eval_f1": 0.9852722698274712,
+      "eval_loss": 0.049169763922691345,
+      "eval_precision": 0.9853018065952722,
+      "eval_recall": 0.9852941176470589,
+      "eval_runtime": 3.1223,
+      "eval_samples_per_second": 65.336,
+      "eval_steps_per_second": 8.327,
+      "step": 51
+    },
+    {
+      "epoch": 4.9411764705882355,
+      "eval_accuracy": 0.9803921568627451,
+      "eval_f1": 0.9804969685242518,
+      "eval_loss": 0.05879249796271324,
+      "eval_precision": 0.9813976872800402,
+      "eval_recall": 0.9803921568627451,
+      "eval_runtime": 3.1449,
+      "eval_samples_per_second": 64.868,
+      "eval_steps_per_second": 8.267,
+      "step": 63
+    },
+    {
+      "epoch": 5.96078431372549,
+      "eval_accuracy": 0.9852941176470589,
+      "eval_f1": 0.9853150765112866,
+      "eval_loss": 0.03680075705051422,
+      "eval_precision": 0.9853868369053048,
+      "eval_recall": 0.9852941176470589,
+      "eval_runtime": 3.1698,
+      "eval_samples_per_second": 64.358,
+      "eval_steps_per_second": 8.203,
+      "step": 76
+    },
+    {
+      "epoch": 6.980392156862745,
+      "eval_accuracy": 0.9901960784313726,
+      "eval_f1": 0.9901663478316141,
+      "eval_loss": 0.0382298119366169,
+      "eval_precision": 0.9903446226975638,
+      "eval_recall": 0.9901960784313726,
+      "eval_runtime": 3.1376,
+      "eval_samples_per_second": 65.019,
+      "eval_steps_per_second": 8.287,
+      "step": 89
+    },
+    {
+      "epoch": 8.0,
+      "eval_accuracy": 0.9950980392156863,
+      "eval_f1": 0.995090756609157,
+      "eval_loss": 0.03175761550664902,
+      "eval_precision": 0.995135458763658,
+      "eval_recall": 0.9950980392156863,
+      "eval_runtime": 2.949,
+      "eval_samples_per_second": 69.175,
+      "eval_steps_per_second": 8.816,
+      "step": 102
+    },
+    {
+      "epoch": 8.941176470588236,
+      "eval_accuracy": 0.9852941176470589,
+      "eval_f1": 0.9853150765112866,
+      "eval_loss": 0.033123087137937546,
+      "eval_precision": 0.9853868369053048,
+      "eval_recall": 0.9852941176470589,
+      "eval_runtime": 2.9458,
+      "eval_samples_per_second": 69.251,
+      "eval_steps_per_second": 8.826,
+      "step": 114
+    },
+    {
+      "epoch": 9.411764705882353,
+      "eval_accuracy": 0.9852941176470589,
+      "eval_f1": 0.9853150765112866,
+      "eval_loss": 0.033173661679029465,
+      "eval_precision": 0.9853868369053048,
+      "eval_recall": 0.9852941176470589,
+      "eval_runtime": 2.9666,
+      "eval_samples_per_second": 68.766,
+      "eval_steps_per_second": 8.764,
+      "step": 120
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 120,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 10,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 3,
+        "early_stopping_threshold": 0.0
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.237670053721906e+17,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-120/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3b77b2a33ca88330b7909aacab81332695e9c9dcf797e7a7757ca31ffcde6f31
+size 5240

checkpoint-25/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:457aaf1ca73f2bd8fdf652ff897b1db85473a23401cdea192ccda04c31e902f9
 size 94763496

 version https://git-lfs.github.com/spec/v1
+oid sha256:da1949ab9da06d9f94ddb053df98c408f27159d75669cf1d2eb4e1cc47323344
 size 94763496

checkpoint-25/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0f78eeb88abcee76fe1f3cb427847a3366d60d465ad4933bdf631baef11c677d
 size 189552570

 version https://git-lfs.github.com/spec/v1
+oid sha256:64fe5dbcc580831e63b26cf1b5d7e9409f5b456d1141636612d7fca115a01a87
 size 189552570

checkpoint-25/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8e5c954d42fa0d2b945cf8a644f5bb95c0ecae8f78ef6f89815808920b5b330c
-size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:272c079a133d684090b7a24b10497f4bd703dbf9ecfecafe1a788c62b4404ce6
+size 14308

checkpoint-25/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:91532783b102a4c8ff5ee86df37d3662ca7a62e198729a349c132e2c9a68d5d0
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:6633f18d367676ea03844228fc7112a6a9464032824bb5f9f17a85ee888f12e8
 size 1064

checkpoint-25/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.9558823529411765,
   "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-25",
   "epoch": 1.9607843137254903,
   "eval_steps": 500,
@@ -10,33 +10,33 @@
   "log_history": [
     {
       "epoch": 0.9411764705882353,
-      "eval_accuracy": 0.9509803921568627,
-      "eval_f1": 0.9509803921568627,
-      "eval_loss": 0.19337645173072815,
-      "eval_precision": 0.9509803921568627,
-      "eval_recall": 0.9509803921568627,
-      "eval_runtime": 2.9937,
-      "eval_samples_per_second": 68.144,
-      "eval_steps_per_second": 8.685,
       "step": 12
     },
     {
       "epoch": 1.9607843137254903,
-      "eval_accuracy": 0.9558823529411765,
-      "eval_f1": 0.9558168094824137,
-      "eval_loss": 0.11207430809736252,
-      "eval_precision": 0.9558008500901145,
-      "eval_recall": 0.9558823529411765,
-      "eval_runtime": 2.9789,
-      "eval_samples_per_second": 68.481,
-      "eval_steps_per_second": 8.728,
       "step": 25
     }
   ],
   "logging_steps": 500,
-  "max_steps": 48,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 4,
   "save_steps": 500,
   "stateful_callbacks": {
     "EarlyStoppingCallback": {
@@ -59,7 +59,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 2.632285534507315e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
+  "best_metric": 0.9705882352941176,
   "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-25",
   "epoch": 1.9607843137254903,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 0.9411764705882353,
+      "eval_accuracy": 0.9362745098039216,
+      "eval_f1": 0.9365356058160116,
+      "eval_loss": 0.19313116371631622,
+      "eval_precision": 0.9372234219385678,
+      "eval_recall": 0.9362745098039216,
+      "eval_runtime": 3.0986,
+      "eval_samples_per_second": 65.836,
+      "eval_steps_per_second": 8.391,
       "step": 12
     },
     {
       "epoch": 1.9607843137254903,
+      "eval_accuracy": 0.9705882352941176,
+      "eval_f1": 0.9704025549613785,
+      "eval_loss": 0.09495726972818375,
+      "eval_precision": 0.971039759187257,
+      "eval_recall": 0.9705882352941176,
+      "eval_runtime": 3.1171,
+      "eval_samples_per_second": 65.446,
+      "eval_steps_per_second": 8.341,
       "step": 25
     }
   ],
   "logging_steps": 500,
+  "max_steps": 120,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 10,
   "save_steps": 500,
   "stateful_callbacks": {
     "EarlyStoppingCallback": {
       "attributes": {}
     }
   },
+  "total_flos": 2.630848254506803e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

checkpoint-25/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b08c1ef2199623b781e926f1d827964186fca47326620731302bfe37c5d058b9
 size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:3b77b2a33ca88330b7909aacab81332695e9c9dcf797e7a7757ca31ffcde6f31
 size 5240

checkpoint-38/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:365a9fb794f55008ff39b21086b11700c109a194efb2127a6db2145604a614b6
 size 94763496

 version https://git-lfs.github.com/spec/v1
+oid sha256:d8bc28d8ebd1dbdd73656a784624c72928eb10e21d9e6acdce2e1d312d787010
 size 94763496

checkpoint-38/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:198372300c7cb71ea5cd197e4b8f17970da74cfc971f4a284751e8c5c2fe5397
 size 189552570

 version https://git-lfs.github.com/spec/v1
+oid sha256:0ee1b6c4df5d7a5ef50f7350cb964bab9875222b057b8eb71768826fceb9156f
 size 189552570

checkpoint-38/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:780c51c50482e6e8f628b4687957abc3bb4ff7f96b977c02d8538cf6f0d2d494
-size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:4d19f57e20f91b35ae6289880b02cdfa14033ed6b20b4d1730bfb179a9264102
+size 14308

checkpoint-38/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:96ddec5715a7e2a3cc7175b7f159a7e1fd2303094015b4bffdae6a236e889974
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:5df84074f7631c8ca35330b9e20d4190996409e954261c1b476ad0fabe74b93b
 size 1064

checkpoint-38/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.9607843137254902,
   "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-38",
   "epoch": 2.980392156862745,
   "eval_steps": 500,
@@ -10,45 +10,45 @@
   "log_history": [
     {
       "epoch": 0.9411764705882353,
-      "eval_accuracy": 0.9509803921568627,
-      "eval_f1": 0.9509803921568627,
-      "eval_loss": 0.19337645173072815,
-      "eval_precision": 0.9509803921568627,
-      "eval_recall": 0.9509803921568627,
-      "eval_runtime": 2.9937,
-      "eval_samples_per_second": 68.144,
-      "eval_steps_per_second": 8.685,
       "step": 12
     },
     {
       "epoch": 1.9607843137254903,
-      "eval_accuracy": 0.9558823529411765,
-      "eval_f1": 0.9558168094824137,
-      "eval_loss": 0.11207430809736252,
-      "eval_precision": 0.9558008500901145,
-      "eval_recall": 0.9558823529411765,
-      "eval_runtime": 2.9789,
-      "eval_samples_per_second": 68.481,
-      "eval_steps_per_second": 8.728,
       "step": 25
     },
     {
       "epoch": 2.980392156862745,
-      "eval_accuracy": 0.9607843137254902,
-      "eval_f1": 0.9608937528499771,
-      "eval_loss": 0.08983828127384186,
-      "eval_precision": 0.9611995291537668,
-      "eval_recall": 0.9607843137254902,
-      "eval_runtime": 2.927,
-      "eval_samples_per_second": 69.695,
-      "eval_steps_per_second": 8.883,
       "step": 38
     }
   ],
   "logging_steps": 500,
-  "max_steps": 48,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 4,
   "save_steps": 500,
   "stateful_callbacks": {
     "EarlyStoppingCallback": {
@@ -71,7 +71,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 3.947040143988326e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
+  "best_metric": 0.9803921568627451,
   "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-38",
   "epoch": 2.980392156862745,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 0.9411764705882353,
+      "eval_accuracy": 0.9362745098039216,
+      "eval_f1": 0.9365356058160116,
+      "eval_loss": 0.19313116371631622,
+      "eval_precision": 0.9372234219385678,
+      "eval_recall": 0.9362745098039216,
+      "eval_runtime": 3.0986,
+      "eval_samples_per_second": 65.836,
+      "eval_steps_per_second": 8.391,
       "step": 12
     },
     {
       "epoch": 1.9607843137254903,
+      "eval_accuracy": 0.9705882352941176,
+      "eval_f1": 0.9704025549613785,
+      "eval_loss": 0.09495726972818375,
+      "eval_precision": 0.971039759187257,
+      "eval_recall": 0.9705882352941176,
+      "eval_runtime": 3.1171,
+      "eval_samples_per_second": 65.446,
+      "eval_steps_per_second": 8.341,
       "step": 25
     },
     {
       "epoch": 2.980392156862745,
+      "eval_accuracy": 0.9803921568627451,
+      "eval_f1": 0.9803921568627451,
+      "eval_loss": 0.06114682927727699,
+      "eval_precision": 0.9803921568627451,
+      "eval_recall": 0.9803921568627451,
+      "eval_runtime": 3.2163,
+      "eval_samples_per_second": 63.428,
+      "eval_steps_per_second": 8.084,
       "step": 38
     }
   ],
   "logging_steps": 500,
+  "max_steps": 120,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 10,
   "save_steps": 500,
   "stateful_callbacks": {
     "EarlyStoppingCallback": {
       "attributes": {}
     }
   },
+  "total_flos": 3.946056334924685e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

checkpoint-38/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b08c1ef2199623b781e926f1d827964186fca47326620731302bfe37c5d058b9
 size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:3b77b2a33ca88330b7909aacab81332695e9c9dcf797e7a7757ca31ffcde6f31
 size 5240

checkpoint-51/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8e9b6729c50f84d9b261120a8e72c4b3a3da69e27bb43431fdcd37c673c45006
 size 94763496

 version https://git-lfs.github.com/spec/v1
+oid sha256:072781416d7434132c8e1b73276d4503dca0b1b8db503afa1a8ba07bc69b3ae9
 size 94763496

checkpoint-51/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:461ec76d1bc7a1e71c52a5302f7d5be7e5eec1ad9fc45cdec1c8d7a0e5e545c1
 size 189552570

 version https://git-lfs.github.com/spec/v1
+oid sha256:da71c2ca09d32a4c673ba10e3259d6198c7a2fbaa9004a4a0eaa7d9cc8d8fecb
 size 189552570

checkpoint-51/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8bfb428aabf8fc7d0150525679311cfec661fbbda39191a37add4ec1737f1b54
-size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:bdc415b22b0f41c29b31b3bf40c83a0c3865a35793ba92c48d3d575e69ed5279
+size 14308

checkpoint-51/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bec8121eea0c42c283a1e74848057f68b938b9185ee7ce8d2f0f77b15cf4fe84
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:99f2e94f9942cdbd4528ad8ed9baf4498c04d7503c2ef6dab9521dfcb4021a49
 size 1064

checkpoint-51/trainer_state.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "best_metric": 0.9705882352941176,
   "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-51",
   "epoch": 4.0,
   "eval_steps": 500,
@@ -10,57 +10,57 @@
   "log_history": [
     {
       "epoch": 0.9411764705882353,
-      "eval_accuracy": 0.9558823529411765,
-      "eval_f1": 0.9558168094824137,
-      "eval_loss": 0.18768352270126343,
-      "eval_precision": 0.9558008500901145,
-      "eval_recall": 0.9558823529411765,
-      "eval_runtime": 3.1767,
-      "eval_samples_per_second": 64.218,
-      "eval_steps_per_second": 8.185,
       "step": 12
     },
     {
       "epoch": 1.9607843137254903,
-      "eval_accuracy": 0.9607843137254902,
-      "eval_f1": 0.9603980954872683,
-      "eval_loss": 0.10839918255805969,
-      "eval_precision": 0.961865628604383,
-      "eval_recall": 0.9607843137254902,
-      "eval_runtime": 3.1396,
-      "eval_samples_per_second": 64.977,
-      "eval_steps_per_second": 8.281,
       "step": 25
     },
     {
       "epoch": 2.980392156862745,
-      "eval_accuracy": 0.9607843137254902,
-      "eval_f1": 0.9608937528499771,
-      "eval_loss": 0.07022649049758911,
-      "eval_precision": 0.9611995291537668,
-      "eval_recall": 0.9607843137254902,
-      "eval_runtime": 3.1392,
-      "eval_samples_per_second": 64.985,
-      "eval_steps_per_second": 8.282,
       "step": 38
     },
     {
       "epoch": 4.0,
-      "eval_accuracy": 0.9705882352941176,
-      "eval_f1": 0.9707454527863777,
-      "eval_loss": 0.05151732638478279,
-      "eval_precision": 0.9716895305130601,
-      "eval_recall": 0.9705882352941176,
-      "eval_runtime": 3.1558,
-      "eval_samples_per_second": 64.644,
-      "eval_steps_per_second": 8.239,
       "step": 51
     }
   ],
   "logging_steps": 500,
-  "max_steps": 96,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 8,
   "save_steps": 500,
   "stateful_callbacks": {
     "EarlyStoppingCallback": {
@@ -83,7 +83,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 5.25877328162016e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
+  "best_metric": 0.9852941176470589,
   "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-51",
   "epoch": 4.0,
   "eval_steps": 500,
   "log_history": [
     {
       "epoch": 0.9411764705882353,
+      "eval_accuracy": 0.9362745098039216,
+      "eval_f1": 0.9365356058160116,
+      "eval_loss": 0.19313116371631622,
+      "eval_precision": 0.9372234219385678,
+      "eval_recall": 0.9362745098039216,
+      "eval_runtime": 3.0986,
+      "eval_samples_per_second": 65.836,
+      "eval_steps_per_second": 8.391,
       "step": 12
     },
     {
       "epoch": 1.9607843137254903,
+      "eval_accuracy": 0.9705882352941176,
+      "eval_f1": 0.9704025549613785,
+      "eval_loss": 0.09495726972818375,
+      "eval_precision": 0.971039759187257,
+      "eval_recall": 0.9705882352941176,
+      "eval_runtime": 3.1171,
+      "eval_samples_per_second": 65.446,
+      "eval_steps_per_second": 8.341,
       "step": 25
     },
     {
       "epoch": 2.980392156862745,
+      "eval_accuracy": 0.9803921568627451,
+      "eval_f1": 0.9803921568627451,
+      "eval_loss": 0.06114682927727699,
+      "eval_precision": 0.9803921568627451,
+      "eval_recall": 0.9803921568627451,
+      "eval_runtime": 3.2163,
+      "eval_samples_per_second": 63.428,
+      "eval_steps_per_second": 8.084,
       "step": 38
     },
     {
       "epoch": 4.0,
+      "eval_accuracy": 0.9852941176470589,
+      "eval_f1": 0.9852722698274712,
+      "eval_loss": 0.049169763922691345,
+      "eval_precision": 0.9853018065952722,
+      "eval_recall": 0.9852941176470589,
+      "eval_runtime": 3.1223,
+      "eval_samples_per_second": 65.336,
+      "eval_steps_per_second": 8.327,
       "step": 51
     }
   ],
   "logging_steps": 500,
+  "max_steps": 120,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 10,
   "save_steps": 500,
   "stateful_callbacks": {
     "EarlyStoppingCallback": {
       "attributes": {}
     }
   },
+  "total_flos": 5.261731531342733e+16,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

checkpoint-51/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ecc689edbe3573cb27ca0a4ddd21670a9f672918abacfb53cac5b55b680695a7
 size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:3b77b2a33ca88330b7909aacab81332695e9c9dcf797e7a7757ca31ffcde6f31
 size 5240

checkpoint-63/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fc362a1585df3481e2dcd870193d28d930ae325d6150daaaad1493b1996de42f
 size 94763496

 version https://git-lfs.github.com/spec/v1
+oid sha256:2c1568086524c8dced6705098aa1db3285da46fd4a5391fa6b9d6eb7df4502d4
 size 94763496