diff --git a/README.md b/README.md index 417a04d01ae5eaa82c450f544fa58c9cdab2e011..be579bc95277f8c0ff84913be5c67b1b4c186407 100644 --- a/README.md +++ b/README.md @@ -21,11 +21,11 @@ should probably proofread and complete it, then remove this comment. --> This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on an unknown dataset. It achieves the following results on the evaluation set: -- Loss: 0.0625 -- Accuracy: 0.9824 -- Precision: 0.9825 -- Recall: 0.9824 -- F1: 0.9824 +- Loss: 0.0338 +- Accuracy: 0.9912 +- Precision: 0.9912 +- Recall: 0.9912 +- F1: 0.9912 ## Model description @@ -53,16 +53,22 @@ The following hyperparameters were used during training: - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08 - lr_scheduler_type: cosine - lr_scheduler_warmup_ratio: 0.001 -- num_epochs: 4 +- num_epochs: 10 ### Training results | Training Loss | Epoch | Step | Validation Loss | Accuracy | Precision | Recall | F1 | |:-------------:|:------:|:----:|:---------------:|:--------:|:---------:|:------:|:------:| -| No log | 0.9956 | 85 | 0.1378 | 0.9546 | 0.9543 | 0.9546 | 0.9544 | -| No log | 1.9912 | 170 | 0.0802 | 0.9714 | 0.9713 | 0.9714 | 0.9714 | -| No log | 2.9985 | 256 | 0.0682 | 0.9780 | 0.9783 | 0.9780 | 0.9781 | -| No log | 3.9824 | 340 | 0.0625 | 0.9824 | 0.9825 | 0.9824 | 0.9824 | +| No log | 0.9956 | 85 | 0.1197 | 0.9538 | 0.9535 | 0.9538 | 0.9536 | +| No log | 1.9912 | 170 | 0.0601 | 0.9832 | 0.9831 | 0.9832 | 0.9831 | +| No log | 2.9985 | 256 | 0.0506 | 0.9868 | 0.9868 | 0.9868 | 0.9868 | +| No log | 3.9941 | 341 | 0.0461 | 0.9861 | 0.9864 | 0.9861 | 0.9862 | +| No log | 4.9898 | 426 | 0.0439 | 0.9890 | 0.9891 | 0.9890 | 0.9890 | +| 0.0779 | 5.9971 | 512 | 0.0396 | 0.9905 | 0.9905 | 0.9905 | 0.9905 | +| 0.0779 | 6.9927 | 597 | 0.0350 | 0.9919 | 0.9919 | 0.9919 | 0.9919 | +| 0.0779 | 8.0 | 683 | 0.0335 | 0.9912 | 0.9912 | 0.9912 | 0.9912 | +| 0.0779 | 8.9956 | 768 | 0.0337 | 0.9912 | 0.9912 | 0.9912 | 0.9912 | +| 0.0779 | 9.9561 | 850 | 0.0338 | 0.9912 | 0.9912 | 0.9912 | 0.9912 | ### Framework versions diff --git a/checkpoint-170/config.json b/checkpoint-170/config.json index a8097f6a414b056b727b26aa15ffac67f0897e4b..23cd00c8f7806f9961fb35e24a24f5d256693560 100644 --- a/checkpoint-170/config.json +++ b/checkpoint-170/config.json @@ -55,10 +55,6 @@ }, "initializer_range": 0.02, "intermediate_size": 3072, - "label2id": { - "crying": 0, - "no_crying": 1 - }, "layer_norm_eps": 1e-05, "layerdrop": 0.0, "mask_feature_length": 10, diff --git a/checkpoint-170/model.safetensors b/checkpoint-170/model.safetensors index 6a50e39f6a58d280dbbe271aa2c56c8d349f4f48..74c739d41a0b1174ceca3d8a32599306e4bafacb 100644 --- a/checkpoint-170/model.safetensors +++ b/checkpoint-170/model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e8a90553b00c4439fad5a7ed1ff0a9f76e60e707d76e5d455fd77360dff39ae0 +oid sha256:c27ce70effb26d2c4fae3a9e5f9435a7adf1d9096be67f3e04eaf7266135f148 size 94763496 diff --git a/checkpoint-170/optimizer.pt b/checkpoint-170/optimizer.pt index 41017a1dd3bed2b3c2a99fc13943f3bfde425111..fd36b76e26698568e8094163549ea04b0860f06f 100644 --- a/checkpoint-170/optimizer.pt +++ b/checkpoint-170/optimizer.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2dba3cd8b01d3153e53635bf2a218b801d4fb4cfcf7a5f02fc1c0e0d267aeace +oid sha256:f521c92737364b558a7a1f423ef220dcbbcf0650e982c3e4d1b202ec007872c8 size 189552570 diff --git a/checkpoint-170/scheduler.pt b/checkpoint-170/scheduler.pt index ccec86cfa137b40efead0ae6ec0e51e94de1c9ab..ff6c0e1dcc11d85fbad00be1957ade82b7bc8cae 100644 --- a/checkpoint-170/scheduler.pt +++ b/checkpoint-170/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:44565a4b1d8937c55d485ff9cf817bf33c36c26adc047340853e15a70d1a023d +oid sha256:ba2c60537414c36d76239817fe1c8be075bed144e4b9d191a70b981deda17823 size 1064 diff --git a/checkpoint-170/trainer_state.json b/checkpoint-170/trainer_state.json index fbbe16677b26f57942aaa1321c7efa45e0855706..ae3705ed21ebef2070ac1d83a93f932b55b631be 100644 --- a/checkpoint-170/trainer_state.json +++ b/checkpoint-170/trainer_state.json @@ -1,6 +1,6 @@ { - "best_metric": 0.9714285714285714, - "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-170", + "best_metric": 0.9831501831501831, + "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-170", "epoch": 1.9912152269399708, "eval_steps": 500, "global_step": 170, @@ -10,33 +10,33 @@ "log_history": [ { "epoch": 0.9956076134699854, - "eval_accuracy": 0.9545787545787546, - "eval_f1": 0.9543924849872077, - "eval_loss": 0.13782845437526703, - "eval_precision": 0.9543323172404159, - "eval_recall": 0.9545787545787546, - "eval_runtime": 6.1437, - "eval_samples_per_second": 222.18, - "eval_steps_per_second": 27.834, + "eval_accuracy": 0.9538461538461539, + "eval_f1": 0.9535883665206972, + "eval_loss": 0.11965569853782654, + "eval_precision": 0.9535470731605858, + "eval_recall": 0.9538461538461539, + "eval_runtime": 5.8661, + "eval_samples_per_second": 232.691, + "eval_steps_per_second": 29.15, "step": 85 }, { "epoch": 1.9912152269399708, - "eval_accuracy": 0.9714285714285714, - "eval_f1": 0.9713707024010776, - "eval_loss": 0.0802176371216774, - "eval_precision": 0.9713449610559759, - "eval_recall": 0.9714285714285714, - "eval_runtime": 6.0836, - "eval_samples_per_second": 224.373, - "eval_steps_per_second": 28.108, + "eval_accuracy": 0.9831501831501831, + "eval_f1": 0.983143153392684, + "eval_loss": 0.060115572065114975, + "eval_precision": 0.9831374404084774, + "eval_recall": 0.9831501831501831, + "eval_runtime": 5.9254, + "eval_samples_per_second": 230.365, + "eval_steps_per_second": 28.859, "step": 170 } ], "logging_steps": 500, - "max_steps": 340, + "max_steps": 850, "num_input_tokens_seen": 0, - "num_train_epochs": 4, + "num_train_epochs": 10, "save_steps": 500, "stateful_callbacks": { "EarlyStoppingCallback": { diff --git a/checkpoint-170/training_args.bin b/checkpoint-170/training_args.bin index 7bfc5bd20dcd0c05fb8658eb0e6ae87fef5fc784..5d762b1cb8eeee08ab8703debb3a686abe8615eb 100644 --- a/checkpoint-170/training_args.bin +++ b/checkpoint-170/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a7bd8e997c05f23ae464180f8e5e9f881e9c68322e4fcd3f855e79e2e5d54fbb +oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b size 5240 diff --git a/checkpoint-256/config.json b/checkpoint-256/config.json index a8097f6a414b056b727b26aa15ffac67f0897e4b..23cd00c8f7806f9961fb35e24a24f5d256693560 100644 --- a/checkpoint-256/config.json +++ b/checkpoint-256/config.json @@ -55,10 +55,6 @@ }, "initializer_range": 0.02, "intermediate_size": 3072, - "label2id": { - "crying": 0, - "no_crying": 1 - }, "layer_norm_eps": 1e-05, "layerdrop": 0.0, "mask_feature_length": 10, diff --git a/checkpoint-256/model.safetensors b/checkpoint-256/model.safetensors index 6a4a4697475ccbcddde58e08288809bf4960107d..456bede8b1b657b71434c461505cd95e6bf223a7 100644 --- a/checkpoint-256/model.safetensors +++ b/checkpoint-256/model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:18d5013bf626b187ac7bbd42a7fb1a1b824c821cd062c951de17f19d9fb95944 +oid sha256:2992b8dfd27781b5920e6b800dd0bec2a8809a5eb8c0508b6726dd68807c3b6d size 94763496 diff --git a/checkpoint-256/optimizer.pt b/checkpoint-256/optimizer.pt index ee6bf2bf45058d8732b2308240150cd20cff9ca4..c4dc9890ba210142b5e5118838cdb443ab0df30c 100644 --- a/checkpoint-256/optimizer.pt +++ b/checkpoint-256/optimizer.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7187577ead7a6d35f35a5dc44c0b76b32036040837b41821bc67970a2dde3ed2 +oid sha256:cb0f801198c29f1cc11cf39d019a185562336bfbfdee4056f15cc25e0604767a size 189552570 diff --git a/checkpoint-256/scheduler.pt b/checkpoint-256/scheduler.pt index 3f4b5df0a8d3938beefed6ffad1da45947190f87..f7900b290ffe4d627970ae8b847c339b29330299 100644 --- a/checkpoint-256/scheduler.pt +++ b/checkpoint-256/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eed9846f2cf239e8810dae264b4e0fe505a115ec40d5b4f9abdb240e9e0a0fae +oid sha256:0ea8c99bcd3f4c186db34ca4e9cbe89b586ea3bd6cf9703b17e9ec1f6c1ff961 size 1064 diff --git a/checkpoint-256/trainer_state.json b/checkpoint-256/trainer_state.json index d4e75f1332545bc1e7ad81fd6e0e7c8b6e2877b8..72077a24ee62b34804e883d99889ae723f9b3b24 100644 --- a/checkpoint-256/trainer_state.json +++ b/checkpoint-256/trainer_state.json @@ -1,6 +1,6 @@ { - "best_metric": 0.978021978021978, - "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-256", + "best_metric": 0.9868131868131869, + "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-256", "epoch": 2.998535871156662, "eval_steps": 500, "global_step": 256, @@ -10,45 +10,45 @@ "log_history": [ { "epoch": 0.9956076134699854, - "eval_accuracy": 0.9545787545787546, - "eval_f1": 0.9543924849872077, - "eval_loss": 0.13782845437526703, - "eval_precision": 0.9543323172404159, - "eval_recall": 0.9545787545787546, - "eval_runtime": 6.1437, - "eval_samples_per_second": 222.18, - "eval_steps_per_second": 27.834, + "eval_accuracy": 0.9538461538461539, + "eval_f1": 0.9535883665206972, + "eval_loss": 0.11965569853782654, + "eval_precision": 0.9535470731605858, + "eval_recall": 0.9538461538461539, + "eval_runtime": 5.8661, + "eval_samples_per_second": 232.691, + "eval_steps_per_second": 29.15, "step": 85 }, { "epoch": 1.9912152269399708, - "eval_accuracy": 0.9714285714285714, - "eval_f1": 0.9713707024010776, - "eval_loss": 0.0802176371216774, - "eval_precision": 0.9713449610559759, - "eval_recall": 0.9714285714285714, - "eval_runtime": 6.0836, - "eval_samples_per_second": 224.373, - "eval_steps_per_second": 28.108, + "eval_accuracy": 0.9831501831501831, + "eval_f1": 0.983143153392684, + "eval_loss": 0.060115572065114975, + "eval_precision": 0.9831374404084774, + "eval_recall": 0.9831501831501831, + "eval_runtime": 5.9254, + "eval_samples_per_second": 230.365, + "eval_steps_per_second": 28.859, "step": 170 }, { "epoch": 2.998535871156662, - "eval_accuracy": 0.978021978021978, - "eval_f1": 0.9781077738703647, - "eval_loss": 0.06824816763401031, - "eval_precision": 0.9783204609221348, - "eval_recall": 0.978021978021978, - "eval_runtime": 6.0791, - "eval_samples_per_second": 224.54, - "eval_steps_per_second": 28.129, + "eval_accuracy": 0.9868131868131869, + "eval_f1": 0.9868241092241091, + "eval_loss": 0.05060575157403946, + "eval_precision": 0.9868403029537207, + "eval_recall": 0.9868131868131869, + "eval_runtime": 5.9299, + "eval_samples_per_second": 230.189, + "eval_steps_per_second": 28.837, "step": 256 } ], "logging_steps": 500, - "max_steps": 340, + "max_steps": 850, "num_input_tokens_seen": 0, - "num_train_epochs": 4, + "num_train_epochs": 10, "save_steps": 500, "stateful_callbacks": { "EarlyStoppingCallback": { diff --git a/checkpoint-256/training_args.bin b/checkpoint-256/training_args.bin index 7bfc5bd20dcd0c05fb8658eb0e6ae87fef5fc784..5d762b1cb8eeee08ab8703debb3a686abe8615eb 100644 --- a/checkpoint-256/training_args.bin +++ b/checkpoint-256/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a7bd8e997c05f23ae464180f8e5e9f881e9c68322e4fcd3f855e79e2e5d54fbb +oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b size 5240 diff --git a/checkpoint-341/config.json b/checkpoint-341/config.json index a8097f6a414b056b727b26aa15ffac67f0897e4b..23cd00c8f7806f9961fb35e24a24f5d256693560 100644 --- a/checkpoint-341/config.json +++ b/checkpoint-341/config.json @@ -55,10 +55,6 @@ }, "initializer_range": 0.02, "intermediate_size": 3072, - "label2id": { - "crying": 0, - "no_crying": 1 - }, "layer_norm_eps": 1e-05, "layerdrop": 0.0, "mask_feature_length": 10, diff --git a/checkpoint-341/model.safetensors b/checkpoint-341/model.safetensors index 85df0ea5910a70822c5c241a6778444ef41e16db..0bb22ba16803df8e9019103965f08818bb330dfb 100644 --- a/checkpoint-341/model.safetensors +++ b/checkpoint-341/model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4aef887b699e0e2fffd8fb2dabc3a3ee00a823581110ae055322fc7dccddae5f +oid sha256:a3fb881f587c38faf027d9d2f92c1142607ce7f334b76baccc3fafe76fbc4f38 size 94763496 diff --git a/checkpoint-341/optimizer.pt b/checkpoint-341/optimizer.pt index 47a44b97570594c94ef6b875dbfef719c3440439..ec5f176cb7c35b1ce96e960b54b3d15da589e84e 100644 --- a/checkpoint-341/optimizer.pt +++ b/checkpoint-341/optimizer.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1f9a8acfee398336615756edc66f296d1f801d2fde4edac691df5318d5bad0e5 +oid sha256:62cf0c2fa4abd219e7fa80805ad290927ba54a46ecf6203e78bc102ea268400c size 189552570 diff --git a/checkpoint-341/trainer_state.json b/checkpoint-341/trainer_state.json index d497e4469373528427057e2a6460d6b8fcc42799..63137027efece7c37d018e4d0a85c48f7b7388c1 100644 --- a/checkpoint-341/trainer_state.json +++ b/checkpoint-341/trainer_state.json @@ -1,6 +1,6 @@ { - "best_metric": 0.9875457875457876, - "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341", + "best_metric": 0.9868131868131869, + "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-256", "epoch": 3.994143484626647, "eval_steps": 500, "global_step": 341, @@ -10,50 +10,50 @@ "log_history": [ { "epoch": 0.9956076134699854, - "eval_accuracy": 0.9663003663003663, - "eval_f1": 0.9661425019393345, - "eval_loss": 0.10625720024108887, - "eval_precision": 0.966167198143384, - "eval_recall": 0.9663003663003663, - "eval_runtime": 6.2148, - "eval_samples_per_second": 219.638, - "eval_steps_per_second": 27.515, + "eval_accuracy": 0.9538461538461539, + "eval_f1": 0.9535883665206972, + "eval_loss": 0.11965569853782654, + "eval_precision": 0.9535470731605858, + "eval_recall": 0.9538461538461539, + "eval_runtime": 5.8661, + "eval_samples_per_second": 232.691, + "eval_steps_per_second": 29.15, "step": 85 }, { "epoch": 1.9912152269399708, - "eval_accuracy": 0.9824175824175824, - "eval_f1": 0.9824569651195038, - "eval_loss": 0.06455090641975403, - "eval_precision": 0.9825418778671476, - "eval_recall": 0.9824175824175824, - "eval_runtime": 5.7635, - "eval_samples_per_second": 236.835, - "eval_steps_per_second": 29.669, + "eval_accuracy": 0.9831501831501831, + "eval_f1": 0.983143153392684, + "eval_loss": 0.060115572065114975, + "eval_precision": 0.9831374404084774, + "eval_recall": 0.9831501831501831, + "eval_runtime": 5.9254, + "eval_samples_per_second": 230.365, + "eval_steps_per_second": 28.859, "step": 170 }, { "epoch": 2.998535871156662, "eval_accuracy": 0.9868131868131869, - "eval_f1": 0.9868427238396278, - "eval_loss": 0.04568345472216606, - "eval_precision": 0.98691808355097, + "eval_f1": 0.9868241092241091, + "eval_loss": 0.05060575157403946, + "eval_precision": 0.9868403029537207, "eval_recall": 0.9868131868131869, - "eval_runtime": 6.1234, - "eval_samples_per_second": 222.916, - "eval_steps_per_second": 27.926, + "eval_runtime": 5.9299, + "eval_samples_per_second": 230.189, + "eval_steps_per_second": 28.837, "step": 256 }, { "epoch": 3.994143484626647, - "eval_accuracy": 0.9875457875457876, - "eval_f1": 0.9875962963533335, - "eval_loss": 0.049539219588041306, - "eval_precision": 0.9877998892958556, - "eval_recall": 0.9875457875457876, - "eval_runtime": 6.1353, - "eval_samples_per_second": 222.481, - "eval_steps_per_second": 27.871, + "eval_accuracy": 0.9860805860805861, + "eval_f1": 0.9861535269385863, + "eval_loss": 0.04610973969101906, + "eval_precision": 0.986445121171901, + "eval_recall": 0.9860805860805861, + "eval_runtime": 5.9428, + "eval_samples_per_second": 229.69, + "eval_steps_per_second": 28.774, "step": 341 } ], diff --git a/checkpoint-341/training_args.bin b/checkpoint-341/training_args.bin index 269ba3bdd5c1bb997989b9e397e30230a149b155..5d762b1cb8eeee08ab8703debb3a686abe8615eb 100644 --- a/checkpoint-341/training_args.bin +++ b/checkpoint-341/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:325406b343874b92345e9a863970ee7cd441131f2850f47ab026ed810d19a88c +oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b size 5240 diff --git a/checkpoint-426/config.json b/checkpoint-426/config.json index a8097f6a414b056b727b26aa15ffac67f0897e4b..23cd00c8f7806f9961fb35e24a24f5d256693560 100644 --- a/checkpoint-426/config.json +++ b/checkpoint-426/config.json @@ -55,10 +55,6 @@ }, "initializer_range": 0.02, "intermediate_size": 3072, - "label2id": { - "crying": 0, - "no_crying": 1 - }, "layer_norm_eps": 1e-05, "layerdrop": 0.0, "mask_feature_length": 10, diff --git a/checkpoint-426/model.safetensors b/checkpoint-426/model.safetensors index 40e42894fea84b3487a8e019665920772c7ecfe9..18afb142bcc571295e545241979243713c8324fc 100644 --- a/checkpoint-426/model.safetensors +++ b/checkpoint-426/model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4ccd0853b18fcef29f6c50370c40938c3fc157e6d6ab4f5a8cc0ee4de4c2a330 +oid sha256:f21392d62c0aae2cb86ef601a6fdd136f97139074d9fc1a5418821cfd21d8f2f size 94763496 diff --git a/checkpoint-426/optimizer.pt b/checkpoint-426/optimizer.pt index 1854f76a3aad589600291c3f40383d77f129cd61..f49936db5710a0ec5b1ca921318167f781837af8 100644 --- a/checkpoint-426/optimizer.pt +++ b/checkpoint-426/optimizer.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:58cf1896c9f8575d9e790921f864e581859c2dd6014460c20f2981f52787a4a4 +oid sha256:54aacdf3b8335705d217fdd88584f914b41fdc67436f327708a19652d4774b8e size 189552570 diff --git a/checkpoint-426/scheduler.pt b/checkpoint-426/scheduler.pt index a89efae5254e3592d2d5203ed5f84b811fc226c9..4fbb1b94a920ce7ed1be2a946161afff20aa8894 100644 --- a/checkpoint-426/scheduler.pt +++ b/checkpoint-426/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:77da8d31fe5105cdaffd1de28e960ad7041d43ef167667465d3bd1e966ae27b0 +oid sha256:579ef0f1564878cc661672a4c8ce1e561a689fa403a5862a5af2e3ad39ed51e9 size 1064 diff --git a/checkpoint-426/trainer_state.json b/checkpoint-426/trainer_state.json index a8266b4c2cb62d48037fc15d11b66a9d6a13eb22..36a45a01a7729b138cf1358b471c8deb20b15b4e 100644 --- a/checkpoint-426/trainer_state.json +++ b/checkpoint-426/trainer_state.json @@ -1,6 +1,6 @@ { - "best_metric": 0.991941391941392, - "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341", + "best_metric": 0.989010989010989, + "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-426", "epoch": 4.989751098096632, "eval_steps": 500, "global_step": 426, @@ -10,69 +10,69 @@ "log_history": [ { "epoch": 0.9956076134699854, - "eval_accuracy": 0.9597069597069597, - "eval_f1": 0.9599836188656065, - "eval_loss": 0.12706419825553894, - "eval_precision": 0.960694098126733, - "eval_recall": 0.9597069597069597, - "eval_runtime": 6.1839, - "eval_samples_per_second": 220.733, - "eval_steps_per_second": 27.652, + "eval_accuracy": 0.9538461538461539, + "eval_f1": 0.9535883665206972, + "eval_loss": 0.11965569853782654, + "eval_precision": 0.9535470731605858, + "eval_recall": 0.9538461538461539, + "eval_runtime": 5.8661, + "eval_samples_per_second": 232.691, + "eval_steps_per_second": 29.15, "step": 85 }, { "epoch": 1.9912152269399708, - "eval_accuracy": 0.9787545787545787, - "eval_f1": 0.9788099592207686, - "eval_loss": 0.07009062170982361, - "eval_precision": 0.9789268917610887, - "eval_recall": 0.9787545787545787, - "eval_runtime": 6.2624, - "eval_samples_per_second": 217.969, - "eval_steps_per_second": 27.306, + "eval_accuracy": 0.9831501831501831, + "eval_f1": 0.983143153392684, + "eval_loss": 0.060115572065114975, + "eval_precision": 0.9831374404084774, + "eval_recall": 0.9831501831501831, + "eval_runtime": 5.9254, + "eval_samples_per_second": 230.365, + "eval_steps_per_second": 28.859, "step": 170 }, { "epoch": 2.998535871156662, - "eval_accuracy": 0.9831501831501831, - "eval_f1": 0.9831941055888854, - "eval_loss": 0.06720960885286331, - "eval_precision": 0.9832999772248476, - "eval_recall": 0.9831501831501831, - "eval_runtime": 5.9845, - "eval_samples_per_second": 228.09, - "eval_steps_per_second": 28.574, + "eval_accuracy": 0.9868131868131869, + "eval_f1": 0.9868241092241091, + "eval_loss": 0.05060575157403946, + "eval_precision": 0.9868403029537207, + "eval_recall": 0.9868131868131869, + "eval_runtime": 5.9299, + "eval_samples_per_second": 230.189, + "eval_steps_per_second": 28.837, "step": 256 }, { "epoch": 3.994143484626647, - "eval_accuracy": 0.991941391941392, - "eval_f1": 0.9919444380146174, - "eval_loss": 0.04145079106092453, - "eval_precision": 0.9919487758943655, - "eval_recall": 0.991941391941392, - "eval_runtime": 6.1222, - "eval_samples_per_second": 222.958, - "eval_steps_per_second": 27.931, + "eval_accuracy": 0.9860805860805861, + "eval_f1": 0.9861535269385863, + "eval_loss": 0.04610973969101906, + "eval_precision": 0.986445121171901, + "eval_recall": 0.9860805860805861, + "eval_runtime": 5.9428, + "eval_samples_per_second": 229.69, + "eval_steps_per_second": 28.774, "step": 341 }, { "epoch": 4.989751098096632, - "eval_accuracy": 0.991941391941392, - "eval_f1": 0.9919444380146174, - "eval_loss": 0.037522196769714355, - "eval_precision": 0.9919487758943655, - "eval_recall": 0.991941391941392, - "eval_runtime": 6.1601, - "eval_samples_per_second": 221.586, - "eval_steps_per_second": 27.759, + "eval_accuracy": 0.989010989010989, + "eval_f1": 0.9890246085529585, + "eval_loss": 0.0438910573720932, + "eval_precision": 0.989050109460552, + "eval_recall": 0.989010989010989, + "eval_runtime": 5.937, + "eval_samples_per_second": 229.913, + "eval_steps_per_second": 28.802, "step": 426 } ], "logging_steps": 500, - "max_steps": 510, + "max_steps": 850, "num_input_tokens_seen": 0, - "num_train_epochs": 6, + "num_train_epochs": 10, "save_steps": 500, "stateful_callbacks": { "EarlyStoppingCallback": { diff --git a/checkpoint-426/training_args.bin b/checkpoint-426/training_args.bin index bff11f0a04d7786ba1f282509a88be97e3ad2b24..5d762b1cb8eeee08ab8703debb3a686abe8615eb 100644 --- a/checkpoint-426/training_args.bin +++ b/checkpoint-426/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a0f29e363429f3041b65000237638d975c16df70ba592fd3c2ce610392338bd3 +oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b size 5240 diff --git a/checkpoint-512/config.json b/checkpoint-512/config.json index a8097f6a414b056b727b26aa15ffac67f0897e4b..23cd00c8f7806f9961fb35e24a24f5d256693560 100644 --- a/checkpoint-512/config.json +++ b/checkpoint-512/config.json @@ -55,10 +55,6 @@ }, "initializer_range": 0.02, "intermediate_size": 3072, - "label2id": { - "crying": 0, - "no_crying": 1 - }, "layer_norm_eps": 1e-05, "layerdrop": 0.0, "mask_feature_length": 10, diff --git a/checkpoint-512/model.safetensors b/checkpoint-512/model.safetensors index ffc5085730344dc748586075c23f9e3dedac3fd4..2cd2c0c49bf6bf257a0bcff41f417f55b69399a6 100644 --- a/checkpoint-512/model.safetensors +++ b/checkpoint-512/model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:35b0d90358beea477341c41eb5ba7259fabcc0922d7900d91362f0fbaf06bab2 +oid sha256:35f0fba66e2bc44178994b63877f32d5ef3660e920cd130dae9ccbf8e054d15a size 94763496 diff --git a/checkpoint-512/optimizer.pt b/checkpoint-512/optimizer.pt index 609b48ac794913beb8177765b8b79fb756c4e60b..2065eee72c21c59ff9e28cff440af6e49b3acbef 100644 --- a/checkpoint-512/optimizer.pt +++ b/checkpoint-512/optimizer.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:648b988b59d53cdfb9a307e0c1ecb64a428672a7b441f4145e8d3d009ae2cfbe +oid sha256:32489c4cc27d23701cd78e51f1daf46563d47112b4e3520ad9568800f0b86fb3 size 189552570 diff --git a/checkpoint-512/scheduler.pt b/checkpoint-512/scheduler.pt index 2385095d97e6dacd421cedc28fca7f7c0fcb622a..de194de68892e68443bc6755bc456b7851254a2a 100644 --- a/checkpoint-512/scheduler.pt +++ b/checkpoint-512/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f1f22cb39573891adcd854d571d182ed521927c0644cb49b42c5a9a0f0635791 +oid sha256:0643374a18b5da11030bd13ba87a30fd86ee77d7702b1fa1d0aee2f444563b7c size 1064 diff --git a/checkpoint-512/trainer_state.json b/checkpoint-512/trainer_state.json index 5352cc318e50edd99bbc1e4d722dd64c23eb12a5..cec88267637b2d56f1e27682544c2e83c6457846 100644 --- a/checkpoint-512/trainer_state.json +++ b/checkpoint-512/trainer_state.json @@ -1,6 +1,6 @@ { - "best_metric": 0.9897435897435898, - "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341", + "best_metric": 0.9904761904761905, + "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-512", "epoch": 5.997071742313324, "eval_steps": 500, "global_step": 512, @@ -11,80 +11,80 @@ { "epoch": 0.9956076134699854, "eval_accuracy": 0.9538461538461539, - "eval_f1": 0.953235199825453, - "eval_loss": 0.13410410284996033, - "eval_precision": 0.9543176332312968, + "eval_f1": 0.9535883665206972, + "eval_loss": 0.11965569853782654, + "eval_precision": 0.9535470731605858, "eval_recall": 0.9538461538461539, - "eval_runtime": 5.9191, - "eval_samples_per_second": 230.61, - "eval_steps_per_second": 28.89, + "eval_runtime": 5.8661, + "eval_samples_per_second": 232.691, + "eval_steps_per_second": 29.15, "step": 85 }, { "epoch": 1.9912152269399708, - "eval_accuracy": 0.96996336996337, - "eval_f1": 0.970275727358029, - "eval_loss": 0.08308757096529007, - "eval_precision": 0.9720059808561178, - "eval_recall": 0.96996336996337, - "eval_runtime": 5.9321, - "eval_samples_per_second": 230.105, - "eval_steps_per_second": 28.826, + "eval_accuracy": 0.9831501831501831, + "eval_f1": 0.983143153392684, + "eval_loss": 0.060115572065114975, + "eval_precision": 0.9831374404084774, + "eval_recall": 0.9831501831501831, + "eval_runtime": 5.9254, + "eval_samples_per_second": 230.365, + "eval_steps_per_second": 28.859, "step": 170 }, { "epoch": 2.998535871156662, - "eval_accuracy": 0.9846153846153847, - "eval_f1": 0.9845587007434289, - "eval_loss": 0.05695493519306183, - "eval_precision": 0.984652882646444, - "eval_recall": 0.9846153846153847, - "eval_runtime": 5.924, - "eval_samples_per_second": 230.421, - "eval_steps_per_second": 28.866, + "eval_accuracy": 0.9868131868131869, + "eval_f1": 0.9868241092241091, + "eval_loss": 0.05060575157403946, + "eval_precision": 0.9868403029537207, + "eval_recall": 0.9868131868131869, + "eval_runtime": 5.9299, + "eval_samples_per_second": 230.189, + "eval_steps_per_second": 28.837, "step": 256 }, { "epoch": 3.994143484626647, - "eval_accuracy": 0.9897435897435898, - "eval_f1": 0.9897502348272303, - "eval_loss": 0.03400224819779396, - "eval_precision": 0.9897618176566864, - "eval_recall": 0.9897435897435898, - "eval_runtime": 5.9234, - "eval_samples_per_second": 230.441, - "eval_steps_per_second": 28.868, + "eval_accuracy": 0.9860805860805861, + "eval_f1": 0.9861535269385863, + "eval_loss": 0.04610973969101906, + "eval_precision": 0.986445121171901, + "eval_recall": 0.9860805860805861, + "eval_runtime": 5.9428, + "eval_samples_per_second": 229.69, + "eval_steps_per_second": 28.774, "step": 341 }, { "epoch": 4.989751098096632, - "eval_accuracy": 0.9875457875457876, - "eval_f1": 0.9876042969414931, - "eval_loss": 0.04599935933947563, - "eval_precision": 0.9879353582239604, - "eval_recall": 0.9875457875457876, - "eval_runtime": 5.9141, - "eval_samples_per_second": 230.803, - "eval_steps_per_second": 28.914, + "eval_accuracy": 0.989010989010989, + "eval_f1": 0.9890246085529585, + "eval_loss": 0.0438910573720932, + "eval_precision": 0.989050109460552, + "eval_recall": 0.989010989010989, + "eval_runtime": 5.937, + "eval_samples_per_second": 229.913, + "eval_steps_per_second": 28.802, "step": 426 }, { "epoch": 5.856515373352855, - "grad_norm": 0.020362911745905876, - "learning_rate": 1.819507083000514e-05, - "loss": 0.0707, + "grad_norm": 0.08060992509126663, + "learning_rate": 1.0917042498003083e-05, + "loss": 0.0779, "step": 500 }, { "epoch": 5.997071742313324, - "eval_accuracy": 0.9897435897435898, - "eval_f1": 0.9897761336599745, - "eval_loss": 0.04312068223953247, - "eval_precision": 0.9899308989239506, - "eval_recall": 0.9897435897435898, - "eval_runtime": 5.5776, - "eval_samples_per_second": 244.727, - "eval_steps_per_second": 30.658, + "eval_accuracy": 0.9904761904761905, + "eval_f1": 0.9904879940792306, + "eval_loss": 0.0396205335855484, + "eval_precision": 0.9905117057078526, + "eval_recall": 0.9904761904761905, + "eval_runtime": 5.9047, + "eval_samples_per_second": 231.172, + "eval_steps_per_second": 28.96, "step": 512 } ], diff --git a/checkpoint-512/training_args.bin b/checkpoint-512/training_args.bin index 317a4a3be78b110b93637f697893ca201288d8b5..5d762b1cb8eeee08ab8703debb3a686abe8615eb 100644 --- a/checkpoint-512/training_args.bin +++ b/checkpoint-512/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:831297954221509dc3f32e8eaf01789c3f660cf430e186799d52e58ec3b5b334 +oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b size 5240 diff --git a/checkpoint-597/config.json b/checkpoint-597/config.json index a8097f6a414b056b727b26aa15ffac67f0897e4b..23cd00c8f7806f9961fb35e24a24f5d256693560 100644 --- a/checkpoint-597/config.json +++ b/checkpoint-597/config.json @@ -55,10 +55,6 @@ }, "initializer_range": 0.02, "intermediate_size": 3072, - "label2id": { - "crying": 0, - "no_crying": 1 - }, "layer_norm_eps": 1e-05, "layerdrop": 0.0, "mask_feature_length": 10, diff --git a/checkpoint-597/model.safetensors b/checkpoint-597/model.safetensors index 81c855a1983f1d26680522236cc808d8c71f4582..e8250db40335ef01374cc2551da82b034b606100 100644 --- a/checkpoint-597/model.safetensors +++ b/checkpoint-597/model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c617973600d573c483f588a59837c6d45814ca8e16c64575f5523b65246f0c5e +oid sha256:3fefc9fc9e0c6f521d52f6944550be09ad08cf2a406465b2bad96d43e8e656a9 size 94763496 diff --git a/checkpoint-597/optimizer.pt b/checkpoint-597/optimizer.pt index 3f237baa37f8e5624d3572326b286dd953424681..3565d64748269cfc78487e0d67ba82c7232de423 100644 --- a/checkpoint-597/optimizer.pt +++ b/checkpoint-597/optimizer.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:86268f89454cc35e41155e346d8e2ca8d5a9b6f579d1fef2bbfc8b823eace3b9 +oid sha256:de0a5be77c65d20eadb1a24d44af2c728f76e6c9b01b584c11efa9dac4bab929 size 189552570 diff --git a/checkpoint-597/scheduler.pt b/checkpoint-597/scheduler.pt index cc92241b39bfb840d796fe1c25231b6277559b05..ac6539dc565deadbfc22c08a347e7afaf5b998f5 100644 --- a/checkpoint-597/scheduler.pt +++ b/checkpoint-597/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3c216d743853a404a50b6a598e3c4bf36fa1dc8935b24320ebe609a9c5c9b437 +oid sha256:65e5b7798f882f09e50f351045d72a3f8133a68153dae42b3d7541432cd2e9e0 size 1064 diff --git a/checkpoint-597/trainer_state.json b/checkpoint-597/trainer_state.json index 4acea211177ab58598a65c2108d5494cb0af0946..3302504f5e75a2ff20311a356ac642889cb4d06b 100644 --- a/checkpoint-597/trainer_state.json +++ b/checkpoint-597/trainer_state.json @@ -1,6 +1,6 @@ { - "best_metric": 0.9897435897435898, - "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-341", + "best_metric": 0.991941391941392, + "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-597", "epoch": 6.992679355783309, "eval_steps": 500, "global_step": 597, @@ -11,92 +11,92 @@ { "epoch": 0.9956076134699854, "eval_accuracy": 0.9538461538461539, - "eval_f1": 0.953235199825453, - "eval_loss": 0.13410410284996033, - "eval_precision": 0.9543176332312968, + "eval_f1": 0.9535883665206972, + "eval_loss": 0.11965569853782654, + "eval_precision": 0.9535470731605858, "eval_recall": 0.9538461538461539, - "eval_runtime": 5.9191, - "eval_samples_per_second": 230.61, - "eval_steps_per_second": 28.89, + "eval_runtime": 5.8661, + "eval_samples_per_second": 232.691, + "eval_steps_per_second": 29.15, "step": 85 }, { "epoch": 1.9912152269399708, - "eval_accuracy": 0.96996336996337, - "eval_f1": 0.970275727358029, - "eval_loss": 0.08308757096529007, - "eval_precision": 0.9720059808561178, - "eval_recall": 0.96996336996337, - "eval_runtime": 5.9321, - "eval_samples_per_second": 230.105, - "eval_steps_per_second": 28.826, + "eval_accuracy": 0.9831501831501831, + "eval_f1": 0.983143153392684, + "eval_loss": 0.060115572065114975, + "eval_precision": 0.9831374404084774, + "eval_recall": 0.9831501831501831, + "eval_runtime": 5.9254, + "eval_samples_per_second": 230.365, + "eval_steps_per_second": 28.859, "step": 170 }, { "epoch": 2.998535871156662, - "eval_accuracy": 0.9846153846153847, - "eval_f1": 0.9845587007434289, - "eval_loss": 0.05695493519306183, - "eval_precision": 0.984652882646444, - "eval_recall": 0.9846153846153847, - "eval_runtime": 5.924, - "eval_samples_per_second": 230.421, - "eval_steps_per_second": 28.866, + "eval_accuracy": 0.9868131868131869, + "eval_f1": 0.9868241092241091, + "eval_loss": 0.05060575157403946, + "eval_precision": 0.9868403029537207, + "eval_recall": 0.9868131868131869, + "eval_runtime": 5.9299, + "eval_samples_per_second": 230.189, + "eval_steps_per_second": 28.837, "step": 256 }, { "epoch": 3.994143484626647, - "eval_accuracy": 0.9897435897435898, - "eval_f1": 0.9897502348272303, - "eval_loss": 0.03400224819779396, - "eval_precision": 0.9897618176566864, - "eval_recall": 0.9897435897435898, - "eval_runtime": 5.9234, - "eval_samples_per_second": 230.441, - "eval_steps_per_second": 28.868, + "eval_accuracy": 0.9860805860805861, + "eval_f1": 0.9861535269385863, + "eval_loss": 0.04610973969101906, + "eval_precision": 0.986445121171901, + "eval_recall": 0.9860805860805861, + "eval_runtime": 5.9428, + "eval_samples_per_second": 229.69, + "eval_steps_per_second": 28.774, "step": 341 }, { "epoch": 4.989751098096632, - "eval_accuracy": 0.9875457875457876, - "eval_f1": 0.9876042969414931, - "eval_loss": 0.04599935933947563, - "eval_precision": 0.9879353582239604, - "eval_recall": 0.9875457875457876, - "eval_runtime": 5.9141, - "eval_samples_per_second": 230.803, - "eval_steps_per_second": 28.914, + "eval_accuracy": 0.989010989010989, + "eval_f1": 0.9890246085529585, + "eval_loss": 0.0438910573720932, + "eval_precision": 0.989050109460552, + "eval_recall": 0.989010989010989, + "eval_runtime": 5.937, + "eval_samples_per_second": 229.913, + "eval_steps_per_second": 28.802, "step": 426 }, { "epoch": 5.856515373352855, - "grad_norm": 0.020362911745905876, - "learning_rate": 1.819507083000514e-05, - "loss": 0.0707, + "grad_norm": 0.08060992509126663, + "learning_rate": 1.0917042498003083e-05, + "loss": 0.0779, "step": 500 }, { "epoch": 5.997071742313324, - "eval_accuracy": 0.9897435897435898, - "eval_f1": 0.9897761336599745, - "eval_loss": 0.04312068223953247, - "eval_precision": 0.9899308989239506, - "eval_recall": 0.9897435897435898, - "eval_runtime": 5.5776, - "eval_samples_per_second": 244.727, - "eval_steps_per_second": 30.658, + "eval_accuracy": 0.9904761904761905, + "eval_f1": 0.9904879940792306, + "eval_loss": 0.0396205335855484, + "eval_precision": 0.9905117057078526, + "eval_recall": 0.9904761904761905, + "eval_runtime": 5.9047, + "eval_samples_per_second": 231.172, + "eval_steps_per_second": 28.96, "step": 512 }, { "epoch": 6.992679355783309, - "eval_accuracy": 0.9882783882783883, - "eval_f1": 0.9882934987415589, - "eval_loss": 0.035927049815654755, - "eval_precision": 0.9883282714000319, - "eval_recall": 0.9882783882783883, - "eval_runtime": 5.5806, - "eval_samples_per_second": 244.596, - "eval_steps_per_second": 30.642, + "eval_accuracy": 0.991941391941392, + "eval_f1": 0.9919447375447602, + "eval_loss": 0.035047151148319244, + "eval_precision": 0.9919494135494136, + "eval_recall": 0.991941391941392, + "eval_runtime": 6.0502, + "eval_samples_per_second": 225.612, + "eval_steps_per_second": 28.264, "step": 597 } ], @@ -121,7 +121,7 @@ "should_evaluate": false, "should_log": false, "should_save": true, - "should_training_stop": true + "should_training_stop": false }, "attributes": {} } diff --git a/checkpoint-597/training_args.bin b/checkpoint-597/training_args.bin index 317a4a3be78b110b93637f697893ca201288d8b5..5d762b1cb8eeee08ab8703debb3a686abe8615eb 100644 --- a/checkpoint-597/training_args.bin +++ b/checkpoint-597/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:831297954221509dc3f32e8eaf01789c3f660cf430e186799d52e58ec3b5b334 +oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b size 5240 diff --git a/checkpoint-683/config.json b/checkpoint-683/config.json index 4550a22abfa803293b5dc6b2633d0201ac2ff44d..23cd00c8f7806f9961fb35e24a24f5d256693560 100644 --- a/checkpoint-683/config.json +++ b/checkpoint-683/config.json @@ -45,6 +45,7 @@ "feat_proj_dropout": 0.0, "feat_proj_layer_norm": false, "final_dropout": 0.0, + "finetuning_task": "audio-classification", "hidden_act": "gelu", "hidden_dropout": 0.1, "hidden_size": 768, @@ -54,10 +55,6 @@ }, "initializer_range": 0.02, "intermediate_size": 3072, - "label2id": { - "crying": "0", - "no_crying": "1" - }, "layer_norm_eps": 1e-05, "layerdrop": 0.0, "mask_feature_length": 10, diff --git a/checkpoint-683/model.safetensors b/checkpoint-683/model.safetensors index 76ff8f4962f83077487c86d992a40f3b5c77216d..95fc634bb7b4d975d5c4ae420e9a73c72dda3e27 100644 --- a/checkpoint-683/model.safetensors +++ b/checkpoint-683/model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:52ec3a122dd4e1c3f5b4ae3dc2e2256f512a563d42eb82426ac3f8094e0c4490 +oid sha256:47eb6b3cfe6fa933d4d9bda0995a1e235c1d9ec1d2481708bed5a4149e8262a4 size 94763496 diff --git a/checkpoint-683/optimizer.pt b/checkpoint-683/optimizer.pt index c5e5c8cbd55e730746df23bff2f60d84585bf836..ceea371366afe5bd81e61c0f5fed75f8744ea999 100644 --- a/checkpoint-683/optimizer.pt +++ b/checkpoint-683/optimizer.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b6591188ba0c4025fcbff86219e7c2755b85671c8b4d10202fa03cef2f8831a1 +oid sha256:ccd75da0e8ea0bf33fb98b23e1d8b9fc9f33d7c31a91837683d49c15ae856034 size 189552570 diff --git a/checkpoint-683/scheduler.pt b/checkpoint-683/scheduler.pt index 4d01af1fdde6c62ebd7697d31558faa49bd9d0bc..7eb9416c890ff10681aeb947132d9fcdc637e1a8 100644 --- a/checkpoint-683/scheduler.pt +++ b/checkpoint-683/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b712ee88015e952bb23b1f5495f272411d9c19a17334b27df15dc1ebbac98f35 +oid sha256:bde01021f76a64b9ec7866fcc536e72a45008d7566739a02f03c4c895a14c72c size 1064 diff --git a/checkpoint-683/trainer_state.json b/checkpoint-683/trainer_state.json index 2c4e628f04f9eb93a9af83739635e132ce3979d3..7e0a0a13ceefaf93cd74376583b275bf94680454 100644 --- a/checkpoint-683/trainer_state.json +++ b/checkpoint-683/trainer_state.json @@ -1,6 +1,6 @@ { - "best_metric": 0.9926739926739927, - "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-512", + "best_metric": 0.991941391941392, + "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-597", "epoch": 8.0, "eval_steps": 500, "global_step": 683, @@ -10,81 +10,105 @@ "log_history": [ { "epoch": 0.9956076134699854, - "eval_accuracy": 0.9772893772893773, - "eval_loss": 0.06922276318073273, - "eval_runtime": 15.5305, - "eval_samples_per_second": 87.892, - "eval_steps_per_second": 11.011, + "eval_accuracy": 0.9538461538461539, + "eval_f1": 0.9535883665206972, + "eval_loss": 0.11965569853782654, + "eval_precision": 0.9535470731605858, + "eval_recall": 0.9538461538461539, + "eval_runtime": 5.8661, + "eval_samples_per_second": 232.691, + "eval_steps_per_second": 29.15, "step": 85 }, { "epoch": 1.9912152269399708, - "eval_accuracy": 0.9860805860805861, - "eval_loss": 0.04661192744970322, - "eval_runtime": 15.4605, - "eval_samples_per_second": 88.29, - "eval_steps_per_second": 11.06, + "eval_accuracy": 0.9831501831501831, + "eval_f1": 0.983143153392684, + "eval_loss": 0.060115572065114975, + "eval_precision": 0.9831374404084774, + "eval_recall": 0.9831501831501831, + "eval_runtime": 5.9254, + "eval_samples_per_second": 230.365, + "eval_steps_per_second": 28.859, "step": 170 }, { "epoch": 2.998535871156662, - "eval_accuracy": 0.9853479853479854, - "eval_loss": 0.04894961416721344, - "eval_runtime": 15.5622, - "eval_samples_per_second": 87.713, - "eval_steps_per_second": 10.988, + "eval_accuracy": 0.9868131868131869, + "eval_f1": 0.9868241092241091, + "eval_loss": 0.05060575157403946, + "eval_precision": 0.9868403029537207, + "eval_recall": 0.9868131868131869, + "eval_runtime": 5.9299, + "eval_samples_per_second": 230.189, + "eval_steps_per_second": 28.837, "step": 256 }, { "epoch": 3.994143484626647, - "eval_accuracy": 0.9897435897435898, - "eval_loss": 0.04228556528687477, - "eval_runtime": 15.6217, - "eval_samples_per_second": 87.378, - "eval_steps_per_second": 10.946, + "eval_accuracy": 0.9860805860805861, + "eval_f1": 0.9861535269385863, + "eval_loss": 0.04610973969101906, + "eval_precision": 0.986445121171901, + "eval_recall": 0.9860805860805861, + "eval_runtime": 5.9428, + "eval_samples_per_second": 229.69, + "eval_steps_per_second": 28.774, "step": 341 }, { "epoch": 4.989751098096632, - "eval_accuracy": 0.991941391941392, - "eval_loss": 0.044283464550971985, - "eval_runtime": 15.0667, - "eval_samples_per_second": 90.597, - "eval_steps_per_second": 11.35, + "eval_accuracy": 0.989010989010989, + "eval_f1": 0.9890246085529585, + "eval_loss": 0.0438910573720932, + "eval_precision": 0.989050109460552, + "eval_recall": 0.989010989010989, + "eval_runtime": 5.937, + "eval_samples_per_second": 229.913, + "eval_steps_per_second": 28.802, "step": 426 }, { "epoch": 5.856515373352855, - "grad_norm": 0.008579956367611885, - "learning_rate": 3.639014166001028e-05, - "loss": 0.055, + "grad_norm": 0.08060992509126663, + "learning_rate": 1.0917042498003083e-05, + "loss": 0.0779, "step": 500 }, { "epoch": 5.997071742313324, - "eval_accuracy": 0.9926739926739927, - "eval_loss": 0.04338795691728592, - "eval_runtime": 14.898, - "eval_samples_per_second": 91.623, - "eval_steps_per_second": 11.478, + "eval_accuracy": 0.9904761904761905, + "eval_f1": 0.9904879940792306, + "eval_loss": 0.0396205335855484, + "eval_precision": 0.9905117057078526, + "eval_recall": 0.9904761904761905, + "eval_runtime": 5.9047, + "eval_samples_per_second": 231.172, + "eval_steps_per_second": 28.96, "step": 512 }, { "epoch": 6.992679355783309, - "eval_accuracy": 0.9926739926739927, - "eval_loss": 0.04399614781141281, - "eval_runtime": 15.2426, - "eval_samples_per_second": 89.552, - "eval_steps_per_second": 11.219, + "eval_accuracy": 0.991941391941392, + "eval_f1": 0.9919447375447602, + "eval_loss": 0.035047151148319244, + "eval_precision": 0.9919494135494136, + "eval_recall": 0.991941391941392, + "eval_runtime": 6.0502, + "eval_samples_per_second": 225.612, + "eval_steps_per_second": 28.264, "step": 597 }, { "epoch": 8.0, - "eval_accuracy": 0.9926739926739927, - "eval_loss": 0.045955102890729904, - "eval_runtime": 15.1372, - "eval_samples_per_second": 90.175, - "eval_steps_per_second": 11.297, + "eval_accuracy": 0.9912087912087912, + "eval_f1": 0.9912160728160728, + "eval_loss": 0.03350323066115379, + "eval_precision": 0.9912286614059304, + "eval_recall": 0.9912087912087912, + "eval_runtime": 5.79, + "eval_samples_per_second": 235.751, + "eval_steps_per_second": 29.534, "step": 683 } ], diff --git a/checkpoint-683/training_args.bin b/checkpoint-683/training_args.bin index ba89ffbbb5f921e8486f25ee9c3f0a763e7c1271..5d762b1cb8eeee08ab8703debb3a686abe8615eb 100644 --- a/checkpoint-683/training_args.bin +++ b/checkpoint-683/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:84d763bc52a548d7900e672478766167dea5015bedfc4ad077e5cffda9256cc8 +oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b size 5240 diff --git a/checkpoint-768/config.json b/checkpoint-768/config.json index 4550a22abfa803293b5dc6b2633d0201ac2ff44d..23cd00c8f7806f9961fb35e24a24f5d256693560 100644 --- a/checkpoint-768/config.json +++ b/checkpoint-768/config.json @@ -45,6 +45,7 @@ "feat_proj_dropout": 0.0, "feat_proj_layer_norm": false, "final_dropout": 0.0, + "finetuning_task": "audio-classification", "hidden_act": "gelu", "hidden_dropout": 0.1, "hidden_size": 768, @@ -54,10 +55,6 @@ }, "initializer_range": 0.02, "intermediate_size": 3072, - "label2id": { - "crying": "0", - "no_crying": "1" - }, "layer_norm_eps": 1e-05, "layerdrop": 0.0, "mask_feature_length": 10, diff --git a/checkpoint-768/model.safetensors b/checkpoint-768/model.safetensors index b2519b9c8a86a0f16a98d310dd372f04edd055b7..a9fe76eac0515f91351cc953bf05dfdb8ae8fb24 100644 --- a/checkpoint-768/model.safetensors +++ b/checkpoint-768/model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0e5671ffc6960b29ad80f820b4317ec548ff0deefca2464ad359c421c360e64f +oid sha256:589720455553dad3b547e7fc5aac19151dbefadb26d39a6a04c708e344cfd310 size 94763496 diff --git a/checkpoint-768/optimizer.pt b/checkpoint-768/optimizer.pt index b033c12db74cd598ec9bf76fb199a48a614fbda2..2a4af901cf891c719064b83475447bea2a5d696b 100644 --- a/checkpoint-768/optimizer.pt +++ b/checkpoint-768/optimizer.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7516d91f602bba3efff25344b03b35e85d41b8ce4db2a56619d6dcf6cd2cc2df +oid sha256:b863d95ad20867c4606dfd4b07ae1866e1bfbd283086e4449d924ccf79d9d2dc size 189552570 diff --git a/checkpoint-768/scheduler.pt b/checkpoint-768/scheduler.pt index 9bde14cf908ff3342ecb27c3673a3de161412e6e..2edb81480f1cbcf6da1f2d65c03bdf83d4200e06 100644 --- a/checkpoint-768/scheduler.pt +++ b/checkpoint-768/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:46a9a21b9ea0c395732aadaa7b885d80eaa4d81c9d9d1eea099d6180e939da87 +oid sha256:acb83cb237d82342af5936197af5c426903999a84d7161b385fa3b80c0070365 size 1064 diff --git a/checkpoint-768/trainer_state.json b/checkpoint-768/trainer_state.json index cb85d0fc6daf72dd3976edf5ef9f792179416b10..265a05dcef5383b63046a81e28a44f894ce4ea49 100644 --- a/checkpoint-768/trainer_state.json +++ b/checkpoint-768/trainer_state.json @@ -1,6 +1,6 @@ { - "best_metric": 0.9926739926739927, - "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-512", + "best_metric": 0.991941391941392, + "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-597", "epoch": 8.995607613469986, "eval_steps": 500, "global_step": 768, @@ -10,90 +10,117 @@ "log_history": [ { "epoch": 0.9956076134699854, - "eval_accuracy": 0.9772893772893773, - "eval_loss": 0.06922276318073273, - "eval_runtime": 15.5305, - "eval_samples_per_second": 87.892, - "eval_steps_per_second": 11.011, + "eval_accuracy": 0.9538461538461539, + "eval_f1": 0.9535883665206972, + "eval_loss": 0.11965569853782654, + "eval_precision": 0.9535470731605858, + "eval_recall": 0.9538461538461539, + "eval_runtime": 5.8661, + "eval_samples_per_second": 232.691, + "eval_steps_per_second": 29.15, "step": 85 }, { "epoch": 1.9912152269399708, - "eval_accuracy": 0.9860805860805861, - "eval_loss": 0.04661192744970322, - "eval_runtime": 15.4605, - "eval_samples_per_second": 88.29, - "eval_steps_per_second": 11.06, + "eval_accuracy": 0.9831501831501831, + "eval_f1": 0.983143153392684, + "eval_loss": 0.060115572065114975, + "eval_precision": 0.9831374404084774, + "eval_recall": 0.9831501831501831, + "eval_runtime": 5.9254, + "eval_samples_per_second": 230.365, + "eval_steps_per_second": 28.859, "step": 170 }, { "epoch": 2.998535871156662, - "eval_accuracy": 0.9853479853479854, - "eval_loss": 0.04894961416721344, - "eval_runtime": 15.5622, - "eval_samples_per_second": 87.713, - "eval_steps_per_second": 10.988, + "eval_accuracy": 0.9868131868131869, + "eval_f1": 0.9868241092241091, + "eval_loss": 0.05060575157403946, + "eval_precision": 0.9868403029537207, + "eval_recall": 0.9868131868131869, + "eval_runtime": 5.9299, + "eval_samples_per_second": 230.189, + "eval_steps_per_second": 28.837, "step": 256 }, { "epoch": 3.994143484626647, - "eval_accuracy": 0.9897435897435898, - "eval_loss": 0.04228556528687477, - "eval_runtime": 15.6217, - "eval_samples_per_second": 87.378, - "eval_steps_per_second": 10.946, + "eval_accuracy": 0.9860805860805861, + "eval_f1": 0.9861535269385863, + "eval_loss": 0.04610973969101906, + "eval_precision": 0.986445121171901, + "eval_recall": 0.9860805860805861, + "eval_runtime": 5.9428, + "eval_samples_per_second": 229.69, + "eval_steps_per_second": 28.774, "step": 341 }, { "epoch": 4.989751098096632, - "eval_accuracy": 0.991941391941392, - "eval_loss": 0.044283464550971985, - "eval_runtime": 15.0667, - "eval_samples_per_second": 90.597, - "eval_steps_per_second": 11.35, + "eval_accuracy": 0.989010989010989, + "eval_f1": 0.9890246085529585, + "eval_loss": 0.0438910573720932, + "eval_precision": 0.989050109460552, + "eval_recall": 0.989010989010989, + "eval_runtime": 5.937, + "eval_samples_per_second": 229.913, + "eval_steps_per_second": 28.802, "step": 426 }, { "epoch": 5.856515373352855, - "grad_norm": 0.008579956367611885, - "learning_rate": 3.639014166001028e-05, - "loss": 0.055, + "grad_norm": 0.08060992509126663, + "learning_rate": 1.0917042498003083e-05, + "loss": 0.0779, "step": 500 }, { "epoch": 5.997071742313324, - "eval_accuracy": 0.9926739926739927, - "eval_loss": 0.04338795691728592, - "eval_runtime": 14.898, - "eval_samples_per_second": 91.623, - "eval_steps_per_second": 11.478, + "eval_accuracy": 0.9904761904761905, + "eval_f1": 0.9904879940792306, + "eval_loss": 0.0396205335855484, + "eval_precision": 0.9905117057078526, + "eval_recall": 0.9904761904761905, + "eval_runtime": 5.9047, + "eval_samples_per_second": 231.172, + "eval_steps_per_second": 28.96, "step": 512 }, { "epoch": 6.992679355783309, - "eval_accuracy": 0.9926739926739927, - "eval_loss": 0.04399614781141281, - "eval_runtime": 15.2426, - "eval_samples_per_second": 89.552, - "eval_steps_per_second": 11.219, + "eval_accuracy": 0.991941391941392, + "eval_f1": 0.9919447375447602, + "eval_loss": 0.035047151148319244, + "eval_precision": 0.9919494135494136, + "eval_recall": 0.991941391941392, + "eval_runtime": 6.0502, + "eval_samples_per_second": 225.612, + "eval_steps_per_second": 28.264, "step": 597 }, { "epoch": 8.0, - "eval_accuracy": 0.9926739926739927, - "eval_loss": 0.045955102890729904, - "eval_runtime": 15.1372, - "eval_samples_per_second": 90.175, - "eval_steps_per_second": 11.297, + "eval_accuracy": 0.9912087912087912, + "eval_f1": 0.9912160728160728, + "eval_loss": 0.03350323066115379, + "eval_precision": 0.9912286614059304, + "eval_recall": 0.9912087912087912, + "eval_runtime": 5.79, + "eval_samples_per_second": 235.751, + "eval_steps_per_second": 29.534, "step": 683 }, { "epoch": 8.995607613469986, - "eval_accuracy": 0.9926739926739927, - "eval_loss": 0.04587433487176895, - "eval_runtime": 15.0807, - "eval_samples_per_second": 90.513, - "eval_steps_per_second": 11.339, + "eval_accuracy": 0.9912087912087912, + "eval_f1": 0.9912160728160728, + "eval_loss": 0.03368490934371948, + "eval_precision": 0.9912286614059304, + "eval_recall": 0.9912087912087912, + "eval_runtime": 5.7784, + "eval_samples_per_second": 236.224, + "eval_steps_per_second": 29.593, "step": 768 } ], @@ -118,7 +145,7 @@ "should_evaluate": false, "should_log": false, "should_save": true, - "should_training_stop": true + "should_training_stop": false }, "attributes": {} } diff --git a/checkpoint-768/training_args.bin b/checkpoint-768/training_args.bin index ba89ffbbb5f921e8486f25ee9c3f0a763e7c1271..5d762b1cb8eeee08ab8703debb3a686abe8615eb 100644 --- a/checkpoint-768/training_args.bin +++ b/checkpoint-768/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:84d763bc52a548d7900e672478766167dea5015bedfc4ad077e5cffda9256cc8 +oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b size 5240 diff --git a/checkpoint-85/config.json b/checkpoint-85/config.json index a8097f6a414b056b727b26aa15ffac67f0897e4b..23cd00c8f7806f9961fb35e24a24f5d256693560 100644 --- a/checkpoint-85/config.json +++ b/checkpoint-85/config.json @@ -55,10 +55,6 @@ }, "initializer_range": 0.02, "intermediate_size": 3072, - "label2id": { - "crying": 0, - "no_crying": 1 - }, "layer_norm_eps": 1e-05, "layerdrop": 0.0, "mask_feature_length": 10, diff --git a/checkpoint-85/model.safetensors b/checkpoint-85/model.safetensors index 5a5eb58204b64e5f354c72302b0e3b9121863ea5..204cc892563ddf46d3c2771026ac8c9c508c326f 100644 --- a/checkpoint-85/model.safetensors +++ b/checkpoint-85/model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:667f991dfd621ded0f030ae62bee9e55c4e297c107c7ab609989f56ba7da4287 +oid sha256:23b104b8e2a8ab0ab3becb4267c1082a46bc58158acb8a209710fb47609d3b4f size 94763496 diff --git a/checkpoint-85/optimizer.pt b/checkpoint-85/optimizer.pt index 1276ecc3f69cf6e7e5f96287b4063d3c57a973be..26164efff4d635ac81f8913f65485c95122eff3c 100644 --- a/checkpoint-85/optimizer.pt +++ b/checkpoint-85/optimizer.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2b7d98f10852c7c698f2667e9c22700b698aaca9caf2c11ddb129f3cb85eeb89 +oid sha256:7714c072df6c6ff0ac19030de12768b584908ae115f48402f0620bb30e33ac6a size 189552570 diff --git a/checkpoint-85/scheduler.pt b/checkpoint-85/scheduler.pt index 27c0f660ce4033e628f1a38f7cdeb037930a3405..0f9c6bfe27d4ace1e3c5af7dc8e8a2d3e97c8bce 100644 --- a/checkpoint-85/scheduler.pt +++ b/checkpoint-85/scheduler.pt @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:793aa52bb071f6372012884f8d464f730e19ee122d0faba28c109d42d303933f +oid sha256:4a9512c594f58b73a89140b2cabaa00dc63beddab8e8c45433318c9396e38e96 size 1064 diff --git a/checkpoint-85/trainer_state.json b/checkpoint-85/trainer_state.json index e113a404e0223bc125ab18b5d188bdaba9ca5227..1652e5f5a5b9c95ca72e601eff21813d1395c9cd 100644 --- a/checkpoint-85/trainer_state.json +++ b/checkpoint-85/trainer_state.json @@ -1,6 +1,6 @@ { - "best_metric": 0.9545787545787546, - "best_model_checkpoint": "distilhubert-finetuned-cry-detector/checkpoint-85", + "best_metric": 0.9538461538461539, + "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-85", "epoch": 0.9956076134699854, "eval_steps": 500, "global_step": 85, @@ -10,21 +10,21 @@ "log_history": [ { "epoch": 0.9956076134699854, - "eval_accuracy": 0.9545787545787546, - "eval_f1": 0.9543924849872077, - "eval_loss": 0.13782845437526703, - "eval_precision": 0.9543323172404159, - "eval_recall": 0.9545787545787546, - "eval_runtime": 6.1437, - "eval_samples_per_second": 222.18, - "eval_steps_per_second": 27.834, + "eval_accuracy": 0.9538461538461539, + "eval_f1": 0.9535883665206972, + "eval_loss": 0.11965569853782654, + "eval_precision": 0.9535470731605858, + "eval_recall": 0.9538461538461539, + "eval_runtime": 5.8661, + "eval_samples_per_second": 232.691, + "eval_steps_per_second": 29.15, "step": 85 } ], "logging_steps": 500, - "max_steps": 340, + "max_steps": 850, "num_input_tokens_seen": 0, - "num_train_epochs": 4, + "num_train_epochs": 10, "save_steps": 500, "stateful_callbacks": { "EarlyStoppingCallback": { diff --git a/checkpoint-85/training_args.bin b/checkpoint-85/training_args.bin index 7bfc5bd20dcd0c05fb8658eb0e6ae87fef5fc784..5d762b1cb8eeee08ab8703debb3a686abe8615eb 100644 --- a/checkpoint-85/training_args.bin +++ b/checkpoint-85/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a7bd8e997c05f23ae464180f8e5e9f881e9c68322e4fcd3f855e79e2e5d54fbb +oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b size 5240 diff --git a/checkpoint-850/config.json b/checkpoint-850/config.json new file mode 100644 index 0000000000000000000000000000000000000000..23cd00c8f7806f9961fb35e24a24f5d256693560 --- /dev/null +++ b/checkpoint-850/config.json @@ -0,0 +1,77 @@ +{ + "_name_or_path": "ntu-spml/distilhubert", + "activation_dropout": 0.1, + "apply_spec_augment": false, + "architectures": [ + "HubertForSequenceClassification" + ], + "attention_dropout": 0.1, + "bos_token_id": 1, + "classifier_proj_size": 256, + "conv_bias": false, + "conv_dim": [ + 512, + 512, + 512, + 512, + 512, + 512, + 512 + ], + "conv_kernel": [ + 10, + 3, + 3, + 3, + 3, + 2, + 2 + ], + "conv_stride": [ + 5, + 2, + 2, + 2, + 2, + 2, + 2 + ], + "ctc_loss_reduction": "sum", + "ctc_zero_infinity": false, + "do_stable_layer_norm": false, + "eos_token_id": 2, + "feat_extract_activation": "gelu", + "feat_extract_norm": "group", + "feat_proj_dropout": 0.0, + "feat_proj_layer_norm": false, + "final_dropout": 0.0, + "finetuning_task": "audio-classification", + "hidden_act": "gelu", + "hidden_dropout": 0.1, + "hidden_size": 768, + "id2label": { + "0": "crying", + "1": "no_crying" + }, + "initializer_range": 0.02, + "intermediate_size": 3072, + "layer_norm_eps": 1e-05, + "layerdrop": 0.0, + "mask_feature_length": 10, + "mask_feature_min_masks": 0, + "mask_feature_prob": 0.0, + "mask_time_length": 10, + "mask_time_min_masks": 2, + "mask_time_prob": 0.05, + "model_type": "hubert", + "num_attention_heads": 12, + "num_conv_pos_embedding_groups": 16, + "num_conv_pos_embeddings": 128, + "num_feat_extract_layers": 7, + "num_hidden_layers": 2, + "pad_token_id": 0, + "torch_dtype": "float32", + "transformers_version": "4.44.2", + "use_weighted_layer_sum": false, + "vocab_size": 32 +} diff --git a/checkpoint-850/model.safetensors b/checkpoint-850/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2067c632a46109718398070a886ec86b5eeec61b --- /dev/null +++ b/checkpoint-850/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e1aeb7940df69c378c58475392e88d579506d2aa5b347841cf22ed734af56f6 +size 94763496 diff --git a/checkpoint-850/optimizer.pt b/checkpoint-850/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..81eaffc062ba5f4573e3ac972cc84f560d3066a4 --- /dev/null +++ b/checkpoint-850/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82e0287f6c90921af053bde2cd7c30093c390b1f44677e85333e67097d2fcf96 +size 189552570 diff --git a/checkpoint-850/rng_state.pth b/checkpoint-850/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..6272e5d03b4b7fbc668ab5cc906fe87b7d936dfb --- /dev/null +++ b/checkpoint-850/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8c4cf7220fb2362263b7cc4bddb6085bdf34c006ec7852148c9f91df123bc35 +size 14308 diff --git a/checkpoint-850/scheduler.pt b/checkpoint-850/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcc320930cf16c603072cb69243b17e8dcdbfcd7 --- /dev/null +++ b/checkpoint-850/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1e2f64fbcb1f1581011bf45464f1ecf4abc0a0908ecae18e97d933454491798 +size 1064 diff --git a/checkpoint-850/trainer_state.json b/checkpoint-850/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..e6f8905670b8804bf2e0474b4f745bac932b6e16 --- /dev/null +++ b/checkpoint-850/trainer_state.json @@ -0,0 +1,169 @@ +{ + "best_metric": 0.991941391941392, + "best_model_checkpoint": "A-POR-LOS-8000/distilhubert-finetuned-cry-detector/checkpoint-597", + "epoch": 9.956076134699854, + "eval_steps": 500, + "global_step": 850, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.9956076134699854, + "eval_accuracy": 0.9538461538461539, + "eval_f1": 0.9535883665206972, + "eval_loss": 0.11965569853782654, + "eval_precision": 0.9535470731605858, + "eval_recall": 0.9538461538461539, + "eval_runtime": 5.8661, + "eval_samples_per_second": 232.691, + "eval_steps_per_second": 29.15, + "step": 85 + }, + { + "epoch": 1.9912152269399708, + "eval_accuracy": 0.9831501831501831, + "eval_f1": 0.983143153392684, + "eval_loss": 0.060115572065114975, + "eval_precision": 0.9831374404084774, + "eval_recall": 0.9831501831501831, + "eval_runtime": 5.9254, + "eval_samples_per_second": 230.365, + "eval_steps_per_second": 28.859, + "step": 170 + }, + { + "epoch": 2.998535871156662, + "eval_accuracy": 0.9868131868131869, + "eval_f1": 0.9868241092241091, + "eval_loss": 0.05060575157403946, + "eval_precision": 0.9868403029537207, + "eval_recall": 0.9868131868131869, + "eval_runtime": 5.9299, + "eval_samples_per_second": 230.189, + "eval_steps_per_second": 28.837, + "step": 256 + }, + { + "epoch": 3.994143484626647, + "eval_accuracy": 0.9860805860805861, + "eval_f1": 0.9861535269385863, + "eval_loss": 0.04610973969101906, + "eval_precision": 0.986445121171901, + "eval_recall": 0.9860805860805861, + "eval_runtime": 5.9428, + "eval_samples_per_second": 229.69, + "eval_steps_per_second": 28.774, + "step": 341 + }, + { + "epoch": 4.989751098096632, + "eval_accuracy": 0.989010989010989, + "eval_f1": 0.9890246085529585, + "eval_loss": 0.0438910573720932, + "eval_precision": 0.989050109460552, + "eval_recall": 0.989010989010989, + "eval_runtime": 5.937, + "eval_samples_per_second": 229.913, + "eval_steps_per_second": 28.802, + "step": 426 + }, + { + "epoch": 5.856515373352855, + "grad_norm": 0.08060992509126663, + "learning_rate": 1.0917042498003083e-05, + "loss": 0.0779, + "step": 500 + }, + { + "epoch": 5.997071742313324, + "eval_accuracy": 0.9904761904761905, + "eval_f1": 0.9904879940792306, + "eval_loss": 0.0396205335855484, + "eval_precision": 0.9905117057078526, + "eval_recall": 0.9904761904761905, + "eval_runtime": 5.9047, + "eval_samples_per_second": 231.172, + "eval_steps_per_second": 28.96, + "step": 512 + }, + { + "epoch": 6.992679355783309, + "eval_accuracy": 0.991941391941392, + "eval_f1": 0.9919447375447602, + "eval_loss": 0.035047151148319244, + "eval_precision": 0.9919494135494136, + "eval_recall": 0.991941391941392, + "eval_runtime": 6.0502, + "eval_samples_per_second": 225.612, + "eval_steps_per_second": 28.264, + "step": 597 + }, + { + "epoch": 8.0, + "eval_accuracy": 0.9912087912087912, + "eval_f1": 0.9912160728160728, + "eval_loss": 0.03350323066115379, + "eval_precision": 0.9912286614059304, + "eval_recall": 0.9912087912087912, + "eval_runtime": 5.79, + "eval_samples_per_second": 235.751, + "eval_steps_per_second": 29.534, + "step": 683 + }, + { + "epoch": 8.995607613469986, + "eval_accuracy": 0.9912087912087912, + "eval_f1": 0.9912160728160728, + "eval_loss": 0.03368490934371948, + "eval_precision": 0.9912286614059304, + "eval_recall": 0.9912087912087912, + "eval_runtime": 5.7784, + "eval_samples_per_second": 236.224, + "eval_steps_per_second": 29.593, + "step": 768 + }, + { + "epoch": 9.956076134699854, + "eval_accuracy": 0.9912087912087912, + "eval_f1": 0.9912160728160728, + "eval_loss": 0.03377429023385048, + "eval_precision": 0.9912286614059304, + "eval_recall": 0.9912087912087912, + "eval_runtime": 5.7829, + "eval_samples_per_second": 236.039, + "eval_steps_per_second": 29.57, + "step": 850 + } + ], + "logging_steps": 500, + "max_steps": 850, + "num_input_tokens_seen": 0, + "num_train_epochs": 10, + "save_steps": 500, + "stateful_callbacks": { + "EarlyStoppingCallback": { + "args": { + "early_stopping_patience": 3, + "early_stopping_threshold": 0.0 + }, + "attributes": { + "early_stopping_patience_counter": 0 + } + }, + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 1.23633370170624e+17, + "train_batch_size": 8, + "trial_name": null, + "trial_params": null +} diff --git a/checkpoint-850/training_args.bin b/checkpoint-850/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..5d762b1cb8eeee08ab8703debb3a686abe8615eb --- /dev/null +++ b/checkpoint-850/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b +size 5240 diff --git a/config.json b/config.json index a8097f6a414b056b727b26aa15ffac67f0897e4b..23cd00c8f7806f9961fb35e24a24f5d256693560 100644 --- a/config.json +++ b/config.json @@ -55,10 +55,6 @@ }, "initializer_range": 0.02, "intermediate_size": 3072, - "label2id": { - "crying": 0, - "no_crying": 1 - }, "layer_norm_eps": 1e-05, "layerdrop": 0.0, "mask_feature_length": 10, diff --git a/model.safetensors b/model.safetensors index 64b2a950633e3643aa02355c551366d54855bb4c..e8250db40335ef01374cc2551da82b034b606100 100644 --- a/model.safetensors +++ b/model.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:02108e5b5b6258f37f5cf8b56d34f77aa8b483e760491525d71597e196663a68 +oid sha256:3fefc9fc9e0c6f521d52f6944550be09ad08cf2a406465b2bad96d43e8e656a9 size 94763496 diff --git a/runs/Sep08_20-50-08_ubumarcos/events.out.tfevents.1725821409.ubumarcos b/runs/Sep08_20-50-08_ubumarcos/events.out.tfevents.1725821409.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..0b4995966f63bf08c5b73e426197e2ff174b0af1 --- /dev/null +++ b/runs/Sep08_20-50-08_ubumarcos/events.out.tfevents.1725821409.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5768e1b2ef1f125c46448a0f0312aa445c089532fcbc42786546948ae639471 +size 5851 diff --git a/runs/Sep08_21-13-48_ubumarcos/events.out.tfevents.1725822829.ubumarcos b/runs/Sep08_21-13-48_ubumarcos/events.out.tfevents.1725822829.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..01d75cc636b1eb3af8e125cac453bf06fc058776 --- /dev/null +++ b/runs/Sep08_21-13-48_ubumarcos/events.out.tfevents.1725822829.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c153806ae01a35e7a58505365504750dd5e77f9aaf2443fbd040dbde644bf19 +size 5851 diff --git a/runs/Sep09_13-04-47_ubumarcos/events.out.tfevents.1725879901.ubumarcos b/runs/Sep09_13-04-47_ubumarcos/events.out.tfevents.1725879901.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..f844959e519ebc022dd9c23a1e8793a377a1d6e7 --- /dev/null +++ b/runs/Sep09_13-04-47_ubumarcos/events.out.tfevents.1725879901.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47298f4c14c6e2cf02c4292c80880d69075f152fc6c1a4831ca87fbc76f22b09 +size 5850 diff --git a/runs/Sep09_17-59-20_ubumarcos/events.out.tfevents.1725897561.ubumarcos b/runs/Sep09_17-59-20_ubumarcos/events.out.tfevents.1725897561.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..b639e521477ccdb0e037b49cec1c321e5c8cce31 --- /dev/null +++ b/runs/Sep09_17-59-20_ubumarcos/events.out.tfevents.1725897561.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79c28fcdd52aa17c8decbfa612d39ed8f37b4f19ca76a7dcf5d53daa3c4eec98 +size 5850 diff --git a/runs/Sep09_18-10-13_ubumarcos/events.out.tfevents.1725898215.ubumarcos b/runs/Sep09_18-10-13_ubumarcos/events.out.tfevents.1725898215.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..9d8ec1257a85eb4213cac8d306b26b2b4c310165 --- /dev/null +++ b/runs/Sep09_18-10-13_ubumarcos/events.out.tfevents.1725898215.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1453d6a698695ab52020a0169ee70ccc02d50962abbbcea675588977658416d +size 5850 diff --git a/runs/Sep09_18-10-24_ubumarcos/events.out.tfevents.1725898225.ubumarcos b/runs/Sep09_18-10-24_ubumarcos/events.out.tfevents.1725898225.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..1522708989e6bdee98952dc08a2d0d0790edc44f --- /dev/null +++ b/runs/Sep09_18-10-24_ubumarcos/events.out.tfevents.1725898225.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1ecb0f9cd5fe60d6c3860a19c06287a8807fe4957df9d0ec0a51fd3e854d2cd +size 5850 diff --git a/runs/Sep10_00-34-48_ubumarcos/events.out.tfevents.1725921289.ubumarcos b/runs/Sep10_00-34-48_ubumarcos/events.out.tfevents.1725921289.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..9b8fe97610612391158800755b7ea74251324a54 --- /dev/null +++ b/runs/Sep10_00-34-48_ubumarcos/events.out.tfevents.1725921289.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb66c596890f453c4964d7708c7b6346ad792ecbcbc59053bee44e821fd377f7 +size 5850 diff --git a/runs/Sep10_13-50-43_ubumarcos/events.out.tfevents.1725969044.ubumarcos b/runs/Sep10_13-50-43_ubumarcos/events.out.tfevents.1725969044.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..3d6a625a02cbaef21cb758403738f22aca6ed7aa --- /dev/null +++ b/runs/Sep10_13-50-43_ubumarcos/events.out.tfevents.1725969044.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37edd17201d0bc62c8b8b5344e6e8fc7ddf073ad1fc6bb8a34b5b165226060b9 +size 5850 diff --git a/runs/Sep10_16-47-34_ubumarcos/events.out.tfevents.1725979656.ubumarcos b/runs/Sep10_16-47-34_ubumarcos/events.out.tfevents.1725979656.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..38d1b444fc96edc8968a9056a55c57f6be2a0a75 --- /dev/null +++ b/runs/Sep10_16-47-34_ubumarcos/events.out.tfevents.1725979656.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12599642296c095f6826a911e19bbb8b4439d9ed7f11525268ae7190fb567a6 +size 5895 diff --git a/runs/Sep10_17-01-28_ubumarcos/events.out.tfevents.1725980489.ubumarcos b/runs/Sep10_17-01-28_ubumarcos/events.out.tfevents.1725980489.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..5ae30290aeb4eaaccfa100a3a43b7be002fcefb6 --- /dev/null +++ b/runs/Sep10_17-01-28_ubumarcos/events.out.tfevents.1725980489.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9ffb32a05139f32d56b3853240a7838d94ce8d59df1fecc27d3b9499230209e +size 5838 diff --git a/runs/Sep10_17-06-04_ubumarcos/events.out.tfevents.1725980765.ubumarcos b/runs/Sep10_17-06-04_ubumarcos/events.out.tfevents.1725980765.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..75929a2b35d196a6d11ace3b1b451aef7ad8eec9 --- /dev/null +++ b/runs/Sep10_17-06-04_ubumarcos/events.out.tfevents.1725980765.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3198032e9802108cdfb6f181a0f32cbe5c27d10c4a05b61a78aafdcea4b41f7c +size 5838 diff --git a/runs/Sep10_17-23-08_ubumarcos/events.out.tfevents.1725981789.ubumarcos b/runs/Sep10_17-23-08_ubumarcos/events.out.tfevents.1725981789.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..d6dacf8e50e1f046ad80e1742ba1de5fee33706f --- /dev/null +++ b/runs/Sep10_17-23-08_ubumarcos/events.out.tfevents.1725981789.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e944ae7b013d8d85703888c2a3b9547ab8959391073cef32db20fa86891fbd0 +size 9698 diff --git a/runs/Sep10_17-49-25_ubumarcos/events.out.tfevents.1725983366.ubumarcos b/runs/Sep10_17-49-25_ubumarcos/events.out.tfevents.1725983366.ubumarcos new file mode 100644 index 0000000000000000000000000000000000000000..53d29c9792f96427a24b88c0962a93a82b9fc77e --- /dev/null +++ b/runs/Sep10_17-49-25_ubumarcos/events.out.tfevents.1725983366.ubumarcos @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd035f18cc496265a8e5ffb4695bc4c0b9df3f2924dd33a96bb3b742269cf7f8 +size 11114 diff --git a/training_args.bin b/training_args.bin index 7bfc5bd20dcd0c05fb8658eb0e6ae87fef5fc784..5d762b1cb8eeee08ab8703debb3a686abe8615eb 100644 --- a/training_args.bin +++ b/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a7bd8e997c05f23ae464180f8e5e9f881e9c68322e4fcd3f855e79e2e5d54fbb +oid sha256:39b105bc8a63684c00e408cee2101863b9ae4fed57fb146361599a16b19b549b size 5240