|
{ |
|
"best_metric": 0.6297643780708313, |
|
"best_model_checkpoint": "/models/hfhub/DewiBrynJones/wav2vec2-xlsr-53-ft-btb-cy/checkpoint-1000", |
|
"epoch": 5.657708628005658, |
|
"eval_steps": 500, |
|
"global_step": 2000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.1315417256011315, |
|
"grad_norm": 1.0976253747940063, |
|
"learning_rate": 0.000147375, |
|
"loss": 4.9658, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.4144271570014144, |
|
"eval_loss": 1.1673808097839355, |
|
"eval_runtime": 174.6298, |
|
"eval_samples_per_second": 32.389, |
|
"eval_steps_per_second": 1.014, |
|
"eval_wer": 0.802891945242413, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.263083451202263, |
|
"grad_norm": 2.727048397064209, |
|
"learning_rate": 0.00029587499999999997, |
|
"loss": 1.2376, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.828854314002829, |
|
"eval_loss": 0.6297643780708313, |
|
"eval_runtime": 181.3206, |
|
"eval_samples_per_second": 31.193, |
|
"eval_steps_per_second": 0.976, |
|
"eval_wer": 0.4413827414100239, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 3.3946251768033946, |
|
"grad_norm": 4.206020832061768, |
|
"learning_rate": 0.0002723571428571428, |
|
"loss": 0.8262, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 4.243281471004243, |
|
"eval_loss": 1.9106061458587646, |
|
"eval_runtime": 170.5081, |
|
"eval_samples_per_second": 33.171, |
|
"eval_steps_per_second": 1.038, |
|
"eval_wer": 0.8612444030748985, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.526166902404526, |
|
"grad_norm": 0.0, |
|
"learning_rate": 0.0002462142857142857, |
|
"loss": 1.653, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 5.657708628005658, |
|
"grad_norm": 0.0, |
|
"learning_rate": 0.00021792857142857142, |
|
"loss": 1.9941, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.657708628005658, |
|
"eval_loss": 1.9103525876998901, |
|
"eval_runtime": 170.4356, |
|
"eval_samples_per_second": 33.186, |
|
"eval_steps_per_second": 1.039, |
|
"eval_wer": 0.8610999662980854, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.657708628005658, |
|
"step": 2000, |
|
"total_flos": 1.5333464503060175e+19, |
|
"train_loss": 2.1353194427490236, |
|
"train_runtime": 5639.522, |
|
"train_samples_per_second": 56.742, |
|
"train_steps_per_second": 0.887 |
|
} |
|
], |
|
"logging_steps": 400, |
|
"max_steps": 5000, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 15, |
|
"save_steps": 500, |
|
"total_flos": 1.5333464503060175e+19, |
|
"train_batch_size": 32, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|