whisper-large-v2-eu-cv16_1 / trainer_state.json
zuazo's picture
End of training
f576733 verified
raw
history blame
204 kB
{
"best_metric": 7.451735188369549,
"best_model_checkpoint": "./checkpoint-13000",
"epoch": 401.50564617314933,
"eval_steps": 1000,
"global_step": 40000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.25,
"learning_rate": 5.000000000000001e-07,
"loss": 1.0482,
"step": 25
},
{
"epoch": 0.5,
"learning_rate": 9.800000000000001e-07,
"loss": 0.6567,
"step": 50
},
{
"epoch": 0.75,
"learning_rate": 1.48e-06,
"loss": 0.477,
"step": 75
},
{
"epoch": 1.0,
"learning_rate": 1.98e-06,
"loss": 0.4014,
"step": 100
},
{
"epoch": 1.25,
"learning_rate": 2.4800000000000004e-06,
"loss": 0.3432,
"step": 125
},
{
"epoch": 1.51,
"learning_rate": 2.9800000000000003e-06,
"loss": 0.301,
"step": 150
},
{
"epoch": 1.76,
"learning_rate": 3.48e-06,
"loss": 0.2734,
"step": 175
},
{
"epoch": 2.01,
"learning_rate": 3.980000000000001e-06,
"loss": 0.2445,
"step": 200
},
{
"epoch": 2.26,
"learning_rate": 4.48e-06,
"loss": 0.1973,
"step": 225
},
{
"epoch": 2.51,
"learning_rate": 4.960000000000001e-06,
"loss": 0.1906,
"step": 250
},
{
"epoch": 2.76,
"learning_rate": 5.460000000000001e-06,
"loss": 0.1791,
"step": 275
},
{
"epoch": 3.01,
"learning_rate": 5.9600000000000005e-06,
"loss": 0.1715,
"step": 300
},
{
"epoch": 3.26,
"learning_rate": 6.460000000000001e-06,
"loss": 0.1248,
"step": 325
},
{
"epoch": 3.51,
"learning_rate": 6.96e-06,
"loss": 0.1223,
"step": 350
},
{
"epoch": 3.76,
"learning_rate": 7.4600000000000006e-06,
"loss": 0.1242,
"step": 375
},
{
"epoch": 4.02,
"learning_rate": 7.960000000000002e-06,
"loss": 0.1217,
"step": 400
},
{
"epoch": 4.27,
"learning_rate": 8.46e-06,
"loss": 0.0816,
"step": 425
},
{
"epoch": 4.52,
"learning_rate": 8.96e-06,
"loss": 0.0817,
"step": 450
},
{
"epoch": 4.77,
"learning_rate": 9.460000000000001e-06,
"loss": 0.0858,
"step": 475
},
{
"epoch": 5.02,
"learning_rate": 9.960000000000001e-06,
"loss": 0.0818,
"step": 500
},
{
"epoch": 5.27,
"learning_rate": 9.994177215189874e-06,
"loss": 0.0518,
"step": 525
},
{
"epoch": 5.52,
"learning_rate": 9.987848101265824e-06,
"loss": 0.054,
"step": 550
},
{
"epoch": 5.77,
"learning_rate": 9.981518987341773e-06,
"loss": 0.0552,
"step": 575
},
{
"epoch": 6.02,
"learning_rate": 9.975189873417723e-06,
"loss": 0.0543,
"step": 600
},
{
"epoch": 6.27,
"learning_rate": 9.968860759493672e-06,
"loss": 0.0344,
"step": 625
},
{
"epoch": 6.52,
"learning_rate": 9.962531645569621e-06,
"loss": 0.0353,
"step": 650
},
{
"epoch": 6.78,
"learning_rate": 9.956202531645571e-06,
"loss": 0.0365,
"step": 675
},
{
"epoch": 7.03,
"learning_rate": 9.94987341772152e-06,
"loss": 0.0332,
"step": 700
},
{
"epoch": 7.28,
"learning_rate": 9.943544303797468e-06,
"loss": 0.021,
"step": 725
},
{
"epoch": 7.53,
"learning_rate": 9.937215189873417e-06,
"loss": 0.0227,
"step": 750
},
{
"epoch": 7.78,
"learning_rate": 9.930886075949367e-06,
"loss": 0.0216,
"step": 775
},
{
"epoch": 8.03,
"learning_rate": 9.924556962025316e-06,
"loss": 0.0223,
"step": 800
},
{
"epoch": 8.28,
"learning_rate": 9.918227848101266e-06,
"loss": 0.0145,
"step": 825
},
{
"epoch": 8.53,
"learning_rate": 9.911898734177215e-06,
"loss": 0.0146,
"step": 850
},
{
"epoch": 8.78,
"learning_rate": 9.905569620253165e-06,
"loss": 0.0157,
"step": 875
},
{
"epoch": 9.03,
"learning_rate": 9.899240506329116e-06,
"loss": 0.0157,
"step": 900
},
{
"epoch": 9.28,
"learning_rate": 9.892911392405065e-06,
"loss": 0.0105,
"step": 925
},
{
"epoch": 9.54,
"learning_rate": 9.886582278481015e-06,
"loss": 0.0101,
"step": 950
},
{
"epoch": 9.79,
"learning_rate": 9.880253164556964e-06,
"loss": 0.0109,
"step": 975
},
{
"epoch": 10.04,
"learning_rate": 9.873924050632913e-06,
"loss": 0.0112,
"step": 1000
},
{
"epoch": 10.04,
"eval_loss": 0.21815913915634155,
"eval_runtime": 2849.5314,
"eval_samples_per_second": 4.472,
"eval_steps_per_second": 0.28,
"eval_wer": 10.157104892918555,
"step": 1000
},
{
"epoch": 10.29,
"learning_rate": 9.867594936708861e-06,
"loss": 0.008,
"step": 1025
},
{
"epoch": 10.54,
"learning_rate": 9.86126582278481e-06,
"loss": 0.0089,
"step": 1050
},
{
"epoch": 10.79,
"learning_rate": 9.85493670886076e-06,
"loss": 0.0098,
"step": 1075
},
{
"epoch": 11.04,
"learning_rate": 9.84860759493671e-06,
"loss": 0.008,
"step": 1100
},
{
"epoch": 11.29,
"learning_rate": 9.842278481012659e-06,
"loss": 0.0055,
"step": 1125
},
{
"epoch": 11.54,
"learning_rate": 9.835949367088608e-06,
"loss": 0.0063,
"step": 1150
},
{
"epoch": 11.79,
"learning_rate": 9.829620253164558e-06,
"loss": 0.0067,
"step": 1175
},
{
"epoch": 12.05,
"learning_rate": 9.823291139240507e-06,
"loss": 0.0069,
"step": 1200
},
{
"epoch": 12.3,
"learning_rate": 9.816962025316457e-06,
"loss": 0.006,
"step": 1225
},
{
"epoch": 12.55,
"learning_rate": 9.810632911392406e-06,
"loss": 0.0067,
"step": 1250
},
{
"epoch": 12.8,
"learning_rate": 9.804303797468355e-06,
"loss": 0.0067,
"step": 1275
},
{
"epoch": 13.05,
"learning_rate": 9.797974683544305e-06,
"loss": 0.0061,
"step": 1300
},
{
"epoch": 13.3,
"learning_rate": 9.791645569620254e-06,
"loss": 0.0049,
"step": 1325
},
{
"epoch": 13.55,
"learning_rate": 9.785316455696204e-06,
"loss": 0.0043,
"step": 1350
},
{
"epoch": 13.8,
"learning_rate": 9.778987341772153e-06,
"loss": 0.0048,
"step": 1375
},
{
"epoch": 14.05,
"learning_rate": 9.772658227848103e-06,
"loss": 0.0057,
"step": 1400
},
{
"epoch": 14.3,
"learning_rate": 9.766329113924052e-06,
"loss": 0.0045,
"step": 1425
},
{
"epoch": 14.55,
"learning_rate": 9.760000000000001e-06,
"loss": 0.0047,
"step": 1450
},
{
"epoch": 14.81,
"learning_rate": 9.75367088607595e-06,
"loss": 0.0057,
"step": 1475
},
{
"epoch": 15.06,
"learning_rate": 9.747341772151899e-06,
"loss": 0.0061,
"step": 1500
},
{
"epoch": 15.31,
"learning_rate": 9.741012658227848e-06,
"loss": 0.0046,
"step": 1525
},
{
"epoch": 15.56,
"learning_rate": 9.734683544303797e-06,
"loss": 0.005,
"step": 1550
},
{
"epoch": 15.81,
"learning_rate": 9.728354430379747e-06,
"loss": 0.0047,
"step": 1575
},
{
"epoch": 16.06,
"learning_rate": 9.722025316455696e-06,
"loss": 0.0053,
"step": 1600
},
{
"epoch": 16.31,
"learning_rate": 9.715696202531646e-06,
"loss": 0.0042,
"step": 1625
},
{
"epoch": 16.56,
"learning_rate": 9.709367088607595e-06,
"loss": 0.0035,
"step": 1650
},
{
"epoch": 16.81,
"learning_rate": 9.703037974683545e-06,
"loss": 0.0034,
"step": 1675
},
{
"epoch": 17.06,
"learning_rate": 9.696708860759494e-06,
"loss": 0.0037,
"step": 1700
},
{
"epoch": 17.31,
"learning_rate": 9.690379746835445e-06,
"loss": 0.0033,
"step": 1725
},
{
"epoch": 17.57,
"learning_rate": 9.684050632911393e-06,
"loss": 0.0034,
"step": 1750
},
{
"epoch": 17.82,
"learning_rate": 9.677721518987342e-06,
"loss": 0.0033,
"step": 1775
},
{
"epoch": 18.07,
"learning_rate": 9.671392405063292e-06,
"loss": 0.0033,
"step": 1800
},
{
"epoch": 18.32,
"learning_rate": 9.665063291139241e-06,
"loss": 0.0033,
"step": 1825
},
{
"epoch": 18.57,
"learning_rate": 9.65873417721519e-06,
"loss": 0.0035,
"step": 1850
},
{
"epoch": 18.82,
"learning_rate": 9.65240506329114e-06,
"loss": 0.0036,
"step": 1875
},
{
"epoch": 19.07,
"learning_rate": 9.64607594936709e-06,
"loss": 0.0045,
"step": 1900
},
{
"epoch": 19.32,
"learning_rate": 9.639746835443039e-06,
"loss": 0.0041,
"step": 1925
},
{
"epoch": 19.57,
"learning_rate": 9.633417721518988e-06,
"loss": 0.0041,
"step": 1950
},
{
"epoch": 19.82,
"learning_rate": 9.627088607594938e-06,
"loss": 0.0039,
"step": 1975
},
{
"epoch": 20.08,
"learning_rate": 9.620759493670887e-06,
"loss": 0.0052,
"step": 2000
},
{
"epoch": 20.08,
"eval_loss": 0.23722027242183685,
"eval_runtime": 2841.2175,
"eval_samples_per_second": 4.485,
"eval_steps_per_second": 0.281,
"eval_wer": 9.627559793653274,
"step": 2000
},
{
"epoch": 20.33,
"learning_rate": 9.614430379746837e-06,
"loss": 0.0039,
"step": 2025
},
{
"epoch": 20.58,
"learning_rate": 9.608101265822786e-06,
"loss": 0.0037,
"step": 2050
},
{
"epoch": 20.83,
"learning_rate": 9.601772151898735e-06,
"loss": 0.004,
"step": 2075
},
{
"epoch": 21.08,
"learning_rate": 9.595443037974685e-06,
"loss": 0.0044,
"step": 2100
},
{
"epoch": 21.33,
"learning_rate": 9.589113924050634e-06,
"loss": 0.0032,
"step": 2125
},
{
"epoch": 21.58,
"learning_rate": 9.582784810126584e-06,
"loss": 0.0036,
"step": 2150
},
{
"epoch": 21.83,
"learning_rate": 9.576455696202533e-06,
"loss": 0.0038,
"step": 2175
},
{
"epoch": 22.08,
"learning_rate": 9.570126582278481e-06,
"loss": 0.0036,
"step": 2200
},
{
"epoch": 22.33,
"learning_rate": 9.56379746835443e-06,
"loss": 0.0035,
"step": 2225
},
{
"epoch": 22.58,
"learning_rate": 9.55746835443038e-06,
"loss": 0.0042,
"step": 2250
},
{
"epoch": 22.84,
"learning_rate": 9.551139240506329e-06,
"loss": 0.0039,
"step": 2275
},
{
"epoch": 23.09,
"learning_rate": 9.544810126582279e-06,
"loss": 0.0038,
"step": 2300
},
{
"epoch": 23.34,
"learning_rate": 9.538481012658228e-06,
"loss": 0.0038,
"step": 2325
},
{
"epoch": 23.59,
"learning_rate": 9.532151898734177e-06,
"loss": 0.0037,
"step": 2350
},
{
"epoch": 23.84,
"learning_rate": 9.525822784810127e-06,
"loss": 0.005,
"step": 2375
},
{
"epoch": 24.09,
"learning_rate": 9.519493670886076e-06,
"loss": 0.0043,
"step": 2400
},
{
"epoch": 24.34,
"learning_rate": 9.513164556962026e-06,
"loss": 0.0035,
"step": 2425
},
{
"epoch": 24.59,
"learning_rate": 9.506835443037975e-06,
"loss": 0.0032,
"step": 2450
},
{
"epoch": 24.84,
"learning_rate": 9.500506329113925e-06,
"loss": 0.0041,
"step": 2475
},
{
"epoch": 25.09,
"learning_rate": 9.494177215189874e-06,
"loss": 0.0029,
"step": 2500
},
{
"epoch": 25.35,
"learning_rate": 9.487848101265823e-06,
"loss": 0.0023,
"step": 2525
},
{
"epoch": 25.6,
"learning_rate": 9.481518987341773e-06,
"loss": 0.0022,
"step": 2550
},
{
"epoch": 25.85,
"learning_rate": 9.475189873417722e-06,
"loss": 0.003,
"step": 2575
},
{
"epoch": 26.1,
"learning_rate": 9.468860759493672e-06,
"loss": 0.0037,
"step": 2600
},
{
"epoch": 26.35,
"learning_rate": 9.462531645569621e-06,
"loss": 0.0027,
"step": 2625
},
{
"epoch": 26.6,
"learning_rate": 9.45620253164557e-06,
"loss": 0.0032,
"step": 2650
},
{
"epoch": 26.85,
"learning_rate": 9.44987341772152e-06,
"loss": 0.0033,
"step": 2675
},
{
"epoch": 27.1,
"learning_rate": 9.44354430379747e-06,
"loss": 0.0037,
"step": 2700
},
{
"epoch": 27.35,
"learning_rate": 9.437215189873419e-06,
"loss": 0.0031,
"step": 2725
},
{
"epoch": 27.6,
"learning_rate": 9.430886075949368e-06,
"loss": 0.0027,
"step": 2750
},
{
"epoch": 27.85,
"learning_rate": 9.424556962025318e-06,
"loss": 0.003,
"step": 2775
},
{
"epoch": 28.11,
"learning_rate": 9.418227848101267e-06,
"loss": 0.003,
"step": 2800
},
{
"epoch": 28.36,
"learning_rate": 9.411898734177217e-06,
"loss": 0.0025,
"step": 2825
},
{
"epoch": 28.61,
"learning_rate": 9.405569620253166e-06,
"loss": 0.0023,
"step": 2850
},
{
"epoch": 28.86,
"learning_rate": 9.399240506329115e-06,
"loss": 0.0027,
"step": 2875
},
{
"epoch": 29.11,
"learning_rate": 9.392911392405065e-06,
"loss": 0.0023,
"step": 2900
},
{
"epoch": 29.36,
"learning_rate": 9.386582278481014e-06,
"loss": 0.0022,
"step": 2925
},
{
"epoch": 29.61,
"learning_rate": 9.380253164556962e-06,
"loss": 0.0018,
"step": 2950
},
{
"epoch": 29.86,
"learning_rate": 9.373924050632911e-06,
"loss": 0.0018,
"step": 2975
},
{
"epoch": 30.11,
"learning_rate": 9.367594936708861e-06,
"loss": 0.0017,
"step": 3000
},
{
"epoch": 30.11,
"eval_loss": 0.24174295365810394,
"eval_runtime": 2833.8733,
"eval_samples_per_second": 4.496,
"eval_steps_per_second": 0.281,
"eval_wer": 9.014967953728311,
"step": 3000
},
{
"epoch": 30.36,
"learning_rate": 9.36126582278481e-06,
"loss": 0.0024,
"step": 3025
},
{
"epoch": 30.61,
"learning_rate": 9.355189873417723e-06,
"loss": 0.002,
"step": 3050
},
{
"epoch": 30.87,
"learning_rate": 9.348860759493671e-06,
"loss": 0.0025,
"step": 3075
},
{
"epoch": 31.12,
"learning_rate": 9.34253164556962e-06,
"loss": 0.0026,
"step": 3100
},
{
"epoch": 31.37,
"learning_rate": 9.33620253164557e-06,
"loss": 0.0024,
"step": 3125
},
{
"epoch": 31.62,
"learning_rate": 9.32987341772152e-06,
"loss": 0.0019,
"step": 3150
},
{
"epoch": 31.87,
"learning_rate": 9.323544303797469e-06,
"loss": 0.003,
"step": 3175
},
{
"epoch": 32.12,
"learning_rate": 9.317215189873418e-06,
"loss": 0.0026,
"step": 3200
},
{
"epoch": 32.37,
"learning_rate": 9.310886075949368e-06,
"loss": 0.003,
"step": 3225
},
{
"epoch": 32.62,
"learning_rate": 9.304556962025317e-06,
"loss": 0.0027,
"step": 3250
},
{
"epoch": 32.87,
"learning_rate": 9.298227848101267e-06,
"loss": 0.0032,
"step": 3275
},
{
"epoch": 33.12,
"learning_rate": 9.291898734177216e-06,
"loss": 0.0022,
"step": 3300
},
{
"epoch": 33.38,
"learning_rate": 9.285569620253165e-06,
"loss": 0.0018,
"step": 3325
},
{
"epoch": 33.63,
"learning_rate": 9.279240506329115e-06,
"loss": 0.0019,
"step": 3350
},
{
"epoch": 33.88,
"learning_rate": 9.272911392405064e-06,
"loss": 0.0019,
"step": 3375
},
{
"epoch": 34.13,
"learning_rate": 9.266582278481014e-06,
"loss": 0.0017,
"step": 3400
},
{
"epoch": 34.38,
"learning_rate": 9.260253164556963e-06,
"loss": 0.0015,
"step": 3425
},
{
"epoch": 34.63,
"learning_rate": 9.253924050632913e-06,
"loss": 0.0011,
"step": 3450
},
{
"epoch": 34.88,
"learning_rate": 9.247594936708862e-06,
"loss": 0.0015,
"step": 3475
},
{
"epoch": 35.13,
"learning_rate": 9.241265822784811e-06,
"loss": 0.0018,
"step": 3500
},
{
"epoch": 35.38,
"learning_rate": 9.23493670886076e-06,
"loss": 0.0014,
"step": 3525
},
{
"epoch": 35.63,
"learning_rate": 9.228607594936709e-06,
"loss": 0.002,
"step": 3550
},
{
"epoch": 35.88,
"learning_rate": 9.222278481012658e-06,
"loss": 0.0024,
"step": 3575
},
{
"epoch": 36.14,
"learning_rate": 9.215949367088607e-06,
"loss": 0.0026,
"step": 3600
},
{
"epoch": 36.39,
"learning_rate": 9.209620253164557e-06,
"loss": 0.0029,
"step": 3625
},
{
"epoch": 36.64,
"learning_rate": 9.203291139240506e-06,
"loss": 0.0032,
"step": 3650
},
{
"epoch": 36.89,
"learning_rate": 9.196962025316456e-06,
"loss": 0.0033,
"step": 3675
},
{
"epoch": 37.14,
"learning_rate": 9.190632911392405e-06,
"loss": 0.0036,
"step": 3700
},
{
"epoch": 37.39,
"learning_rate": 9.184303797468355e-06,
"loss": 0.0032,
"step": 3725
},
{
"epoch": 37.64,
"learning_rate": 9.177974683544306e-06,
"loss": 0.0027,
"step": 3750
},
{
"epoch": 37.89,
"learning_rate": 9.171645569620255e-06,
"loss": 0.0033,
"step": 3775
},
{
"epoch": 38.14,
"learning_rate": 9.165316455696205e-06,
"loss": 0.0032,
"step": 3800
},
{
"epoch": 38.39,
"learning_rate": 9.158987341772152e-06,
"loss": 0.0023,
"step": 3825
},
{
"epoch": 38.64,
"learning_rate": 9.152658227848102e-06,
"loss": 0.0024,
"step": 3850
},
{
"epoch": 38.9,
"learning_rate": 9.146329113924051e-06,
"loss": 0.003,
"step": 3875
},
{
"epoch": 39.15,
"learning_rate": 9.14e-06,
"loss": 0.0024,
"step": 3900
},
{
"epoch": 39.4,
"learning_rate": 9.13367088607595e-06,
"loss": 0.0018,
"step": 3925
},
{
"epoch": 39.65,
"learning_rate": 9.1273417721519e-06,
"loss": 0.0023,
"step": 3950
},
{
"epoch": 39.9,
"learning_rate": 9.121012658227849e-06,
"loss": 0.0023,
"step": 3975
},
{
"epoch": 40.15,
"learning_rate": 9.114683544303798e-06,
"loss": 0.0022,
"step": 4000
},
{
"epoch": 40.15,
"eval_loss": 0.2340633124113083,
"eval_runtime": 2834.4887,
"eval_samples_per_second": 4.495,
"eval_steps_per_second": 0.281,
"eval_wer": 8.893817414413006,
"step": 4000
},
{
"epoch": 40.4,
"learning_rate": 9.108354430379748e-06,
"loss": 0.0021,
"step": 4025
},
{
"epoch": 40.65,
"learning_rate": 9.102025316455697e-06,
"loss": 0.002,
"step": 4050
},
{
"epoch": 40.9,
"learning_rate": 9.095696202531647e-06,
"loss": 0.0022,
"step": 4075
},
{
"epoch": 41.15,
"learning_rate": 9.089367088607596e-06,
"loss": 0.0021,
"step": 4100
},
{
"epoch": 41.41,
"learning_rate": 9.083037974683545e-06,
"loss": 0.0023,
"step": 4125
},
{
"epoch": 41.66,
"learning_rate": 9.076708860759495e-06,
"loss": 0.0025,
"step": 4150
},
{
"epoch": 41.91,
"learning_rate": 9.070379746835444e-06,
"loss": 0.0028,
"step": 4175
},
{
"epoch": 42.16,
"learning_rate": 9.064050632911394e-06,
"loss": 0.0028,
"step": 4200
},
{
"epoch": 42.41,
"learning_rate": 9.057721518987343e-06,
"loss": 0.0022,
"step": 4225
},
{
"epoch": 42.66,
"learning_rate": 9.051392405063293e-06,
"loss": 0.0017,
"step": 4250
},
{
"epoch": 42.91,
"learning_rate": 9.04506329113924e-06,
"loss": 0.0022,
"step": 4275
},
{
"epoch": 43.16,
"learning_rate": 9.03873417721519e-06,
"loss": 0.0019,
"step": 4300
},
{
"epoch": 43.41,
"learning_rate": 9.03240506329114e-06,
"loss": 0.0014,
"step": 4325
},
{
"epoch": 43.66,
"learning_rate": 9.026075949367089e-06,
"loss": 0.0025,
"step": 4350
},
{
"epoch": 43.91,
"learning_rate": 9.019746835443038e-06,
"loss": 0.0021,
"step": 4375
},
{
"epoch": 44.17,
"learning_rate": 9.013417721518987e-06,
"loss": 0.0021,
"step": 4400
},
{
"epoch": 44.42,
"learning_rate": 9.007088607594937e-06,
"loss": 0.0022,
"step": 4425
},
{
"epoch": 44.67,
"learning_rate": 9.000759493670886e-06,
"loss": 0.0019,
"step": 4450
},
{
"epoch": 44.92,
"learning_rate": 8.994430379746836e-06,
"loss": 0.0023,
"step": 4475
},
{
"epoch": 45.17,
"learning_rate": 8.988101265822785e-06,
"loss": 0.002,
"step": 4500
},
{
"epoch": 45.42,
"learning_rate": 8.981772151898735e-06,
"loss": 0.0018,
"step": 4525
},
{
"epoch": 45.67,
"learning_rate": 8.975443037974684e-06,
"loss": 0.0025,
"step": 4550
},
{
"epoch": 45.92,
"learning_rate": 8.969113924050633e-06,
"loss": 0.0021,
"step": 4575
},
{
"epoch": 46.17,
"learning_rate": 8.962784810126583e-06,
"loss": 0.0018,
"step": 4600
},
{
"epoch": 46.42,
"learning_rate": 8.956455696202532e-06,
"loss": 0.0021,
"step": 4625
},
{
"epoch": 46.68,
"learning_rate": 8.950126582278482e-06,
"loss": 0.0019,
"step": 4650
},
{
"epoch": 46.93,
"learning_rate": 8.943797468354431e-06,
"loss": 0.0024,
"step": 4675
},
{
"epoch": 47.18,
"learning_rate": 8.93746835443038e-06,
"loss": 0.0019,
"step": 4700
},
{
"epoch": 47.43,
"learning_rate": 8.93113924050633e-06,
"loss": 0.0021,
"step": 4725
},
{
"epoch": 47.68,
"learning_rate": 8.92481012658228e-06,
"loss": 0.0026,
"step": 4750
},
{
"epoch": 47.93,
"learning_rate": 8.918481012658229e-06,
"loss": 0.002,
"step": 4775
},
{
"epoch": 48.18,
"learning_rate": 8.912151898734178e-06,
"loss": 0.0023,
"step": 4800
},
{
"epoch": 48.43,
"learning_rate": 8.905822784810128e-06,
"loss": 0.002,
"step": 4825
},
{
"epoch": 48.68,
"learning_rate": 8.899493670886077e-06,
"loss": 0.0021,
"step": 4850
},
{
"epoch": 48.93,
"learning_rate": 8.893164556962027e-06,
"loss": 0.0022,
"step": 4875
},
{
"epoch": 49.18,
"learning_rate": 8.886835443037976e-06,
"loss": 0.0015,
"step": 4900
},
{
"epoch": 49.44,
"learning_rate": 8.880506329113925e-06,
"loss": 0.0014,
"step": 4925
},
{
"epoch": 49.69,
"learning_rate": 8.874177215189875e-06,
"loss": 0.002,
"step": 4950
},
{
"epoch": 49.94,
"learning_rate": 8.867848101265824e-06,
"loss": 0.0023,
"step": 4975
},
{
"epoch": 50.19,
"learning_rate": 8.861518987341772e-06,
"loss": 0.0023,
"step": 5000
},
{
"epoch": 50.19,
"eval_loss": 0.24509792029857635,
"eval_runtime": 2843.0455,
"eval_samples_per_second": 4.482,
"eval_steps_per_second": 0.28,
"eval_wer": 8.93876035641707,
"step": 5000
},
{
"epoch": 50.44,
"learning_rate": 8.855189873417721e-06,
"loss": 0.002,
"step": 5025
},
{
"epoch": 50.69,
"learning_rate": 8.848860759493671e-06,
"loss": 0.002,
"step": 5050
},
{
"epoch": 50.94,
"learning_rate": 8.84253164556962e-06,
"loss": 0.0021,
"step": 5075
},
{
"epoch": 51.19,
"learning_rate": 8.83620253164557e-06,
"loss": 0.0018,
"step": 5100
},
{
"epoch": 51.44,
"learning_rate": 8.829873417721519e-06,
"loss": 0.0017,
"step": 5125
},
{
"epoch": 51.69,
"learning_rate": 8.823544303797469e-06,
"loss": 0.0023,
"step": 5150
},
{
"epoch": 51.94,
"learning_rate": 8.817215189873418e-06,
"loss": 0.0023,
"step": 5175
},
{
"epoch": 52.2,
"learning_rate": 8.810886075949367e-06,
"loss": 0.0015,
"step": 5200
},
{
"epoch": 52.45,
"learning_rate": 8.804556962025317e-06,
"loss": 0.0023,
"step": 5225
},
{
"epoch": 52.7,
"learning_rate": 8.798227848101266e-06,
"loss": 0.0022,
"step": 5250
},
{
"epoch": 52.95,
"learning_rate": 8.791898734177216e-06,
"loss": 0.0028,
"step": 5275
},
{
"epoch": 53.2,
"learning_rate": 8.785569620253165e-06,
"loss": 0.0019,
"step": 5300
},
{
"epoch": 53.45,
"learning_rate": 8.779240506329115e-06,
"loss": 0.002,
"step": 5325
},
{
"epoch": 53.7,
"learning_rate": 8.772911392405064e-06,
"loss": 0.002,
"step": 5350
},
{
"epoch": 53.95,
"learning_rate": 8.766582278481013e-06,
"loss": 0.0019,
"step": 5375
},
{
"epoch": 54.2,
"learning_rate": 8.760253164556963e-06,
"loss": 0.0012,
"step": 5400
},
{
"epoch": 54.45,
"learning_rate": 8.753924050632912e-06,
"loss": 0.0012,
"step": 5425
},
{
"epoch": 54.71,
"learning_rate": 8.747594936708862e-06,
"loss": 0.0013,
"step": 5450
},
{
"epoch": 54.96,
"learning_rate": 8.741265822784811e-06,
"loss": 0.0018,
"step": 5475
},
{
"epoch": 55.21,
"learning_rate": 8.73493670886076e-06,
"loss": 0.0014,
"step": 5500
},
{
"epoch": 55.46,
"learning_rate": 8.72860759493671e-06,
"loss": 0.0017,
"step": 5525
},
{
"epoch": 55.71,
"learning_rate": 8.72227848101266e-06,
"loss": 0.0015,
"step": 5550
},
{
"epoch": 55.96,
"learning_rate": 8.715949367088609e-06,
"loss": 0.0017,
"step": 5575
},
{
"epoch": 56.21,
"learning_rate": 8.709620253164558e-06,
"loss": 0.0009,
"step": 5600
},
{
"epoch": 56.46,
"learning_rate": 8.703291139240508e-06,
"loss": 0.0008,
"step": 5625
},
{
"epoch": 56.71,
"learning_rate": 8.696962025316457e-06,
"loss": 0.0012,
"step": 5650
},
{
"epoch": 56.96,
"learning_rate": 8.690632911392407e-06,
"loss": 0.0014,
"step": 5675
},
{
"epoch": 57.21,
"learning_rate": 8.684303797468356e-06,
"loss": 0.0012,
"step": 5700
},
{
"epoch": 57.47,
"learning_rate": 8.677974683544305e-06,
"loss": 0.0007,
"step": 5725
},
{
"epoch": 57.72,
"learning_rate": 8.671645569620253e-06,
"loss": 0.0008,
"step": 5750
},
{
"epoch": 57.97,
"learning_rate": 8.665316455696203e-06,
"loss": 0.0014,
"step": 5775
},
{
"epoch": 58.22,
"learning_rate": 8.658987341772152e-06,
"loss": 0.0011,
"step": 5800
},
{
"epoch": 58.47,
"learning_rate": 8.652658227848101e-06,
"loss": 0.0009,
"step": 5825
},
{
"epoch": 58.72,
"learning_rate": 8.646329113924051e-06,
"loss": 0.0012,
"step": 5850
},
{
"epoch": 58.97,
"learning_rate": 8.64e-06,
"loss": 0.0011,
"step": 5875
},
{
"epoch": 59.22,
"learning_rate": 8.63367088607595e-06,
"loss": 0.0008,
"step": 5900
},
{
"epoch": 59.47,
"learning_rate": 8.627341772151899e-06,
"loss": 0.0006,
"step": 5925
},
{
"epoch": 59.72,
"learning_rate": 8.621012658227849e-06,
"loss": 0.0006,
"step": 5950
},
{
"epoch": 59.97,
"learning_rate": 8.614683544303798e-06,
"loss": 0.0007,
"step": 5975
},
{
"epoch": 60.23,
"learning_rate": 8.608354430379747e-06,
"loss": 0.0006,
"step": 6000
},
{
"epoch": 60.23,
"eval_loss": 0.25170740485191345,
"eval_runtime": 2836.0485,
"eval_samples_per_second": 4.493,
"eval_steps_per_second": 0.281,
"eval_wer": 8.416054400500235,
"step": 6000
},
{
"epoch": 60.48,
"learning_rate": 8.602025316455697e-06,
"loss": 0.0008,
"step": 6025
},
{
"epoch": 60.73,
"learning_rate": 8.595696202531646e-06,
"loss": 0.0007,
"step": 6050
},
{
"epoch": 60.98,
"learning_rate": 8.589367088607596e-06,
"loss": 0.001,
"step": 6075
},
{
"epoch": 61.23,
"learning_rate": 8.583037974683545e-06,
"loss": 0.0007,
"step": 6100
},
{
"epoch": 61.48,
"learning_rate": 8.576708860759495e-06,
"loss": 0.0009,
"step": 6125
},
{
"epoch": 61.73,
"learning_rate": 8.570379746835444e-06,
"loss": 0.0015,
"step": 6150
},
{
"epoch": 61.98,
"learning_rate": 8.564050632911393e-06,
"loss": 0.0012,
"step": 6175
},
{
"epoch": 62.23,
"learning_rate": 8.557721518987341e-06,
"loss": 0.0012,
"step": 6200
},
{
"epoch": 62.48,
"learning_rate": 8.551392405063292e-06,
"loss": 0.0016,
"step": 6225
},
{
"epoch": 62.74,
"learning_rate": 8.545063291139242e-06,
"loss": 0.0013,
"step": 6250
},
{
"epoch": 62.99,
"learning_rate": 8.538734177215191e-06,
"loss": 0.0019,
"step": 6275
},
{
"epoch": 63.24,
"learning_rate": 8.53240506329114e-06,
"loss": 0.002,
"step": 6300
},
{
"epoch": 63.49,
"learning_rate": 8.52607594936709e-06,
"loss": 0.0026,
"step": 6325
},
{
"epoch": 63.74,
"learning_rate": 8.51974683544304e-06,
"loss": 0.0024,
"step": 6350
},
{
"epoch": 63.99,
"learning_rate": 8.513417721518989e-06,
"loss": 0.0027,
"step": 6375
},
{
"epoch": 64.24,
"learning_rate": 8.507088607594938e-06,
"loss": 0.0018,
"step": 6400
},
{
"epoch": 64.49,
"learning_rate": 8.500759493670888e-06,
"loss": 0.0017,
"step": 6425
},
{
"epoch": 64.74,
"learning_rate": 8.494430379746837e-06,
"loss": 0.0021,
"step": 6450
},
{
"epoch": 64.99,
"learning_rate": 8.488101265822787e-06,
"loss": 0.002,
"step": 6475
},
{
"epoch": 65.24,
"learning_rate": 8.481772151898734e-06,
"loss": 0.0017,
"step": 6500
},
{
"epoch": 65.5,
"learning_rate": 8.475443037974684e-06,
"loss": 0.002,
"step": 6525
},
{
"epoch": 65.75,
"learning_rate": 8.469113924050633e-06,
"loss": 0.0022,
"step": 6550
},
{
"epoch": 66.0,
"learning_rate": 8.462784810126583e-06,
"loss": 0.0018,
"step": 6575
},
{
"epoch": 66.25,
"learning_rate": 8.456455696202532e-06,
"loss": 0.0015,
"step": 6600
},
{
"epoch": 66.5,
"learning_rate": 8.450126582278481e-06,
"loss": 0.0011,
"step": 6625
},
{
"epoch": 66.75,
"learning_rate": 8.443797468354431e-06,
"loss": 0.0019,
"step": 6650
},
{
"epoch": 67.0,
"learning_rate": 8.43746835443038e-06,
"loss": 0.0018,
"step": 6675
},
{
"epoch": 67.25,
"learning_rate": 8.43113924050633e-06,
"loss": 0.0021,
"step": 6700
},
{
"epoch": 67.5,
"learning_rate": 8.424810126582279e-06,
"loss": 0.0016,
"step": 6725
},
{
"epoch": 67.75,
"learning_rate": 8.418481012658229e-06,
"loss": 0.0016,
"step": 6750
},
{
"epoch": 68.01,
"learning_rate": 8.412151898734178e-06,
"loss": 0.0025,
"step": 6775
},
{
"epoch": 68.26,
"learning_rate": 8.405822784810127e-06,
"loss": 0.0016,
"step": 6800
},
{
"epoch": 68.51,
"learning_rate": 8.399493670886077e-06,
"loss": 0.0017,
"step": 6825
},
{
"epoch": 68.76,
"learning_rate": 8.393164556962026e-06,
"loss": 0.0012,
"step": 6850
},
{
"epoch": 69.01,
"learning_rate": 8.386835443037976e-06,
"loss": 0.0014,
"step": 6875
},
{
"epoch": 69.26,
"learning_rate": 8.380506329113925e-06,
"loss": 0.0008,
"step": 6900
},
{
"epoch": 69.51,
"learning_rate": 8.374177215189873e-06,
"loss": 0.0007,
"step": 6925
},
{
"epoch": 69.76,
"learning_rate": 8.367848101265822e-06,
"loss": 0.0009,
"step": 6950
},
{
"epoch": 70.01,
"learning_rate": 8.361518987341772e-06,
"loss": 0.0009,
"step": 6975
},
{
"epoch": 70.26,
"learning_rate": 8.355189873417721e-06,
"loss": 0.0006,
"step": 7000
},
{
"epoch": 70.26,
"eval_loss": 0.24993743002414703,
"eval_runtime": 2839.6991,
"eval_samples_per_second": 4.487,
"eval_steps_per_second": 0.281,
"eval_wer": 8.098522745036735,
"step": 7000
},
{
"epoch": 70.51,
"learning_rate": 8.34886075949367e-06,
"loss": 0.0006,
"step": 7025
},
{
"epoch": 70.77,
"learning_rate": 8.342531645569622e-06,
"loss": 0.0006,
"step": 7050
},
{
"epoch": 71.02,
"learning_rate": 8.336202531645571e-06,
"loss": 0.0004,
"step": 7075
},
{
"epoch": 71.27,
"learning_rate": 8.32987341772152e-06,
"loss": 0.0005,
"step": 7100
},
{
"epoch": 71.52,
"learning_rate": 8.32354430379747e-06,
"loss": 0.0004,
"step": 7125
},
{
"epoch": 71.77,
"learning_rate": 8.31721518987342e-06,
"loss": 0.0004,
"step": 7150
},
{
"epoch": 72.02,
"learning_rate": 8.310886075949369e-06,
"loss": 0.0005,
"step": 7175
},
{
"epoch": 72.27,
"learning_rate": 8.304556962025318e-06,
"loss": 0.001,
"step": 7200
},
{
"epoch": 72.52,
"learning_rate": 8.298227848101266e-06,
"loss": 0.0015,
"step": 7225
},
{
"epoch": 72.77,
"learning_rate": 8.291898734177215e-06,
"loss": 0.0015,
"step": 7250
},
{
"epoch": 73.02,
"learning_rate": 8.285569620253165e-06,
"loss": 0.0015,
"step": 7275
},
{
"epoch": 73.27,
"learning_rate": 8.279240506329114e-06,
"loss": 0.0016,
"step": 7300
},
{
"epoch": 73.53,
"learning_rate": 8.272911392405064e-06,
"loss": 0.001,
"step": 7325
},
{
"epoch": 73.78,
"learning_rate": 8.266582278481013e-06,
"loss": 0.0015,
"step": 7350
},
{
"epoch": 74.03,
"learning_rate": 8.260253164556963e-06,
"loss": 0.0023,
"step": 7375
},
{
"epoch": 74.28,
"learning_rate": 8.253924050632912e-06,
"loss": 0.0016,
"step": 7400
},
{
"epoch": 74.53,
"learning_rate": 8.247594936708861e-06,
"loss": 0.0017,
"step": 7425
},
{
"epoch": 74.78,
"learning_rate": 8.24126582278481e-06,
"loss": 0.0016,
"step": 7450
},
{
"epoch": 75.03,
"learning_rate": 8.23493670886076e-06,
"loss": 0.0019,
"step": 7475
},
{
"epoch": 75.28,
"learning_rate": 8.22860759493671e-06,
"loss": 0.0022,
"step": 7500
},
{
"epoch": 75.53,
"learning_rate": 8.222278481012659e-06,
"loss": 0.0017,
"step": 7525
},
{
"epoch": 75.78,
"learning_rate": 8.215949367088609e-06,
"loss": 0.0016,
"step": 7550
},
{
"epoch": 76.04,
"learning_rate": 8.209620253164558e-06,
"loss": 0.0014,
"step": 7575
},
{
"epoch": 76.29,
"learning_rate": 8.203291139240507e-06,
"loss": 0.0013,
"step": 7600
},
{
"epoch": 76.54,
"learning_rate": 8.196962025316457e-06,
"loss": 0.0013,
"step": 7625
},
{
"epoch": 76.79,
"learning_rate": 8.190632911392406e-06,
"loss": 0.0014,
"step": 7650
},
{
"epoch": 77.04,
"learning_rate": 8.184303797468354e-06,
"loss": 0.0017,
"step": 7675
},
{
"epoch": 77.29,
"learning_rate": 8.177974683544303e-06,
"loss": 0.0016,
"step": 7700
},
{
"epoch": 77.54,
"learning_rate": 8.171645569620253e-06,
"loss": 0.0013,
"step": 7725
},
{
"epoch": 77.79,
"learning_rate": 8.165316455696202e-06,
"loss": 0.0014,
"step": 7750
},
{
"epoch": 78.04,
"learning_rate": 8.158987341772152e-06,
"loss": 0.0009,
"step": 7775
},
{
"epoch": 78.29,
"learning_rate": 8.152658227848101e-06,
"loss": 0.0007,
"step": 7800
},
{
"epoch": 78.54,
"learning_rate": 8.14632911392405e-06,
"loss": 0.0009,
"step": 7825
},
{
"epoch": 78.8,
"learning_rate": 8.14e-06,
"loss": 0.0005,
"step": 7850
},
{
"epoch": 79.05,
"learning_rate": 8.133670886075951e-06,
"loss": 0.0012,
"step": 7875
},
{
"epoch": 79.3,
"learning_rate": 8.1273417721519e-06,
"loss": 0.0009,
"step": 7900
},
{
"epoch": 79.55,
"learning_rate": 8.12101265822785e-06,
"loss": 0.0006,
"step": 7925
},
{
"epoch": 79.8,
"learning_rate": 8.1146835443038e-06,
"loss": 0.0008,
"step": 7950
},
{
"epoch": 80.05,
"learning_rate": 8.108354430379747e-06,
"loss": 0.0008,
"step": 7975
},
{
"epoch": 80.3,
"learning_rate": 8.102025316455697e-06,
"loss": 0.0008,
"step": 8000
},
{
"epoch": 80.3,
"eval_loss": 0.25484558939933777,
"eval_runtime": 2843.0839,
"eval_samples_per_second": 4.482,
"eval_steps_per_second": 0.28,
"eval_wer": 8.34668594653744,
"step": 8000
},
{
"epoch": 80.55,
"learning_rate": 8.095696202531646e-06,
"loss": 0.0014,
"step": 8025
},
{
"epoch": 80.8,
"learning_rate": 8.089367088607595e-06,
"loss": 0.0012,
"step": 8050
},
{
"epoch": 81.05,
"learning_rate": 8.083037974683545e-06,
"loss": 0.0018,
"step": 8075
},
{
"epoch": 81.3,
"learning_rate": 8.076708860759494e-06,
"loss": 0.0017,
"step": 8100
},
{
"epoch": 81.56,
"learning_rate": 8.070379746835444e-06,
"loss": 0.0011,
"step": 8125
},
{
"epoch": 81.81,
"learning_rate": 8.064050632911393e-06,
"loss": 0.0011,
"step": 8150
},
{
"epoch": 82.06,
"learning_rate": 8.057721518987343e-06,
"loss": 0.0012,
"step": 8175
},
{
"epoch": 82.31,
"learning_rate": 8.051392405063292e-06,
"loss": 0.0009,
"step": 8200
},
{
"epoch": 82.56,
"learning_rate": 8.045063291139241e-06,
"loss": 0.0011,
"step": 8225
},
{
"epoch": 82.81,
"learning_rate": 8.03873417721519e-06,
"loss": 0.0013,
"step": 8250
},
{
"epoch": 83.06,
"learning_rate": 8.03240506329114e-06,
"loss": 0.0012,
"step": 8275
},
{
"epoch": 83.31,
"learning_rate": 8.02607594936709e-06,
"loss": 0.0009,
"step": 8300
},
{
"epoch": 83.56,
"learning_rate": 8.019746835443039e-06,
"loss": 0.0012,
"step": 8325
},
{
"epoch": 83.81,
"learning_rate": 8.013417721518989e-06,
"loss": 0.001,
"step": 8350
},
{
"epoch": 84.07,
"learning_rate": 8.007088607594938e-06,
"loss": 0.001,
"step": 8375
},
{
"epoch": 84.32,
"learning_rate": 8.000759493670887e-06,
"loss": 0.0006,
"step": 8400
},
{
"epoch": 84.57,
"learning_rate": 7.994430379746835e-06,
"loss": 0.0006,
"step": 8425
},
{
"epoch": 84.82,
"learning_rate": 7.988101265822785e-06,
"loss": 0.0007,
"step": 8450
},
{
"epoch": 85.07,
"learning_rate": 7.981772151898734e-06,
"loss": 0.0008,
"step": 8475
},
{
"epoch": 85.32,
"learning_rate": 7.975443037974683e-06,
"loss": 0.0009,
"step": 8500
},
{
"epoch": 85.57,
"learning_rate": 7.969113924050633e-06,
"loss": 0.0015,
"step": 8525
},
{
"epoch": 85.82,
"learning_rate": 7.962784810126582e-06,
"loss": 0.0013,
"step": 8550
},
{
"epoch": 86.07,
"learning_rate": 7.956455696202532e-06,
"loss": 0.0014,
"step": 8575
},
{
"epoch": 86.32,
"learning_rate": 7.950126582278481e-06,
"loss": 0.0016,
"step": 8600
},
{
"epoch": 86.57,
"learning_rate": 7.94379746835443e-06,
"loss": 0.0013,
"step": 8625
},
{
"epoch": 86.83,
"learning_rate": 7.93746835443038e-06,
"loss": 0.0014,
"step": 8650
},
{
"epoch": 87.08,
"learning_rate": 7.93113924050633e-06,
"loss": 0.0015,
"step": 8675
},
{
"epoch": 87.33,
"learning_rate": 7.924810126582279e-06,
"loss": 0.0017,
"step": 8700
},
{
"epoch": 87.58,
"learning_rate": 7.918481012658228e-06,
"loss": 0.0018,
"step": 8725
},
{
"epoch": 87.83,
"learning_rate": 7.912151898734178e-06,
"loss": 0.0016,
"step": 8750
},
{
"epoch": 88.08,
"learning_rate": 7.905822784810127e-06,
"loss": 0.0015,
"step": 8775
},
{
"epoch": 88.33,
"learning_rate": 7.899493670886077e-06,
"loss": 0.0014,
"step": 8800
},
{
"epoch": 88.58,
"learning_rate": 7.893164556962026e-06,
"loss": 0.0011,
"step": 8825
},
{
"epoch": 88.83,
"learning_rate": 7.886835443037975e-06,
"loss": 0.0011,
"step": 8850
},
{
"epoch": 89.08,
"learning_rate": 7.880506329113925e-06,
"loss": 0.0011,
"step": 8875
},
{
"epoch": 89.34,
"learning_rate": 7.874177215189874e-06,
"loss": 0.0009,
"step": 8900
},
{
"epoch": 89.59,
"learning_rate": 7.867848101265824e-06,
"loss": 0.001,
"step": 8925
},
{
"epoch": 89.84,
"learning_rate": 7.861518987341773e-06,
"loss": 0.0008,
"step": 8950
},
{
"epoch": 90.09,
"learning_rate": 7.855189873417723e-06,
"loss": 0.0005,
"step": 8975
},
{
"epoch": 90.34,
"learning_rate": 7.848860759493672e-06,
"loss": 0.0004,
"step": 9000
},
{
"epoch": 90.34,
"eval_loss": 0.2497812658548355,
"eval_runtime": 2842.9475,
"eval_samples_per_second": 4.482,
"eval_steps_per_second": 0.28,
"eval_wer": 7.955877755197749,
"step": 9000
},
{
"epoch": 90.59,
"learning_rate": 7.842531645569621e-06,
"loss": 0.0003,
"step": 9025
},
{
"epoch": 90.84,
"learning_rate": 7.83620253164557e-06,
"loss": 0.0005,
"step": 9050
},
{
"epoch": 91.09,
"learning_rate": 7.82987341772152e-06,
"loss": 0.0007,
"step": 9075
},
{
"epoch": 91.34,
"learning_rate": 7.82354430379747e-06,
"loss": 0.0012,
"step": 9100
},
{
"epoch": 91.59,
"learning_rate": 7.817215189873419e-06,
"loss": 0.0014,
"step": 9125
},
{
"epoch": 91.84,
"learning_rate": 7.810886075949367e-06,
"loss": 0.0012,
"step": 9150
},
{
"epoch": 92.1,
"learning_rate": 7.804556962025316e-06,
"loss": 0.001,
"step": 9175
},
{
"epoch": 92.35,
"learning_rate": 7.798227848101266e-06,
"loss": 0.001,
"step": 9200
},
{
"epoch": 92.6,
"learning_rate": 7.791898734177215e-06,
"loss": 0.0009,
"step": 9225
},
{
"epoch": 92.85,
"learning_rate": 7.785569620253165e-06,
"loss": 0.0008,
"step": 9250
},
{
"epoch": 93.1,
"learning_rate": 7.779240506329114e-06,
"loss": 0.0012,
"step": 9275
},
{
"epoch": 93.35,
"learning_rate": 7.772911392405063e-06,
"loss": 0.0008,
"step": 9300
},
{
"epoch": 93.6,
"learning_rate": 7.766582278481013e-06,
"loss": 0.001,
"step": 9325
},
{
"epoch": 93.85,
"learning_rate": 7.760253164556962e-06,
"loss": 0.0017,
"step": 9350
},
{
"epoch": 94.1,
"learning_rate": 7.753924050632912e-06,
"loss": 0.0017,
"step": 9375
},
{
"epoch": 94.35,
"learning_rate": 7.747594936708861e-06,
"loss": 0.0011,
"step": 9400
},
{
"epoch": 94.6,
"learning_rate": 7.74126582278481e-06,
"loss": 0.0015,
"step": 9425
},
{
"epoch": 94.86,
"learning_rate": 7.73493670886076e-06,
"loss": 0.0012,
"step": 9450
},
{
"epoch": 95.11,
"learning_rate": 7.72860759493671e-06,
"loss": 0.001,
"step": 9475
},
{
"epoch": 95.36,
"learning_rate": 7.722278481012659e-06,
"loss": 0.001,
"step": 9500
},
{
"epoch": 95.61,
"learning_rate": 7.715949367088608e-06,
"loss": 0.0011,
"step": 9525
},
{
"epoch": 95.86,
"learning_rate": 7.709620253164558e-06,
"loss": 0.0011,
"step": 9550
},
{
"epoch": 96.11,
"learning_rate": 7.703291139240507e-06,
"loss": 0.0009,
"step": 9575
},
{
"epoch": 96.36,
"learning_rate": 7.696962025316457e-06,
"loss": 0.0014,
"step": 9600
},
{
"epoch": 96.61,
"learning_rate": 7.690632911392406e-06,
"loss": 0.0017,
"step": 9625
},
{
"epoch": 96.86,
"learning_rate": 7.684303797468355e-06,
"loss": 0.0013,
"step": 9650
},
{
"epoch": 97.11,
"learning_rate": 7.677974683544305e-06,
"loss": 0.001,
"step": 9675
},
{
"epoch": 97.37,
"learning_rate": 7.671645569620254e-06,
"loss": 0.0009,
"step": 9700
},
{
"epoch": 97.62,
"learning_rate": 7.665316455696204e-06,
"loss": 0.0007,
"step": 9725
},
{
"epoch": 97.87,
"learning_rate": 7.658987341772153e-06,
"loss": 0.0008,
"step": 9750
},
{
"epoch": 98.12,
"learning_rate": 7.652658227848103e-06,
"loss": 0.0007,
"step": 9775
},
{
"epoch": 98.37,
"learning_rate": 7.646329113924052e-06,
"loss": 0.0007,
"step": 9800
},
{
"epoch": 98.62,
"learning_rate": 7.640000000000001e-06,
"loss": 0.0005,
"step": 9825
},
{
"epoch": 98.87,
"learning_rate": 7.63367088607595e-06,
"loss": 0.0005,
"step": 9850
},
{
"epoch": 99.12,
"learning_rate": 7.627341772151899e-06,
"loss": 0.0002,
"step": 9875
},
{
"epoch": 99.37,
"learning_rate": 7.621012658227849e-06,
"loss": 0.0003,
"step": 9900
},
{
"epoch": 99.62,
"learning_rate": 7.614683544303798e-06,
"loss": 0.0003,
"step": 9925
},
{
"epoch": 99.87,
"learning_rate": 7.608354430379748e-06,
"loss": 0.0003,
"step": 9950
},
{
"epoch": 100.13,
"learning_rate": 7.602025316455697e-06,
"loss": 0.0002,
"step": 9975
},
{
"epoch": 100.38,
"learning_rate": 7.595696202531646e-06,
"loss": 0.0003,
"step": 10000
},
{
"epoch": 100.38,
"eval_loss": 0.24893002212047577,
"eval_runtime": 2830.2725,
"eval_samples_per_second": 4.502,
"eval_steps_per_second": 0.282,
"eval_wer": 7.694036267000157,
"step": 10000
},
{
"epoch": 100.63,
"learning_rate": 7.589367088607595e-06,
"loss": 0.0002,
"step": 10025
},
{
"epoch": 100.88,
"learning_rate": 7.5830379746835445e-06,
"loss": 0.0001,
"step": 10050
},
{
"epoch": 101.13,
"learning_rate": 7.576708860759494e-06,
"loss": 0.0001,
"step": 10075
},
{
"epoch": 101.38,
"learning_rate": 7.570379746835443e-06,
"loss": 0.0001,
"step": 10100
},
{
"epoch": 101.63,
"learning_rate": 7.564050632911393e-06,
"loss": 0.0001,
"step": 10125
},
{
"epoch": 101.88,
"learning_rate": 7.557721518987342e-06,
"loss": 0.0001,
"step": 10150
},
{
"epoch": 102.13,
"learning_rate": 7.551392405063292e-06,
"loss": 0.0001,
"step": 10175
},
{
"epoch": 102.38,
"learning_rate": 7.545063291139241e-06,
"loss": 0.0001,
"step": 10200
},
{
"epoch": 102.63,
"learning_rate": 7.53873417721519e-06,
"loss": 0.0001,
"step": 10225
},
{
"epoch": 102.89,
"learning_rate": 7.532405063291139e-06,
"loss": 0.0001,
"step": 10250
},
{
"epoch": 103.14,
"learning_rate": 7.5260759493670885e-06,
"loss": 0.0001,
"step": 10275
},
{
"epoch": 103.39,
"learning_rate": 7.519746835443038e-06,
"loss": 0.0,
"step": 10300
},
{
"epoch": 103.64,
"learning_rate": 7.513417721518987e-06,
"loss": 0.0,
"step": 10325
},
{
"epoch": 103.89,
"learning_rate": 7.507088607594938e-06,
"loss": 0.0,
"step": 10350
},
{
"epoch": 104.14,
"learning_rate": 7.500759493670887e-06,
"loss": 0.0001,
"step": 10375
},
{
"epoch": 104.39,
"learning_rate": 7.4944303797468365e-06,
"loss": 0.0,
"step": 10400
},
{
"epoch": 104.64,
"learning_rate": 7.488101265822786e-06,
"loss": 0.0,
"step": 10425
},
{
"epoch": 104.89,
"learning_rate": 7.481772151898735e-06,
"loss": 0.0001,
"step": 10450
},
{
"epoch": 105.14,
"learning_rate": 7.475443037974685e-06,
"loss": 0.0,
"step": 10475
},
{
"epoch": 105.4,
"learning_rate": 7.469113924050634e-06,
"loss": 0.0,
"step": 10500
},
{
"epoch": 105.65,
"learning_rate": 7.462784810126583e-06,
"loss": 0.0,
"step": 10525
},
{
"epoch": 105.9,
"learning_rate": 7.456455696202532e-06,
"loss": 0.0001,
"step": 10550
},
{
"epoch": 106.15,
"learning_rate": 7.450126582278482e-06,
"loss": 0.0,
"step": 10575
},
{
"epoch": 106.4,
"learning_rate": 7.443797468354431e-06,
"loss": 0.0,
"step": 10600
},
{
"epoch": 106.65,
"learning_rate": 7.4374683544303805e-06,
"loss": 0.0,
"step": 10625
},
{
"epoch": 106.9,
"learning_rate": 7.43113924050633e-06,
"loss": 0.0,
"step": 10650
},
{
"epoch": 107.15,
"learning_rate": 7.424810126582279e-06,
"loss": 0.0,
"step": 10675
},
{
"epoch": 107.4,
"learning_rate": 7.418481012658229e-06,
"loss": 0.0,
"step": 10700
},
{
"epoch": 107.65,
"learning_rate": 7.412151898734178e-06,
"loss": 0.0,
"step": 10725
},
{
"epoch": 107.9,
"learning_rate": 7.405822784810127e-06,
"loss": 0.0,
"step": 10750
},
{
"epoch": 108.16,
"learning_rate": 7.399493670886076e-06,
"loss": 0.0,
"step": 10775
},
{
"epoch": 108.41,
"learning_rate": 7.393164556962026e-06,
"loss": 0.0,
"step": 10800
},
{
"epoch": 108.66,
"learning_rate": 7.386835443037975e-06,
"loss": 0.0,
"step": 10825
},
{
"epoch": 108.91,
"learning_rate": 7.3805063291139245e-06,
"loss": 0.0,
"step": 10850
},
{
"epoch": 109.16,
"learning_rate": 7.374177215189874e-06,
"loss": 0.0,
"step": 10875
},
{
"epoch": 109.41,
"learning_rate": 7.367848101265823e-06,
"loss": 0.0,
"step": 10900
},
{
"epoch": 109.66,
"learning_rate": 7.361518987341773e-06,
"loss": 0.0,
"step": 10925
},
{
"epoch": 109.91,
"learning_rate": 7.355189873417722e-06,
"loss": 0.0,
"step": 10950
},
{
"epoch": 110.16,
"learning_rate": 7.348860759493671e-06,
"loss": 0.0,
"step": 10975
},
{
"epoch": 110.41,
"learning_rate": 7.34253164556962e-06,
"loss": 0.0,
"step": 11000
},
{
"epoch": 110.41,
"eval_loss": 0.2905968129634857,
"eval_runtime": 2826.8699,
"eval_samples_per_second": 4.507,
"eval_steps_per_second": 0.282,
"eval_wer": 7.545529154291073,
"step": 11000
},
{
"epoch": 110.66,
"learning_rate": 7.33620253164557e-06,
"loss": 0.0,
"step": 11025
},
{
"epoch": 110.92,
"learning_rate": 7.329873417721519e-06,
"loss": 0.0,
"step": 11050
},
{
"epoch": 111.17,
"learning_rate": 7.3235443037974685e-06,
"loss": 0.0,
"step": 11075
},
{
"epoch": 111.42,
"learning_rate": 7.317215189873418e-06,
"loss": 0.0,
"step": 11100
},
{
"epoch": 111.67,
"learning_rate": 7.310886075949367e-06,
"loss": 0.0,
"step": 11125
},
{
"epoch": 111.92,
"learning_rate": 7.304556962025317e-06,
"loss": 0.0,
"step": 11150
},
{
"epoch": 112.17,
"learning_rate": 7.298227848101267e-06,
"loss": 0.0,
"step": 11175
},
{
"epoch": 112.42,
"learning_rate": 7.2918987341772165e-06,
"loss": 0.0,
"step": 11200
},
{
"epoch": 112.67,
"learning_rate": 7.285569620253166e-06,
"loss": 0.0,
"step": 11225
},
{
"epoch": 112.92,
"learning_rate": 7.2792405063291145e-06,
"loss": 0.0,
"step": 11250
},
{
"epoch": 113.17,
"learning_rate": 7.272911392405064e-06,
"loss": 0.0,
"step": 11275
},
{
"epoch": 113.43,
"learning_rate": 7.266582278481013e-06,
"loss": 0.0,
"step": 11300
},
{
"epoch": 113.68,
"learning_rate": 7.260253164556963e-06,
"loss": 0.0,
"step": 11325
},
{
"epoch": 113.93,
"learning_rate": 7.253924050632912e-06,
"loss": 0.0,
"step": 11350
},
{
"epoch": 114.18,
"learning_rate": 7.247594936708862e-06,
"loss": 0.0,
"step": 11375
},
{
"epoch": 114.43,
"learning_rate": 7.241265822784811e-06,
"loss": 0.0,
"step": 11400
},
{
"epoch": 114.68,
"learning_rate": 7.2349367088607605e-06,
"loss": 0.0,
"step": 11425
},
{
"epoch": 114.93,
"learning_rate": 7.22860759493671e-06,
"loss": 0.0,
"step": 11450
},
{
"epoch": 115.18,
"learning_rate": 7.2222784810126585e-06,
"loss": 0.0,
"step": 11475
},
{
"epoch": 115.43,
"learning_rate": 7.215949367088608e-06,
"loss": 0.0,
"step": 11500
},
{
"epoch": 115.68,
"learning_rate": 7.209620253164557e-06,
"loss": 0.0,
"step": 11525
},
{
"epoch": 115.93,
"learning_rate": 7.203291139240507e-06,
"loss": 0.0,
"step": 11550
},
{
"epoch": 116.19,
"learning_rate": 7.196962025316456e-06,
"loss": 0.0,
"step": 11575
},
{
"epoch": 116.44,
"learning_rate": 7.190632911392406e-06,
"loss": 0.0,
"step": 11600
},
{
"epoch": 116.69,
"learning_rate": 7.184303797468355e-06,
"loss": 0.0,
"step": 11625
},
{
"epoch": 116.94,
"learning_rate": 7.1779746835443045e-06,
"loss": 0.0,
"step": 11650
},
{
"epoch": 117.19,
"learning_rate": 7.171645569620254e-06,
"loss": 0.0,
"step": 11675
},
{
"epoch": 117.44,
"learning_rate": 7.1653164556962025e-06,
"loss": 0.0,
"step": 11700
},
{
"epoch": 117.69,
"learning_rate": 7.158987341772152e-06,
"loss": 0.0,
"step": 11725
},
{
"epoch": 117.94,
"learning_rate": 7.152658227848101e-06,
"loss": 0.0,
"step": 11750
},
{
"epoch": 118.19,
"learning_rate": 7.146329113924051e-06,
"loss": 0.0,
"step": 11775
},
{
"epoch": 118.44,
"learning_rate": 7.14e-06,
"loss": 0.0,
"step": 11800
},
{
"epoch": 118.7,
"learning_rate": 7.13367088607595e-06,
"loss": 0.0,
"step": 11825
},
{
"epoch": 118.95,
"learning_rate": 7.127341772151899e-06,
"loss": 0.0,
"step": 11850
},
{
"epoch": 119.2,
"learning_rate": 7.1210126582278485e-06,
"loss": 0.0,
"step": 11875
},
{
"epoch": 119.45,
"learning_rate": 7.114683544303798e-06,
"loss": 0.0,
"step": 11900
},
{
"epoch": 119.7,
"learning_rate": 7.1083544303797465e-06,
"loss": 0.0,
"step": 11925
},
{
"epoch": 119.95,
"learning_rate": 7.102025316455696e-06,
"loss": 0.0,
"step": 11950
},
{
"epoch": 120.2,
"learning_rate": 7.095696202531647e-06,
"loss": 0.0,
"step": 11975
},
{
"epoch": 120.45,
"learning_rate": 7.089367088607596e-06,
"loss": 0.0,
"step": 12000
},
{
"epoch": 120.45,
"eval_loss": 0.3027211129665375,
"eval_runtime": 2829.6888,
"eval_samples_per_second": 4.503,
"eval_steps_per_second": 0.282,
"eval_wer": 7.459551352196342,
"step": 12000
},
{
"epoch": 120.7,
"learning_rate": 7.083037974683545e-06,
"loss": 0.0,
"step": 12025
},
{
"epoch": 120.95,
"learning_rate": 7.0767088607594945e-06,
"loss": 0.0,
"step": 12050
},
{
"epoch": 121.2,
"learning_rate": 7.070379746835444e-06,
"loss": 0.0,
"step": 12075
},
{
"epoch": 121.46,
"learning_rate": 7.064050632911393e-06,
"loss": 0.0,
"step": 12100
},
{
"epoch": 121.71,
"learning_rate": 7.057721518987343e-06,
"loss": 0.0,
"step": 12125
},
{
"epoch": 121.96,
"learning_rate": 7.051392405063292e-06,
"loss": 0.0,
"step": 12150
},
{
"epoch": 122.21,
"learning_rate": 7.045063291139242e-06,
"loss": 0.0,
"step": 12175
},
{
"epoch": 122.46,
"learning_rate": 7.038734177215191e-06,
"loss": 0.0,
"step": 12200
},
{
"epoch": 122.71,
"learning_rate": 7.03240506329114e-06,
"loss": 0.0,
"step": 12225
},
{
"epoch": 122.96,
"learning_rate": 7.026075949367089e-06,
"loss": 0.0,
"step": 12250
},
{
"epoch": 123.21,
"learning_rate": 7.0197468354430385e-06,
"loss": 0.0,
"step": 12275
},
{
"epoch": 123.46,
"learning_rate": 7.013417721518988e-06,
"loss": 0.0,
"step": 12300
},
{
"epoch": 123.71,
"learning_rate": 7.007088607594937e-06,
"loss": 0.0,
"step": 12325
},
{
"epoch": 123.96,
"learning_rate": 7.000759493670887e-06,
"loss": 0.0,
"step": 12350
},
{
"epoch": 124.22,
"learning_rate": 6.994430379746836e-06,
"loss": 0.0,
"step": 12375
},
{
"epoch": 124.47,
"learning_rate": 6.988101265822786e-06,
"loss": 0.0,
"step": 12400
},
{
"epoch": 124.72,
"learning_rate": 6.981772151898735e-06,
"loss": 0.0,
"step": 12425
},
{
"epoch": 124.97,
"learning_rate": 6.975443037974684e-06,
"loss": 0.0,
"step": 12450
},
{
"epoch": 125.22,
"learning_rate": 6.969113924050633e-06,
"loss": 0.0,
"step": 12475
},
{
"epoch": 125.47,
"learning_rate": 6.9627848101265825e-06,
"loss": 0.0,
"step": 12500
},
{
"epoch": 125.72,
"learning_rate": 6.956455696202532e-06,
"loss": 0.0,
"step": 12525
},
{
"epoch": 125.97,
"learning_rate": 6.950126582278481e-06,
"loss": 0.0,
"step": 12550
},
{
"epoch": 126.22,
"learning_rate": 6.943797468354431e-06,
"loss": 0.0,
"step": 12575
},
{
"epoch": 126.47,
"learning_rate": 6.93746835443038e-06,
"loss": 0.0,
"step": 12600
},
{
"epoch": 126.73,
"learning_rate": 6.93113924050633e-06,
"loss": 0.0,
"step": 12625
},
{
"epoch": 126.98,
"learning_rate": 6.924810126582279e-06,
"loss": 0.0,
"step": 12650
},
{
"epoch": 127.23,
"learning_rate": 6.918481012658228e-06,
"loss": 0.0,
"step": 12675
},
{
"epoch": 127.48,
"learning_rate": 6.912151898734177e-06,
"loss": 0.0,
"step": 12700
},
{
"epoch": 127.73,
"learning_rate": 6.9058227848101265e-06,
"loss": 0.0,
"step": 12725
},
{
"epoch": 127.98,
"learning_rate": 6.899493670886076e-06,
"loss": 0.0,
"step": 12750
},
{
"epoch": 128.23,
"learning_rate": 6.893164556962025e-06,
"loss": 0.0,
"step": 12775
},
{
"epoch": 128.48,
"learning_rate": 6.886835443037976e-06,
"loss": 0.0,
"step": 12800
},
{
"epoch": 128.73,
"learning_rate": 6.880506329113925e-06,
"loss": 0.0,
"step": 12825
},
{
"epoch": 128.98,
"learning_rate": 6.8741772151898745e-06,
"loss": 0.0,
"step": 12850
},
{
"epoch": 129.23,
"learning_rate": 6.867848101265824e-06,
"loss": 0.0,
"step": 12875
},
{
"epoch": 129.49,
"learning_rate": 6.861518987341773e-06,
"loss": 0.0,
"step": 12900
},
{
"epoch": 129.74,
"learning_rate": 6.855189873417723e-06,
"loss": 0.0,
"step": 12925
},
{
"epoch": 129.99,
"learning_rate": 6.848860759493671e-06,
"loss": 0.0,
"step": 12950
},
{
"epoch": 130.24,
"learning_rate": 6.842531645569621e-06,
"loss": 0.0,
"step": 12975
},
{
"epoch": 130.49,
"learning_rate": 6.83620253164557e-06,
"loss": 0.0,
"step": 13000
},
{
"epoch": 130.49,
"eval_loss": 0.31367388367652893,
"eval_runtime": 2826.8322,
"eval_samples_per_second": 4.508,
"eval_steps_per_second": 0.282,
"eval_wer": 7.451735188369549,
"step": 13000
},
{
"epoch": 130.74,
"learning_rate": 6.82987341772152e-06,
"loss": 0.0,
"step": 13025
},
{
"epoch": 130.99,
"learning_rate": 6.823544303797469e-06,
"loss": 0.0,
"step": 13050
},
{
"epoch": 131.24,
"learning_rate": 6.8172151898734185e-06,
"loss": 0.0,
"step": 13075
},
{
"epoch": 131.49,
"learning_rate": 6.810886075949368e-06,
"loss": 0.0,
"step": 13100
},
{
"epoch": 131.74,
"learning_rate": 6.804556962025317e-06,
"loss": 0.0,
"step": 13125
},
{
"epoch": 131.99,
"learning_rate": 6.798227848101267e-06,
"loss": 0.0,
"step": 13150
},
{
"epoch": 132.25,
"learning_rate": 6.791898734177215e-06,
"loss": 0.0,
"step": 13175
},
{
"epoch": 132.5,
"learning_rate": 6.785569620253165e-06,
"loss": 0.0,
"step": 13200
},
{
"epoch": 132.75,
"learning_rate": 6.779240506329114e-06,
"loss": 0.0,
"step": 13225
},
{
"epoch": 133.0,
"learning_rate": 6.772911392405064e-06,
"loss": 0.0,
"step": 13250
},
{
"epoch": 133.25,
"learning_rate": 6.766582278481013e-06,
"loss": 0.0,
"step": 13275
},
{
"epoch": 133.5,
"learning_rate": 6.7602531645569625e-06,
"loss": 0.0,
"step": 13300
},
{
"epoch": 133.75,
"learning_rate": 6.753924050632912e-06,
"loss": 0.0,
"step": 13325
},
{
"epoch": 134.0,
"learning_rate": 6.747594936708861e-06,
"loss": 0.0,
"step": 13350
},
{
"epoch": 134.25,
"learning_rate": 6.741265822784811e-06,
"loss": 0.0,
"step": 13375
},
{
"epoch": 134.5,
"learning_rate": 6.734936708860759e-06,
"loss": 0.0,
"step": 13400
},
{
"epoch": 134.76,
"learning_rate": 6.728607594936709e-06,
"loss": 0.0,
"step": 13425
},
{
"epoch": 135.01,
"learning_rate": 6.722278481012658e-06,
"loss": 0.0,
"step": 13450
},
{
"epoch": 135.26,
"learning_rate": 6.715949367088608e-06,
"loss": 0.0,
"step": 13475
},
{
"epoch": 135.51,
"learning_rate": 6.709620253164557e-06,
"loss": 0.0,
"step": 13500
},
{
"epoch": 135.76,
"learning_rate": 6.7032911392405065e-06,
"loss": 0.0,
"step": 13525
},
{
"epoch": 136.01,
"learning_rate": 6.696962025316456e-06,
"loss": 0.0,
"step": 13550
},
{
"epoch": 136.26,
"learning_rate": 6.690632911392405e-06,
"loss": 0.0,
"step": 13575
},
{
"epoch": 136.51,
"learning_rate": 6.684303797468355e-06,
"loss": 0.0,
"step": 13600
},
{
"epoch": 136.76,
"learning_rate": 6.677974683544305e-06,
"loss": 0.0,
"step": 13625
},
{
"epoch": 137.01,
"learning_rate": 6.6716455696202545e-06,
"loss": 0.0,
"step": 13650
},
{
"epoch": 137.26,
"learning_rate": 6.665316455696204e-06,
"loss": 0.0,
"step": 13675
},
{
"epoch": 137.52,
"learning_rate": 6.6589873417721525e-06,
"loss": 0.0,
"step": 13700
},
{
"epoch": 137.77,
"learning_rate": 6.652658227848102e-06,
"loss": 0.0,
"step": 13725
},
{
"epoch": 138.02,
"learning_rate": 6.646329113924051e-06,
"loss": 0.0,
"step": 13750
},
{
"epoch": 138.27,
"learning_rate": 6.640000000000001e-06,
"loss": 0.0,
"step": 13775
},
{
"epoch": 138.52,
"learning_rate": 6.63367088607595e-06,
"loss": 0.0,
"step": 13800
},
{
"epoch": 138.77,
"learning_rate": 6.6273417721519e-06,
"loss": 0.0,
"step": 13825
},
{
"epoch": 139.02,
"learning_rate": 6.621012658227849e-06,
"loss": 0.0,
"step": 13850
},
{
"epoch": 139.27,
"learning_rate": 6.6146835443037985e-06,
"loss": 0.0,
"step": 13875
},
{
"epoch": 139.52,
"learning_rate": 6.608354430379748e-06,
"loss": 0.0,
"step": 13900
},
{
"epoch": 139.77,
"learning_rate": 6.6020253164556965e-06,
"loss": 0.0,
"step": 13925
},
{
"epoch": 140.03,
"learning_rate": 6.595696202531646e-06,
"loss": 0.0,
"step": 13950
},
{
"epoch": 140.28,
"learning_rate": 6.589367088607595e-06,
"loss": 0.0,
"step": 13975
},
{
"epoch": 140.53,
"learning_rate": 6.583037974683545e-06,
"loss": 0.0,
"step": 14000
},
{
"epoch": 140.53,
"eval_loss": 0.32425281405448914,
"eval_runtime": 2828.1904,
"eval_samples_per_second": 4.505,
"eval_steps_per_second": 0.282,
"eval_wer": 7.464436454588089,
"step": 14000
},
{
"epoch": 140.78,
"learning_rate": 6.576708860759494e-06,
"loss": 0.0,
"step": 14025
},
{
"epoch": 141.03,
"learning_rate": 6.570379746835444e-06,
"loss": 0.0,
"step": 14050
},
{
"epoch": 141.28,
"learning_rate": 6.564050632911393e-06,
"loss": 0.0,
"step": 14075
},
{
"epoch": 141.53,
"learning_rate": 6.5577215189873425e-06,
"loss": 0.0,
"step": 14100
},
{
"epoch": 141.78,
"learning_rate": 6.551392405063292e-06,
"loss": 0.0,
"step": 14125
},
{
"epoch": 142.03,
"learning_rate": 6.5450632911392405e-06,
"loss": 0.0,
"step": 14150
},
{
"epoch": 142.28,
"learning_rate": 6.53873417721519e-06,
"loss": 0.0,
"step": 14175
},
{
"epoch": 142.53,
"learning_rate": 6.532405063291139e-06,
"loss": 0.0,
"step": 14200
},
{
"epoch": 142.79,
"learning_rate": 6.526075949367089e-06,
"loss": 0.0,
"step": 14225
},
{
"epoch": 143.04,
"learning_rate": 6.519746835443038e-06,
"loss": 0.0,
"step": 14250
},
{
"epoch": 143.29,
"learning_rate": 6.513417721518988e-06,
"loss": 0.0,
"step": 14275
},
{
"epoch": 143.54,
"learning_rate": 6.507088607594937e-06,
"loss": 0.0,
"step": 14300
},
{
"epoch": 143.79,
"learning_rate": 6.5007594936708865e-06,
"loss": 0.0,
"step": 14325
},
{
"epoch": 144.04,
"learning_rate": 6.494430379746836e-06,
"loss": 0.0,
"step": 14350
},
{
"epoch": 144.29,
"learning_rate": 6.4881012658227845e-06,
"loss": 0.0,
"step": 14375
},
{
"epoch": 144.54,
"learning_rate": 6.481772151898734e-06,
"loss": 0.0,
"step": 14400
},
{
"epoch": 144.79,
"learning_rate": 6.475443037974683e-06,
"loss": 0.0,
"step": 14425
},
{
"epoch": 145.04,
"learning_rate": 6.469113924050634e-06,
"loss": 0.0,
"step": 14450
},
{
"epoch": 145.29,
"learning_rate": 6.462784810126583e-06,
"loss": 0.0,
"step": 14475
},
{
"epoch": 145.55,
"learning_rate": 6.4564556962025325e-06,
"loss": 0.0,
"step": 14500
},
{
"epoch": 145.8,
"learning_rate": 6.450126582278482e-06,
"loss": 0.0,
"step": 14525
},
{
"epoch": 146.05,
"learning_rate": 6.443797468354431e-06,
"loss": 0.0,
"step": 14550
},
{
"epoch": 146.3,
"learning_rate": 6.437468354430381e-06,
"loss": 0.0,
"step": 14575
},
{
"epoch": 146.55,
"learning_rate": 6.43113924050633e-06,
"loss": 0.0,
"step": 14600
},
{
"epoch": 146.8,
"learning_rate": 6.42481012658228e-06,
"loss": 0.0,
"step": 14625
},
{
"epoch": 147.05,
"learning_rate": 6.418481012658228e-06,
"loss": 0.0,
"step": 14650
},
{
"epoch": 147.3,
"learning_rate": 6.412151898734178e-06,
"loss": 0.0,
"step": 14675
},
{
"epoch": 147.55,
"learning_rate": 6.405822784810127e-06,
"loss": 0.0,
"step": 14700
},
{
"epoch": 147.8,
"learning_rate": 6.3994936708860765e-06,
"loss": 0.0,
"step": 14725
},
{
"epoch": 148.06,
"learning_rate": 6.393164556962026e-06,
"loss": 0.0,
"step": 14750
},
{
"epoch": 148.31,
"learning_rate": 6.386835443037975e-06,
"loss": 0.0,
"step": 14775
},
{
"epoch": 148.56,
"learning_rate": 6.380506329113925e-06,
"loss": 0.0,
"step": 14800
},
{
"epoch": 148.81,
"learning_rate": 6.374177215189874e-06,
"loss": 0.0,
"step": 14825
},
{
"epoch": 149.06,
"learning_rate": 6.367848101265824e-06,
"loss": 0.0,
"step": 14850
},
{
"epoch": 149.31,
"learning_rate": 6.361518987341772e-06,
"loss": 0.0,
"step": 14875
},
{
"epoch": 149.56,
"learning_rate": 6.355189873417722e-06,
"loss": 0.0,
"step": 14900
},
{
"epoch": 149.81,
"learning_rate": 6.348860759493671e-06,
"loss": 0.0,
"step": 14925
},
{
"epoch": 150.06,
"learning_rate": 6.3425316455696205e-06,
"loss": 0.0,
"step": 14950
},
{
"epoch": 150.31,
"learning_rate": 6.33620253164557e-06,
"loss": 0.0,
"step": 14975
},
{
"epoch": 150.56,
"learning_rate": 6.329873417721519e-06,
"loss": 0.0,
"step": 15000
},
{
"epoch": 150.56,
"eval_loss": 0.3350587785243988,
"eval_runtime": 2827.6479,
"eval_samples_per_second": 4.506,
"eval_steps_per_second": 0.282,
"eval_wer": 7.476160700328278,
"step": 15000
},
{
"epoch": 150.82,
"learning_rate": 6.323544303797469e-06,
"loss": 0.0,
"step": 15025
},
{
"epoch": 151.07,
"learning_rate": 6.317215189873418e-06,
"loss": 0.0,
"step": 15050
},
{
"epoch": 151.32,
"learning_rate": 6.310886075949368e-06,
"loss": 0.0,
"step": 15075
},
{
"epoch": 151.57,
"learning_rate": 6.304556962025316e-06,
"loss": 0.0,
"step": 15100
},
{
"epoch": 151.82,
"learning_rate": 6.298227848101266e-06,
"loss": 0.0,
"step": 15125
},
{
"epoch": 152.07,
"learning_rate": 6.291898734177215e-06,
"loss": 0.0,
"step": 15150
},
{
"epoch": 152.32,
"learning_rate": 6.2855696202531645e-06,
"loss": 0.0,
"step": 15175
},
{
"epoch": 152.57,
"learning_rate": 6.279240506329114e-06,
"loss": 0.0,
"step": 15200
},
{
"epoch": 152.82,
"learning_rate": 6.272911392405063e-06,
"loss": 0.0,
"step": 15225
},
{
"epoch": 153.07,
"learning_rate": 6.266582278481013e-06,
"loss": 0.0,
"step": 15250
},
{
"epoch": 153.32,
"learning_rate": 6.260253164556963e-06,
"loss": 0.0,
"step": 15275
},
{
"epoch": 153.58,
"learning_rate": 6.2539240506329125e-06,
"loss": 0.0,
"step": 15300
},
{
"epoch": 153.83,
"learning_rate": 6.247594936708862e-06,
"loss": 0.0,
"step": 15325
},
{
"epoch": 154.08,
"learning_rate": 6.241265822784811e-06,
"loss": 0.0,
"step": 15350
},
{
"epoch": 154.33,
"learning_rate": 6.234936708860761e-06,
"loss": 0.0,
"step": 15375
},
{
"epoch": 154.58,
"learning_rate": 6.228607594936709e-06,
"loss": 0.0,
"step": 15400
},
{
"epoch": 154.83,
"learning_rate": 6.222278481012659e-06,
"loss": 0.0,
"step": 15425
},
{
"epoch": 155.08,
"learning_rate": 6.215949367088608e-06,
"loss": 0.0,
"step": 15450
},
{
"epoch": 155.33,
"learning_rate": 6.209620253164558e-06,
"loss": 0.0,
"step": 15475
},
{
"epoch": 155.58,
"learning_rate": 6.203291139240507e-06,
"loss": 0.0,
"step": 15500
},
{
"epoch": 155.83,
"learning_rate": 6.1969620253164565e-06,
"loss": 0.0,
"step": 15525
},
{
"epoch": 156.09,
"learning_rate": 6.190632911392406e-06,
"loss": 0.0,
"step": 15550
},
{
"epoch": 156.34,
"learning_rate": 6.184303797468355e-06,
"loss": 0.0,
"step": 15575
},
{
"epoch": 156.59,
"learning_rate": 6.177974683544305e-06,
"loss": 0.0,
"step": 15600
},
{
"epoch": 156.84,
"learning_rate": 6.171645569620253e-06,
"loss": 0.0,
"step": 15625
},
{
"epoch": 157.09,
"learning_rate": 6.165316455696203e-06,
"loss": 0.0,
"step": 15650
},
{
"epoch": 157.34,
"learning_rate": 6.158987341772152e-06,
"loss": 0.0,
"step": 15675
},
{
"epoch": 157.59,
"learning_rate": 6.152658227848102e-06,
"loss": 0.0,
"step": 15700
},
{
"epoch": 157.84,
"learning_rate": 6.146329113924051e-06,
"loss": 0.0,
"step": 15725
},
{
"epoch": 158.09,
"learning_rate": 6.1400000000000005e-06,
"loss": 0.0,
"step": 15750
},
{
"epoch": 158.34,
"learning_rate": 6.13367088607595e-06,
"loss": 0.0,
"step": 15775
},
{
"epoch": 158.59,
"learning_rate": 6.127341772151899e-06,
"loss": 0.0,
"step": 15800
},
{
"epoch": 158.85,
"learning_rate": 6.121012658227849e-06,
"loss": 0.0,
"step": 15825
},
{
"epoch": 159.1,
"learning_rate": 6.114683544303797e-06,
"loss": 0.0,
"step": 15850
},
{
"epoch": 159.35,
"learning_rate": 6.108354430379747e-06,
"loss": 0.0,
"step": 15875
},
{
"epoch": 159.6,
"learning_rate": 6.102025316455696e-06,
"loss": 0.0,
"step": 15900
},
{
"epoch": 159.85,
"learning_rate": 6.095696202531646e-06,
"loss": 0.0,
"step": 15925
},
{
"epoch": 160.1,
"learning_rate": 6.089367088607595e-06,
"loss": 0.0,
"step": 15950
},
{
"epoch": 160.35,
"learning_rate": 6.0830379746835445e-06,
"loss": 0.0,
"step": 15975
},
{
"epoch": 160.6,
"learning_rate": 6.076708860759494e-06,
"loss": 0.0,
"step": 16000
},
{
"epoch": 160.6,
"eval_loss": 0.3459363281726837,
"eval_runtime": 2825.2813,
"eval_samples_per_second": 4.51,
"eval_steps_per_second": 0.282,
"eval_wer": 7.455643270282946,
"step": 16000
},
{
"epoch": 160.85,
"learning_rate": 6.070379746835443e-06,
"loss": 0.0,
"step": 16025
},
{
"epoch": 161.1,
"learning_rate": 6.064050632911393e-06,
"loss": 0.0,
"step": 16050
},
{
"epoch": 161.36,
"learning_rate": 6.057721518987341e-06,
"loss": 0.0,
"step": 16075
},
{
"epoch": 161.61,
"learning_rate": 6.0513924050632925e-06,
"loss": 0.0,
"step": 16100
},
{
"epoch": 161.86,
"learning_rate": 6.045063291139242e-06,
"loss": 0.0,
"step": 16125
},
{
"epoch": 162.11,
"learning_rate": 6.0387341772151905e-06,
"loss": 0.0,
"step": 16150
},
{
"epoch": 162.36,
"learning_rate": 6.03240506329114e-06,
"loss": 0.0,
"step": 16175
},
{
"epoch": 162.61,
"learning_rate": 6.026075949367089e-06,
"loss": 0.0,
"step": 16200
},
{
"epoch": 162.86,
"learning_rate": 6.019746835443039e-06,
"loss": 0.0,
"step": 16225
},
{
"epoch": 163.11,
"learning_rate": 6.013417721518988e-06,
"loss": 0.0,
"step": 16250
},
{
"epoch": 163.36,
"learning_rate": 6.007088607594938e-06,
"loss": 0.0,
"step": 16275
},
{
"epoch": 163.61,
"learning_rate": 6.000759493670887e-06,
"loss": 0.0,
"step": 16300
},
{
"epoch": 163.86,
"learning_rate": 5.9944303797468365e-06,
"loss": 0.0,
"step": 16325
},
{
"epoch": 164.12,
"learning_rate": 5.988101265822786e-06,
"loss": 0.0,
"step": 16350
},
{
"epoch": 164.37,
"learning_rate": 5.9817721518987345e-06,
"loss": 0.0,
"step": 16375
},
{
"epoch": 164.62,
"learning_rate": 5.975443037974684e-06,
"loss": 0.0,
"step": 16400
},
{
"epoch": 164.87,
"learning_rate": 5.969113924050633e-06,
"loss": 0.0,
"step": 16425
},
{
"epoch": 165.12,
"learning_rate": 5.962784810126583e-06,
"loss": 0.0,
"step": 16450
},
{
"epoch": 165.37,
"learning_rate": 5.956455696202532e-06,
"loss": 0.0,
"step": 16475
},
{
"epoch": 165.62,
"learning_rate": 5.950126582278482e-06,
"loss": 0.0,
"step": 16500
},
{
"epoch": 165.87,
"learning_rate": 5.943797468354431e-06,
"loss": 0.0,
"step": 16525
},
{
"epoch": 166.12,
"learning_rate": 5.9374683544303805e-06,
"loss": 0.0,
"step": 16550
},
{
"epoch": 166.37,
"learning_rate": 5.931139240506329e-06,
"loss": 0.0,
"step": 16575
},
{
"epoch": 166.62,
"learning_rate": 5.9248101265822785e-06,
"loss": 0.0,
"step": 16600
},
{
"epoch": 166.88,
"learning_rate": 5.918481012658228e-06,
"loss": 0.0,
"step": 16625
},
{
"epoch": 167.13,
"learning_rate": 5.912151898734177e-06,
"loss": 0.0,
"step": 16650
},
{
"epoch": 167.38,
"learning_rate": 5.905822784810127e-06,
"loss": 0.0,
"step": 16675
},
{
"epoch": 167.63,
"learning_rate": 5.899493670886076e-06,
"loss": 0.0,
"step": 16700
},
{
"epoch": 167.88,
"learning_rate": 5.893164556962026e-06,
"loss": 0.0,
"step": 16725
},
{
"epoch": 168.13,
"learning_rate": 5.886835443037975e-06,
"loss": 0.0,
"step": 16750
},
{
"epoch": 168.38,
"learning_rate": 5.8805063291139245e-06,
"loss": 0.0,
"step": 16775
},
{
"epoch": 168.63,
"learning_rate": 5.874177215189873e-06,
"loss": 0.0,
"step": 16800
},
{
"epoch": 168.88,
"learning_rate": 5.8678481012658225e-06,
"loss": 0.0,
"step": 16825
},
{
"epoch": 169.13,
"learning_rate": 5.861518987341772e-06,
"loss": 0.0,
"step": 16850
},
{
"epoch": 169.39,
"learning_rate": 5.855189873417721e-06,
"loss": 0.0,
"step": 16875
},
{
"epoch": 169.64,
"learning_rate": 5.848860759493671e-06,
"loss": 0.0,
"step": 16900
},
{
"epoch": 169.89,
"learning_rate": 5.842531645569621e-06,
"loss": 0.0,
"step": 16925
},
{
"epoch": 170.14,
"learning_rate": 5.8362025316455705e-06,
"loss": 0.0,
"step": 16950
},
{
"epoch": 170.39,
"learning_rate": 5.82987341772152e-06,
"loss": 0.0,
"step": 16975
},
{
"epoch": 170.64,
"learning_rate": 5.823544303797469e-06,
"loss": 0.0,
"step": 17000
},
{
"epoch": 170.64,
"eval_loss": 0.35653552412986755,
"eval_runtime": 2825.8367,
"eval_samples_per_second": 4.509,
"eval_steps_per_second": 0.282,
"eval_wer": 7.460528372674691,
"step": 17000
},
{
"epoch": 170.89,
"learning_rate": 5.817215189873419e-06,
"loss": 0.0,
"step": 17025
},
{
"epoch": 171.14,
"learning_rate": 5.810886075949368e-06,
"loss": 0.0,
"step": 17050
},
{
"epoch": 171.39,
"learning_rate": 5.804556962025318e-06,
"loss": 0.0,
"step": 17075
},
{
"epoch": 171.64,
"learning_rate": 5.798227848101266e-06,
"loss": 0.0,
"step": 17100
},
{
"epoch": 171.89,
"learning_rate": 5.791898734177216e-06,
"loss": 0.0,
"step": 17125
},
{
"epoch": 172.15,
"learning_rate": 5.785569620253165e-06,
"loss": 0.0,
"step": 17150
},
{
"epoch": 172.4,
"learning_rate": 5.7792405063291145e-06,
"loss": 0.0,
"step": 17175
},
{
"epoch": 172.65,
"learning_rate": 5.772911392405064e-06,
"loss": 0.0,
"step": 17200
},
{
"epoch": 172.9,
"learning_rate": 5.766582278481013e-06,
"loss": 0.0,
"step": 17225
},
{
"epoch": 173.15,
"learning_rate": 5.760253164556963e-06,
"loss": 0.0,
"step": 17250
},
{
"epoch": 173.4,
"learning_rate": 5.753924050632912e-06,
"loss": 0.0,
"step": 17275
},
{
"epoch": 173.65,
"learning_rate": 5.747594936708862e-06,
"loss": 0.0,
"step": 17300
},
{
"epoch": 173.9,
"learning_rate": 5.74126582278481e-06,
"loss": 0.0,
"step": 17325
},
{
"epoch": 174.15,
"learning_rate": 5.73493670886076e-06,
"loss": 0.0,
"step": 17350
},
{
"epoch": 174.4,
"learning_rate": 5.728607594936709e-06,
"loss": 0.0,
"step": 17375
},
{
"epoch": 174.65,
"learning_rate": 5.7222784810126585e-06,
"loss": 0.0,
"step": 17400
},
{
"epoch": 174.91,
"learning_rate": 5.715949367088608e-06,
"loss": 0.0,
"step": 17425
},
{
"epoch": 175.16,
"learning_rate": 5.709620253164557e-06,
"loss": 0.0,
"step": 17450
},
{
"epoch": 175.41,
"learning_rate": 5.703291139240507e-06,
"loss": 0.0,
"step": 17475
},
{
"epoch": 175.66,
"learning_rate": 5.696962025316456e-06,
"loss": 0.0,
"step": 17500
},
{
"epoch": 175.91,
"learning_rate": 5.690632911392406e-06,
"loss": 0.0,
"step": 17525
},
{
"epoch": 176.16,
"learning_rate": 5.684303797468354e-06,
"loss": 0.0,
"step": 17550
},
{
"epoch": 176.41,
"learning_rate": 5.677974683544304e-06,
"loss": 0.0,
"step": 17575
},
{
"epoch": 176.66,
"learning_rate": 5.671645569620253e-06,
"loss": 0.0,
"step": 17600
},
{
"epoch": 176.91,
"learning_rate": 5.6653164556962025e-06,
"loss": 0.0,
"step": 17625
},
{
"epoch": 177.16,
"learning_rate": 5.658987341772152e-06,
"loss": 0.0,
"step": 17650
},
{
"epoch": 177.42,
"learning_rate": 5.652658227848101e-06,
"loss": 0.0,
"step": 17675
},
{
"epoch": 177.67,
"learning_rate": 5.646329113924051e-06,
"loss": 0.0,
"step": 17700
},
{
"epoch": 177.92,
"learning_rate": 5.64e-06,
"loss": 0.0,
"step": 17725
},
{
"epoch": 178.17,
"learning_rate": 5.6336708860759505e-06,
"loss": 0.0,
"step": 17750
},
{
"epoch": 178.42,
"learning_rate": 5.6273417721519e-06,
"loss": 0.0,
"step": 17775
},
{
"epoch": 178.67,
"learning_rate": 5.621012658227849e-06,
"loss": 0.0,
"step": 17800
},
{
"epoch": 178.92,
"learning_rate": 5.614683544303799e-06,
"loss": 0.0,
"step": 17825
},
{
"epoch": 179.17,
"learning_rate": 5.608354430379747e-06,
"loss": 0.0,
"step": 17850
},
{
"epoch": 179.42,
"learning_rate": 5.602025316455697e-06,
"loss": 0.0,
"step": 17875
},
{
"epoch": 179.67,
"learning_rate": 5.595696202531646e-06,
"loss": 0.0,
"step": 17900
},
{
"epoch": 179.92,
"learning_rate": 5.589367088607596e-06,
"loss": 0.0,
"step": 17925
},
{
"epoch": 180.18,
"learning_rate": 5.583037974683545e-06,
"loss": 0.0,
"step": 17950
},
{
"epoch": 180.43,
"learning_rate": 5.5767088607594945e-06,
"loss": 0.0,
"step": 17975
},
{
"epoch": 180.68,
"learning_rate": 5.570379746835444e-06,
"loss": 0.0,
"step": 18000
},
{
"epoch": 180.68,
"eval_loss": 0.36885330080986023,
"eval_runtime": 2834.4693,
"eval_samples_per_second": 4.495,
"eval_steps_per_second": 0.281,
"eval_wer": 7.499609191808661,
"step": 18000
},
{
"epoch": 180.93,
"learning_rate": 5.564050632911393e-06,
"loss": 0.0,
"step": 18025
},
{
"epoch": 181.18,
"learning_rate": 5.557721518987343e-06,
"loss": 0.0,
"step": 18050
},
{
"epoch": 181.43,
"learning_rate": 5.551392405063291e-06,
"loss": 0.0,
"step": 18075
},
{
"epoch": 181.68,
"learning_rate": 5.545063291139241e-06,
"loss": 0.0,
"step": 18100
},
{
"epoch": 181.93,
"learning_rate": 5.53873417721519e-06,
"loss": 0.0,
"step": 18125
},
{
"epoch": 182.18,
"learning_rate": 5.53240506329114e-06,
"loss": 0.0,
"step": 18150
},
{
"epoch": 182.43,
"learning_rate": 5.526075949367089e-06,
"loss": 0.0,
"step": 18175
},
{
"epoch": 182.69,
"learning_rate": 5.5197468354430385e-06,
"loss": 0.0,
"step": 18200
},
{
"epoch": 182.94,
"learning_rate": 5.513417721518988e-06,
"loss": 0.0,
"step": 18225
},
{
"epoch": 183.19,
"learning_rate": 5.507088607594937e-06,
"loss": 0.0,
"step": 18250
},
{
"epoch": 183.44,
"learning_rate": 5.500759493670887e-06,
"loss": 0.0,
"step": 18275
},
{
"epoch": 183.69,
"learning_rate": 5.494430379746835e-06,
"loss": 0.0,
"step": 18300
},
{
"epoch": 183.94,
"learning_rate": 5.488101265822785e-06,
"loss": 0.0,
"step": 18325
},
{
"epoch": 184.19,
"learning_rate": 5.481772151898734e-06,
"loss": 0.0,
"step": 18350
},
{
"epoch": 184.44,
"learning_rate": 5.475443037974684e-06,
"loss": 0.0,
"step": 18375
},
{
"epoch": 184.69,
"learning_rate": 5.469113924050633e-06,
"loss": 0.0,
"step": 18400
},
{
"epoch": 184.94,
"learning_rate": 5.4627848101265825e-06,
"loss": 0.0,
"step": 18425
},
{
"epoch": 185.19,
"learning_rate": 5.456455696202532e-06,
"loss": 0.0,
"step": 18450
},
{
"epoch": 185.45,
"learning_rate": 5.450126582278481e-06,
"loss": 0.0,
"step": 18475
},
{
"epoch": 185.7,
"learning_rate": 5.44379746835443e-06,
"loss": 0.0,
"step": 18500
},
{
"epoch": 185.95,
"learning_rate": 5.437468354430379e-06,
"loss": 0.0,
"step": 18525
},
{
"epoch": 186.2,
"learning_rate": 5.431139240506329e-06,
"loss": 0.0,
"step": 18550
},
{
"epoch": 186.45,
"learning_rate": 5.424810126582279e-06,
"loss": 0.0,
"step": 18575
},
{
"epoch": 186.7,
"learning_rate": 5.4184810126582285e-06,
"loss": 0.0,
"step": 18600
},
{
"epoch": 186.95,
"learning_rate": 5.412151898734178e-06,
"loss": 0.0,
"step": 18625
},
{
"epoch": 187.2,
"learning_rate": 5.405822784810127e-06,
"loss": 0.0,
"step": 18650
},
{
"epoch": 187.45,
"learning_rate": 5.399493670886077e-06,
"loss": 0.0,
"step": 18675
},
{
"epoch": 187.7,
"learning_rate": 5.393164556962026e-06,
"loss": 0.0,
"step": 18700
},
{
"epoch": 187.95,
"learning_rate": 5.386835443037976e-06,
"loss": 0.0,
"step": 18725
},
{
"epoch": 188.21,
"learning_rate": 5.380506329113925e-06,
"loss": 0.0,
"step": 18750
},
{
"epoch": 188.46,
"learning_rate": 5.3741772151898745e-06,
"loss": 0.0,
"step": 18775
},
{
"epoch": 188.71,
"learning_rate": 5.367848101265823e-06,
"loss": 0.0,
"step": 18800
},
{
"epoch": 188.96,
"learning_rate": 5.3615189873417725e-06,
"loss": 0.0,
"step": 18825
},
{
"epoch": 189.21,
"learning_rate": 5.355189873417722e-06,
"loss": 0.0,
"step": 18850
},
{
"epoch": 189.46,
"learning_rate": 5.348860759493671e-06,
"loss": 0.0,
"step": 18875
},
{
"epoch": 189.71,
"learning_rate": 5.342531645569621e-06,
"loss": 0.0,
"step": 18900
},
{
"epoch": 189.96,
"learning_rate": 5.33620253164557e-06,
"loss": 0.0,
"step": 18925
},
{
"epoch": 190.21,
"learning_rate": 5.32987341772152e-06,
"loss": 0.0,
"step": 18950
},
{
"epoch": 190.46,
"learning_rate": 5.323544303797469e-06,
"loss": 0.0,
"step": 18975
},
{
"epoch": 190.72,
"learning_rate": 5.3172151898734185e-06,
"loss": 0.0,
"step": 19000
},
{
"epoch": 190.72,
"eval_loss": 0.38055649399757385,
"eval_runtime": 2838.3594,
"eval_samples_per_second": 4.489,
"eval_steps_per_second": 0.281,
"eval_wer": 7.593403157730186,
"step": 19000
},
{
"epoch": 190.97,
"learning_rate": 5.310886075949367e-06,
"loss": 0.0,
"step": 19025
},
{
"epoch": 191.22,
"learning_rate": 5.3045569620253165e-06,
"loss": 0.0,
"step": 19050
},
{
"epoch": 191.47,
"learning_rate": 5.298227848101266e-06,
"loss": 0.0,
"step": 19075
},
{
"epoch": 191.72,
"learning_rate": 5.291898734177215e-06,
"loss": 0.0,
"step": 19100
},
{
"epoch": 191.97,
"learning_rate": 5.285569620253165e-06,
"loss": 0.0,
"step": 19125
},
{
"epoch": 192.22,
"learning_rate": 5.279240506329114e-06,
"loss": 0.0,
"step": 19150
},
{
"epoch": 192.47,
"learning_rate": 5.272911392405064e-06,
"loss": 0.0,
"step": 19175
},
{
"epoch": 192.72,
"learning_rate": 5.266582278481013e-06,
"loss": 0.0,
"step": 19200
},
{
"epoch": 192.97,
"learning_rate": 5.2602531645569625e-06,
"loss": 0.0,
"step": 19225
},
{
"epoch": 193.22,
"learning_rate": 5.253924050632911e-06,
"loss": 0.0,
"step": 19250
},
{
"epoch": 193.48,
"learning_rate": 5.2475949367088605e-06,
"loss": 0.0,
"step": 19275
},
{
"epoch": 193.73,
"learning_rate": 5.24126582278481e-06,
"loss": 0.0,
"step": 19300
},
{
"epoch": 193.98,
"learning_rate": 5.234936708860759e-06,
"loss": 0.0,
"step": 19325
},
{
"epoch": 194.23,
"learning_rate": 5.228607594936709e-06,
"loss": 0.0,
"step": 19350
},
{
"epoch": 194.48,
"learning_rate": 5.222278481012658e-06,
"loss": 0.0,
"step": 19375
},
{
"epoch": 194.73,
"learning_rate": 5.2159493670886085e-06,
"loss": 0.0,
"step": 19400
},
{
"epoch": 194.98,
"learning_rate": 5.209620253164558e-06,
"loss": 0.0,
"step": 19425
},
{
"epoch": 195.23,
"learning_rate": 5.203291139240507e-06,
"loss": 0.0,
"step": 19450
},
{
"epoch": 195.48,
"learning_rate": 5.196962025316457e-06,
"loss": 0.0,
"step": 19475
},
{
"epoch": 195.73,
"learning_rate": 5.190632911392406e-06,
"loss": 0.0,
"step": 19500
},
{
"epoch": 195.98,
"learning_rate": 5.184303797468356e-06,
"loss": 0.0,
"step": 19525
},
{
"epoch": 196.24,
"learning_rate": 5.177974683544304e-06,
"loss": 0.0,
"step": 19550
},
{
"epoch": 196.49,
"learning_rate": 5.171645569620254e-06,
"loss": 0.0,
"step": 19575
},
{
"epoch": 196.74,
"learning_rate": 5.165316455696203e-06,
"loss": 0.0,
"step": 19600
},
{
"epoch": 196.99,
"learning_rate": 5.1589873417721525e-06,
"loss": 0.0,
"step": 19625
},
{
"epoch": 197.24,
"learning_rate": 5.152911392405063e-06,
"loss": 0.0,
"step": 19650
},
{
"epoch": 197.49,
"learning_rate": 5.1465822784810125e-06,
"loss": 0.0,
"step": 19675
},
{
"epoch": 197.74,
"learning_rate": 5.140253164556962e-06,
"loss": 0.0,
"step": 19700
},
{
"epoch": 197.99,
"learning_rate": 5.133924050632911e-06,
"loss": 0.0,
"step": 19725
},
{
"epoch": 198.24,
"learning_rate": 5.127594936708861e-06,
"loss": 0.0,
"step": 19750
},
{
"epoch": 198.49,
"learning_rate": 5.12126582278481e-06,
"loss": 0.0,
"step": 19775
},
{
"epoch": 198.75,
"learning_rate": 5.1149367088607605e-06,
"loss": 0.0,
"step": 19800
},
{
"epoch": 199.0,
"learning_rate": 5.10860759493671e-06,
"loss": 0.0,
"step": 19825
},
{
"epoch": 199.25,
"learning_rate": 5.102278481012659e-06,
"loss": 0.0,
"step": 19850
},
{
"epoch": 199.5,
"learning_rate": 5.095949367088609e-06,
"loss": 0.0,
"step": 19875
},
{
"epoch": 199.75,
"learning_rate": 5.089620253164557e-06,
"loss": 0.0,
"step": 19900
},
{
"epoch": 200.0,
"learning_rate": 5.083291139240507e-06,
"loss": 0.0,
"step": 19925
},
{
"epoch": 200.25,
"learning_rate": 5.076962025316456e-06,
"loss": 0.0,
"step": 19950
},
{
"epoch": 200.5,
"learning_rate": 5.070632911392406e-06,
"loss": 0.0,
"step": 19975
},
{
"epoch": 200.75,
"learning_rate": 5.064303797468355e-06,
"loss": 0.0,
"step": 20000
},
{
"epoch": 200.75,
"eval_loss": 0.3912152349948883,
"eval_runtime": 2832.4168,
"eval_samples_per_second": 4.499,
"eval_steps_per_second": 0.281,
"eval_wer": 7.6344380178208535,
"step": 20000
},
{
"epoch": 201.0,
"learning_rate": 5.0579746835443045e-06,
"loss": 0.0,
"step": 20025
},
{
"epoch": 201.25,
"learning_rate": 5.051645569620254e-06,
"loss": 0.0,
"step": 20050
},
{
"epoch": 201.51,
"learning_rate": 5.045316455696203e-06,
"loss": 0.0,
"step": 20075
},
{
"epoch": 201.76,
"learning_rate": 5.038987341772153e-06,
"loss": 0.0,
"step": 20100
},
{
"epoch": 202.01,
"learning_rate": 5.032658227848101e-06,
"loss": 0.0,
"step": 20125
},
{
"epoch": 202.26,
"learning_rate": 5.026329113924051e-06,
"loss": 0.0,
"step": 20150
},
{
"epoch": 202.51,
"learning_rate": 5.02e-06,
"loss": 0.0,
"step": 20175
},
{
"epoch": 202.76,
"learning_rate": 5.01367088607595e-06,
"loss": 0.0,
"step": 20200
},
{
"epoch": 203.01,
"learning_rate": 5.007341772151899e-06,
"loss": 0.0,
"step": 20225
},
{
"epoch": 203.26,
"learning_rate": 5.0010126582278485e-06,
"loss": 0.0,
"step": 20250
},
{
"epoch": 203.51,
"learning_rate": 4.994683544303798e-06,
"loss": 0.0,
"step": 20275
},
{
"epoch": 203.76,
"learning_rate": 4.988354430379747e-06,
"loss": 0.0,
"step": 20300
},
{
"epoch": 204.02,
"learning_rate": 4.982025316455697e-06,
"loss": 0.0,
"step": 20325
},
{
"epoch": 204.27,
"learning_rate": 4.975696202531645e-06,
"loss": 0.0,
"step": 20350
},
{
"epoch": 204.52,
"learning_rate": 4.969367088607595e-06,
"loss": 0.0,
"step": 20375
},
{
"epoch": 204.77,
"learning_rate": 4.963037974683545e-06,
"loss": 0.0,
"step": 20400
},
{
"epoch": 205.02,
"learning_rate": 4.9567088607594945e-06,
"loss": 0.0,
"step": 20425
},
{
"epoch": 205.27,
"learning_rate": 4.950379746835444e-06,
"loss": 0.0,
"step": 20450
},
{
"epoch": 205.52,
"learning_rate": 4.944050632911393e-06,
"loss": 0.0,
"step": 20475
},
{
"epoch": 205.77,
"learning_rate": 4.937721518987342e-06,
"loss": 0.0,
"step": 20500
},
{
"epoch": 206.02,
"learning_rate": 4.931392405063291e-06,
"loss": 0.0,
"step": 20525
},
{
"epoch": 206.27,
"learning_rate": 4.925063291139241e-06,
"loss": 0.0,
"step": 20550
},
{
"epoch": 206.52,
"learning_rate": 4.91873417721519e-06,
"loss": 0.0,
"step": 20575
},
{
"epoch": 206.78,
"learning_rate": 4.91240506329114e-06,
"loss": 0.0,
"step": 20600
},
{
"epoch": 207.03,
"learning_rate": 4.906075949367089e-06,
"loss": 0.0,
"step": 20625
},
{
"epoch": 207.28,
"learning_rate": 4.8997468354430385e-06,
"loss": 0.0,
"step": 20650
},
{
"epoch": 207.53,
"learning_rate": 4.893417721518988e-06,
"loss": 0.0,
"step": 20675
},
{
"epoch": 207.78,
"learning_rate": 4.887088607594937e-06,
"loss": 0.0,
"step": 20700
},
{
"epoch": 208.03,
"learning_rate": 4.880759493670886e-06,
"loss": 0.0,
"step": 20725
},
{
"epoch": 208.28,
"learning_rate": 4.874430379746835e-06,
"loss": 0.0,
"step": 20750
},
{
"epoch": 208.53,
"learning_rate": 4.868101265822785e-06,
"loss": 0.0,
"step": 20775
},
{
"epoch": 208.78,
"learning_rate": 4.861772151898734e-06,
"loss": 0.0,
"step": 20800
},
{
"epoch": 209.03,
"learning_rate": 4.8554430379746845e-06,
"loss": 0.0,
"step": 20825
},
{
"epoch": 209.28,
"learning_rate": 4.849113924050634e-06,
"loss": 0.0,
"step": 20850
},
{
"epoch": 209.54,
"learning_rate": 4.8427848101265825e-06,
"loss": 0.0,
"step": 20875
},
{
"epoch": 209.79,
"learning_rate": 4.836455696202532e-06,
"loss": 0.0,
"step": 20900
},
{
"epoch": 210.04,
"learning_rate": 4.830126582278481e-06,
"loss": 0.0,
"step": 20925
},
{
"epoch": 210.29,
"learning_rate": 4.823797468354431e-06,
"loss": 0.0,
"step": 20950
},
{
"epoch": 210.54,
"learning_rate": 4.81746835443038e-06,
"loss": 0.0,
"step": 20975
},
{
"epoch": 210.79,
"learning_rate": 4.81113924050633e-06,
"loss": 0.0,
"step": 21000
},
{
"epoch": 210.79,
"eval_loss": 0.400534451007843,
"eval_runtime": 2829.8565,
"eval_samples_per_second": 4.503,
"eval_steps_per_second": 0.282,
"eval_wer": 7.548460215726122,
"step": 21000
},
{
"epoch": 211.04,
"learning_rate": 4.804810126582279e-06,
"loss": 0.0,
"step": 21025
},
{
"epoch": 211.29,
"learning_rate": 4.7984810126582285e-06,
"loss": 0.0,
"step": 21050
},
{
"epoch": 211.54,
"learning_rate": 4.792151898734178e-06,
"loss": 0.0,
"step": 21075
},
{
"epoch": 211.79,
"learning_rate": 4.7858227848101265e-06,
"loss": 0.0,
"step": 21100
},
{
"epoch": 212.05,
"learning_rate": 4.779493670886076e-06,
"loss": 0.0,
"step": 21125
},
{
"epoch": 212.3,
"learning_rate": 4.773164556962025e-06,
"loss": 0.0,
"step": 21150
},
{
"epoch": 212.55,
"learning_rate": 4.766835443037975e-06,
"loss": 0.0,
"step": 21175
},
{
"epoch": 212.8,
"learning_rate": 4.760506329113924e-06,
"loss": 0.0,
"step": 21200
},
{
"epoch": 213.05,
"learning_rate": 4.7541772151898745e-06,
"loss": 0.0,
"step": 21225
},
{
"epoch": 213.3,
"learning_rate": 4.747848101265823e-06,
"loss": 0.0,
"step": 21250
},
{
"epoch": 213.55,
"learning_rate": 4.7415189873417725e-06,
"loss": 0.0,
"step": 21275
},
{
"epoch": 213.8,
"learning_rate": 4.735189873417722e-06,
"loss": 0.0,
"step": 21300
},
{
"epoch": 214.05,
"learning_rate": 4.728860759493671e-06,
"loss": 0.0,
"step": 21325
},
{
"epoch": 214.3,
"learning_rate": 4.722531645569621e-06,
"loss": 0.0,
"step": 21350
},
{
"epoch": 214.55,
"learning_rate": 4.71620253164557e-06,
"loss": 0.0,
"step": 21375
},
{
"epoch": 214.81,
"learning_rate": 4.70987341772152e-06,
"loss": 0.0,
"step": 21400
},
{
"epoch": 215.06,
"learning_rate": 4.703544303797469e-06,
"loss": 0.0,
"step": 21425
},
{
"epoch": 215.31,
"learning_rate": 4.6972151898734185e-06,
"loss": 0.0,
"step": 21450
},
{
"epoch": 215.56,
"learning_rate": 4.690886075949367e-06,
"loss": 0.0,
"step": 21475
},
{
"epoch": 215.81,
"learning_rate": 4.6845569620253165e-06,
"loss": 0.0,
"step": 21500
},
{
"epoch": 216.06,
"learning_rate": 4.678227848101266e-06,
"loss": 0.0,
"step": 21525
},
{
"epoch": 216.31,
"learning_rate": 4.671898734177215e-06,
"loss": 0.0,
"step": 21550
},
{
"epoch": 216.56,
"learning_rate": 4.665569620253165e-06,
"loss": 0.0,
"step": 21575
},
{
"epoch": 216.81,
"learning_rate": 4.659240506329114e-06,
"loss": 0.0,
"step": 21600
},
{
"epoch": 217.06,
"learning_rate": 4.652911392405064e-06,
"loss": 0.0,
"step": 21625
},
{
"epoch": 217.31,
"learning_rate": 4.646582278481013e-06,
"loss": 0.0,
"step": 21650
},
{
"epoch": 217.57,
"learning_rate": 4.6402531645569625e-06,
"loss": 0.0,
"step": 21675
},
{
"epoch": 217.82,
"learning_rate": 4.633924050632912e-06,
"loss": 0.0,
"step": 21700
},
{
"epoch": 218.07,
"learning_rate": 4.627594936708861e-06,
"loss": 0.0,
"step": 21725
},
{
"epoch": 218.32,
"learning_rate": 4.621265822784811e-06,
"loss": 0.0,
"step": 21750
},
{
"epoch": 218.57,
"learning_rate": 4.61493670886076e-06,
"loss": 0.0,
"step": 21775
},
{
"epoch": 218.82,
"learning_rate": 4.60860759493671e-06,
"loss": 0.0,
"step": 21800
},
{
"epoch": 219.07,
"learning_rate": 4.602278481012658e-06,
"loss": 0.0,
"step": 21825
},
{
"epoch": 219.32,
"learning_rate": 4.595949367088608e-06,
"loss": 0.0,
"step": 21850
},
{
"epoch": 219.57,
"learning_rate": 4.589620253164557e-06,
"loss": 0.0,
"step": 21875
},
{
"epoch": 219.82,
"learning_rate": 4.5832911392405065e-06,
"loss": 0.0,
"step": 21900
},
{
"epoch": 220.08,
"learning_rate": 4.576962025316456e-06,
"loss": 0.0,
"step": 21925
},
{
"epoch": 220.33,
"learning_rate": 4.570632911392405e-06,
"loss": 0.0,
"step": 21950
},
{
"epoch": 220.58,
"learning_rate": 4.564303797468355e-06,
"loss": 0.0,
"step": 21975
},
{
"epoch": 220.83,
"learning_rate": 4.557974683544304e-06,
"loss": 0.0,
"step": 22000
},
{
"epoch": 220.83,
"eval_loss": 0.4101511240005493,
"eval_runtime": 2839.3882,
"eval_samples_per_second": 4.488,
"eval_steps_per_second": 0.281,
"eval_wer": 7.6266218539940605,
"step": 22000
},
{
"epoch": 221.08,
"learning_rate": 4.551645569620254e-06,
"loss": 0.0,
"step": 22025
},
{
"epoch": 221.33,
"learning_rate": 4.545316455696203e-06,
"loss": 0.0,
"step": 22050
},
{
"epoch": 221.58,
"learning_rate": 4.5389873417721525e-06,
"loss": 0.0,
"step": 22075
},
{
"epoch": 221.83,
"learning_rate": 4.532658227848102e-06,
"loss": 0.0,
"step": 22100
},
{
"epoch": 222.08,
"learning_rate": 4.526329113924051e-06,
"loss": 0.0,
"step": 22125
},
{
"epoch": 222.33,
"learning_rate": 4.520000000000001e-06,
"loss": 0.0,
"step": 22150
},
{
"epoch": 222.58,
"learning_rate": 4.51367088607595e-06,
"loss": 0.0,
"step": 22175
},
{
"epoch": 222.84,
"learning_rate": 4.507341772151899e-06,
"loss": 0.0,
"step": 22200
},
{
"epoch": 223.09,
"learning_rate": 4.501012658227848e-06,
"loss": 0.0,
"step": 22225
},
{
"epoch": 223.34,
"learning_rate": 4.494683544303798e-06,
"loss": 0.0,
"step": 22250
},
{
"epoch": 223.59,
"learning_rate": 4.488354430379747e-06,
"loss": 0.0,
"step": 22275
},
{
"epoch": 223.84,
"learning_rate": 4.4820253164556965e-06,
"loss": 0.0,
"step": 22300
},
{
"epoch": 224.09,
"learning_rate": 4.475696202531646e-06,
"loss": 0.0,
"step": 22325
},
{
"epoch": 224.34,
"learning_rate": 4.469367088607595e-06,
"loss": 0.0,
"step": 22350
},
{
"epoch": 224.59,
"learning_rate": 4.463037974683545e-06,
"loss": 0.0,
"step": 22375
},
{
"epoch": 224.84,
"learning_rate": 4.456708860759494e-06,
"loss": 0.0,
"step": 22400
},
{
"epoch": 225.09,
"learning_rate": 4.450379746835443e-06,
"loss": 0.0,
"step": 22425
},
{
"epoch": 225.35,
"learning_rate": 4.444050632911392e-06,
"loss": 0.0,
"step": 22450
},
{
"epoch": 225.6,
"learning_rate": 4.4377215189873425e-06,
"loss": 0.0,
"step": 22475
},
{
"epoch": 225.85,
"learning_rate": 4.431392405063292e-06,
"loss": 0.0,
"step": 22500
},
{
"epoch": 226.1,
"learning_rate": 4.425063291139241e-06,
"loss": 0.0,
"step": 22525
},
{
"epoch": 226.35,
"learning_rate": 4.418734177215191e-06,
"loss": 0.0,
"step": 22550
},
{
"epoch": 226.6,
"learning_rate": 4.412405063291139e-06,
"loss": 0.0,
"step": 22575
},
{
"epoch": 226.85,
"learning_rate": 4.406075949367089e-06,
"loss": 0.0,
"step": 22600
},
{
"epoch": 227.1,
"learning_rate": 4.399746835443038e-06,
"loss": 0.0,
"step": 22625
},
{
"epoch": 227.35,
"learning_rate": 4.393417721518988e-06,
"loss": 0.0,
"step": 22650
},
{
"epoch": 227.6,
"learning_rate": 4.387088607594937e-06,
"loss": 0.0,
"step": 22675
},
{
"epoch": 227.85,
"learning_rate": 4.3807594936708865e-06,
"loss": 0.0,
"step": 22700
},
{
"epoch": 228.11,
"learning_rate": 4.374430379746836e-06,
"loss": 0.0,
"step": 22725
},
{
"epoch": 228.36,
"learning_rate": 4.368101265822785e-06,
"loss": 0.0,
"step": 22750
},
{
"epoch": 228.61,
"learning_rate": 4.361772151898735e-06,
"loss": 0.0,
"step": 22775
},
{
"epoch": 228.86,
"learning_rate": 4.355443037974683e-06,
"loss": 0.0,
"step": 22800
},
{
"epoch": 229.11,
"learning_rate": 4.349113924050633e-06,
"loss": 0.0,
"step": 22825
},
{
"epoch": 229.36,
"learning_rate": 4.342784810126582e-06,
"loss": 0.0,
"step": 22850
},
{
"epoch": 229.61,
"learning_rate": 4.3364556962025325e-06,
"loss": 0.0,
"step": 22875
},
{
"epoch": 229.86,
"learning_rate": 4.330126582278482e-06,
"loss": 0.0,
"step": 22900
},
{
"epoch": 230.11,
"learning_rate": 4.323797468354431e-06,
"loss": 0.0,
"step": 22925
},
{
"epoch": 230.36,
"learning_rate": 4.31746835443038e-06,
"loss": 0.0,
"step": 22950
},
{
"epoch": 230.61,
"learning_rate": 4.311392405063291e-06,
"loss": 0.0074,
"step": 22975
},
{
"epoch": 230.87,
"learning_rate": 4.305063291139241e-06,
"loss": 0.0079,
"step": 23000
},
{
"epoch": 230.87,
"eval_loss": 0.24673040211200714,
"eval_runtime": 2817.1734,
"eval_samples_per_second": 4.523,
"eval_steps_per_second": 0.283,
"eval_wer": 9.165429107394091,
"step": 23000
},
{
"epoch": 231.12,
"learning_rate": 4.298987341772152e-06,
"loss": 0.0049,
"step": 23025
},
{
"epoch": 231.37,
"learning_rate": 4.292658227848102e-06,
"loss": 0.0041,
"step": 23050
},
{
"epoch": 231.62,
"learning_rate": 4.286329113924051e-06,
"loss": 0.0025,
"step": 23075
},
{
"epoch": 231.87,
"learning_rate": 4.2800000000000005e-06,
"loss": 0.0028,
"step": 23100
},
{
"epoch": 232.12,
"learning_rate": 4.27367088607595e-06,
"loss": 0.0018,
"step": 23125
},
{
"epoch": 232.37,
"learning_rate": 4.2673417721518985e-06,
"loss": 0.0009,
"step": 23150
},
{
"epoch": 232.62,
"learning_rate": 4.261012658227848e-06,
"loss": 0.0007,
"step": 23175
},
{
"epoch": 232.87,
"learning_rate": 4.254683544303797e-06,
"loss": 0.0005,
"step": 23200
},
{
"epoch": 233.12,
"learning_rate": 4.248354430379747e-06,
"loss": 0.0003,
"step": 23225
},
{
"epoch": 233.38,
"learning_rate": 4.242025316455697e-06,
"loss": 0.0003,
"step": 23250
},
{
"epoch": 233.63,
"learning_rate": 4.2356962025316465e-06,
"loss": 0.0002,
"step": 23275
},
{
"epoch": 233.88,
"learning_rate": 4.229367088607595e-06,
"loss": 0.0003,
"step": 23300
},
{
"epoch": 234.13,
"learning_rate": 4.2230379746835445e-06,
"loss": 0.0003,
"step": 23325
},
{
"epoch": 234.38,
"learning_rate": 4.216708860759494e-06,
"loss": 0.0001,
"step": 23350
},
{
"epoch": 234.63,
"learning_rate": 4.210379746835443e-06,
"loss": 0.0001,
"step": 23375
},
{
"epoch": 234.88,
"learning_rate": 4.204050632911393e-06,
"loss": 0.0001,
"step": 23400
},
{
"epoch": 235.13,
"learning_rate": 4.197721518987342e-06,
"loss": 0.0001,
"step": 23425
},
{
"epoch": 235.38,
"learning_rate": 4.191392405063292e-06,
"loss": 0.0001,
"step": 23450
},
{
"epoch": 235.63,
"learning_rate": 4.185063291139241e-06,
"loss": 0.0001,
"step": 23475
},
{
"epoch": 235.88,
"learning_rate": 4.1787341772151905e-06,
"loss": 0.0001,
"step": 23500
},
{
"epoch": 236.14,
"learning_rate": 4.172405063291139e-06,
"loss": 0.0001,
"step": 23525
},
{
"epoch": 236.39,
"learning_rate": 4.1660759493670885e-06,
"loss": 0.0,
"step": 23550
},
{
"epoch": 236.64,
"learning_rate": 4.159746835443038e-06,
"loss": 0.0,
"step": 23575
},
{
"epoch": 236.89,
"learning_rate": 4.153417721518987e-06,
"loss": 0.0,
"step": 23600
},
{
"epoch": 237.14,
"learning_rate": 4.147088607594937e-06,
"loss": 0.0001,
"step": 23625
},
{
"epoch": 237.39,
"learning_rate": 4.140759493670886e-06,
"loss": 0.0,
"step": 23650
},
{
"epoch": 237.64,
"learning_rate": 4.134430379746836e-06,
"loss": 0.0001,
"step": 23675
},
{
"epoch": 237.89,
"learning_rate": 4.128101265822785e-06,
"loss": 0.0,
"step": 23700
},
{
"epoch": 238.14,
"learning_rate": 4.1217721518987345e-06,
"loss": 0.0,
"step": 23725
},
{
"epoch": 238.39,
"learning_rate": 4.115443037974684e-06,
"loss": 0.0,
"step": 23750
},
{
"epoch": 238.64,
"learning_rate": 4.109113924050633e-06,
"loss": 0.0001,
"step": 23775
},
{
"epoch": 238.9,
"learning_rate": 4.102784810126583e-06,
"loss": 0.0,
"step": 23800
},
{
"epoch": 239.15,
"learning_rate": 4.096455696202532e-06,
"loss": 0.0,
"step": 23825
},
{
"epoch": 239.4,
"learning_rate": 4.090126582278482e-06,
"loss": 0.0,
"step": 23850
},
{
"epoch": 239.65,
"learning_rate": 4.083797468354431e-06,
"loss": 0.0,
"step": 23875
},
{
"epoch": 239.9,
"learning_rate": 4.07746835443038e-06,
"loss": 0.0001,
"step": 23900
},
{
"epoch": 240.15,
"learning_rate": 4.071139240506329e-06,
"loss": 0.0001,
"step": 23925
},
{
"epoch": 240.4,
"learning_rate": 4.0648101265822785e-06,
"loss": 0.0,
"step": 23950
},
{
"epoch": 240.65,
"learning_rate": 4.058481012658228e-06,
"loss": 0.0,
"step": 23975
},
{
"epoch": 240.9,
"learning_rate": 4.052151898734177e-06,
"loss": 0.0,
"step": 24000
},
{
"epoch": 240.9,
"eval_loss": 0.30968427658081055,
"eval_runtime": 2825.8546,
"eval_samples_per_second": 4.509,
"eval_steps_per_second": 0.282,
"eval_wer": 7.761450680006253,
"step": 24000
},
{
"epoch": 241.15,
"learning_rate": 4.045822784810127e-06,
"loss": 0.0,
"step": 24025
},
{
"epoch": 241.41,
"learning_rate": 4.039493670886076e-06,
"loss": 0.0,
"step": 24050
},
{
"epoch": 241.66,
"learning_rate": 4.033164556962026e-06,
"loss": 0.0,
"step": 24075
},
{
"epoch": 241.91,
"learning_rate": 4.026835443037975e-06,
"loss": 0.0,
"step": 24100
},
{
"epoch": 242.16,
"learning_rate": 4.0205063291139245e-06,
"loss": 0.0,
"step": 24125
},
{
"epoch": 242.41,
"learning_rate": 4.014177215189874e-06,
"loss": 0.0,
"step": 24150
},
{
"epoch": 242.66,
"learning_rate": 4.007848101265823e-06,
"loss": 0.0,
"step": 24175
},
{
"epoch": 242.91,
"learning_rate": 4.001518987341773e-06,
"loss": 0.0,
"step": 24200
},
{
"epoch": 243.16,
"learning_rate": 3.995189873417722e-06,
"loss": 0.0,
"step": 24225
},
{
"epoch": 243.41,
"learning_rate": 3.988860759493672e-06,
"loss": 0.0,
"step": 24250
},
{
"epoch": 243.66,
"learning_rate": 3.98253164556962e-06,
"loss": 0.0,
"step": 24275
},
{
"epoch": 243.91,
"learning_rate": 3.97620253164557e-06,
"loss": 0.0,
"step": 24300
},
{
"epoch": 244.17,
"learning_rate": 3.969873417721519e-06,
"loss": 0.0,
"step": 24325
},
{
"epoch": 244.42,
"learning_rate": 3.9635443037974685e-06,
"loss": 0.0,
"step": 24350
},
{
"epoch": 244.67,
"learning_rate": 3.957215189873418e-06,
"loss": 0.0,
"step": 24375
},
{
"epoch": 244.92,
"learning_rate": 3.950886075949367e-06,
"loss": 0.0,
"step": 24400
},
{
"epoch": 245.17,
"learning_rate": 3.944556962025317e-06,
"loss": 0.0,
"step": 24425
},
{
"epoch": 245.42,
"learning_rate": 3.938227848101266e-06,
"loss": 0.0,
"step": 24450
},
{
"epoch": 245.67,
"learning_rate": 3.931898734177216e-06,
"loss": 0.0,
"step": 24475
},
{
"epoch": 245.92,
"learning_rate": 3.925569620253165e-06,
"loss": 0.0,
"step": 24500
},
{
"epoch": 246.17,
"learning_rate": 3.9192405063291145e-06,
"loss": 0.0,
"step": 24525
},
{
"epoch": 246.42,
"learning_rate": 3.912911392405064e-06,
"loss": 0.0,
"step": 24550
},
{
"epoch": 246.68,
"learning_rate": 3.906582278481013e-06,
"loss": 0.0,
"step": 24575
},
{
"epoch": 246.93,
"learning_rate": 3.900253164556963e-06,
"loss": 0.0,
"step": 24600
},
{
"epoch": 247.18,
"learning_rate": 3.893924050632911e-06,
"loss": 0.0,
"step": 24625
},
{
"epoch": 247.43,
"learning_rate": 3.887594936708861e-06,
"loss": 0.0,
"step": 24650
},
{
"epoch": 247.68,
"learning_rate": 3.88126582278481e-06,
"loss": 0.0,
"step": 24675
},
{
"epoch": 247.93,
"learning_rate": 3.87493670886076e-06,
"loss": 0.0,
"step": 24700
},
{
"epoch": 248.18,
"learning_rate": 3.868607594936709e-06,
"loss": 0.0,
"step": 24725
},
{
"epoch": 248.43,
"learning_rate": 3.8622784810126585e-06,
"loss": 0.0,
"step": 24750
},
{
"epoch": 248.68,
"learning_rate": 3.855949367088608e-06,
"loss": 0.0,
"step": 24775
},
{
"epoch": 248.93,
"learning_rate": 3.849620253164557e-06,
"loss": 0.0,
"step": 24800
},
{
"epoch": 249.18,
"learning_rate": 3.843291139240507e-06,
"loss": 0.0,
"step": 24825
},
{
"epoch": 249.44,
"learning_rate": 3.836962025316455e-06,
"loss": 0.0,
"step": 24850
},
{
"epoch": 249.69,
"learning_rate": 3.830632911392405e-06,
"loss": 0.0,
"step": 24875
},
{
"epoch": 249.94,
"learning_rate": 3.824303797468355e-06,
"loss": 0.0,
"step": 24900
},
{
"epoch": 250.19,
"learning_rate": 3.8179746835443045e-06,
"loss": 0.0,
"step": 24925
},
{
"epoch": 250.44,
"learning_rate": 3.8116455696202535e-06,
"loss": 0.0,
"step": 24950
},
{
"epoch": 250.69,
"learning_rate": 3.805316455696203e-06,
"loss": 0.0,
"step": 24975
},
{
"epoch": 250.94,
"learning_rate": 3.7989873417721524e-06,
"loss": 0.0,
"step": 25000
},
{
"epoch": 250.94,
"eval_loss": 0.3311292827129364,
"eval_runtime": 2833.7855,
"eval_samples_per_second": 4.496,
"eval_steps_per_second": 0.281,
"eval_wer": 7.724323901828982,
"step": 25000
},
{
"epoch": 251.19,
"learning_rate": 3.792658227848102e-06,
"loss": 0.0,
"step": 25025
},
{
"epoch": 251.44,
"learning_rate": 3.786329113924051e-06,
"loss": 0.0,
"step": 25050
},
{
"epoch": 251.69,
"learning_rate": 3.7800000000000002e-06,
"loss": 0.0,
"step": 25075
},
{
"epoch": 251.94,
"learning_rate": 3.7736708860759497e-06,
"loss": 0.0,
"step": 25100
},
{
"epoch": 252.2,
"learning_rate": 3.767341772151899e-06,
"loss": 0.0,
"step": 25125
},
{
"epoch": 252.45,
"learning_rate": 3.7610126582278485e-06,
"loss": 0.0,
"step": 25150
},
{
"epoch": 252.7,
"learning_rate": 3.7546835443037975e-06,
"loss": 0.0,
"step": 25175
},
{
"epoch": 252.95,
"learning_rate": 3.748354430379747e-06,
"loss": 0.0,
"step": 25200
},
{
"epoch": 253.2,
"learning_rate": 3.7420253164556964e-06,
"loss": 0.0,
"step": 25225
},
{
"epoch": 253.45,
"learning_rate": 3.735696202531646e-06,
"loss": 0.0,
"step": 25250
},
{
"epoch": 253.7,
"learning_rate": 3.729367088607595e-06,
"loss": 0.0,
"step": 25275
},
{
"epoch": 253.95,
"learning_rate": 3.7230379746835442e-06,
"loss": 0.0,
"step": 25300
},
{
"epoch": 254.2,
"learning_rate": 3.716708860759494e-06,
"loss": 0.0,
"step": 25325
},
{
"epoch": 254.45,
"learning_rate": 3.7103797468354435e-06,
"loss": 0.0,
"step": 25350
},
{
"epoch": 254.71,
"learning_rate": 3.704050632911393e-06,
"loss": 0.0,
"step": 25375
},
{
"epoch": 254.96,
"learning_rate": 3.6977215189873424e-06,
"loss": 0.0,
"step": 25400
},
{
"epoch": 255.21,
"learning_rate": 3.6913924050632914e-06,
"loss": 0.0,
"step": 25425
},
{
"epoch": 255.46,
"learning_rate": 3.685063291139241e-06,
"loss": 0.0,
"step": 25450
},
{
"epoch": 255.71,
"learning_rate": 3.6787341772151902e-06,
"loss": 0.0,
"step": 25475
},
{
"epoch": 255.96,
"learning_rate": 3.6724050632911397e-06,
"loss": 0.0,
"step": 25500
},
{
"epoch": 256.21,
"learning_rate": 3.666075949367089e-06,
"loss": 0.0,
"step": 25525
},
{
"epoch": 256.46,
"learning_rate": 3.659746835443038e-06,
"loss": 0.0,
"step": 25550
},
{
"epoch": 256.71,
"learning_rate": 3.6534177215189875e-06,
"loss": 0.0,
"step": 25575
},
{
"epoch": 256.96,
"learning_rate": 3.647088607594937e-06,
"loss": 0.0,
"step": 25600
},
{
"epoch": 257.21,
"learning_rate": 3.6407594936708864e-06,
"loss": 0.0,
"step": 25625
},
{
"epoch": 257.47,
"learning_rate": 3.6344303797468354e-06,
"loss": 0.0,
"step": 25650
},
{
"epoch": 257.72,
"learning_rate": 3.628101265822785e-06,
"loss": 0.0,
"step": 25675
},
{
"epoch": 257.97,
"learning_rate": 3.6217721518987342e-06,
"loss": 0.0,
"step": 25700
},
{
"epoch": 258.22,
"learning_rate": 3.615443037974684e-06,
"loss": 0.0,
"step": 25725
},
{
"epoch": 258.47,
"learning_rate": 3.6091139240506335e-06,
"loss": 0.0,
"step": 25750
},
{
"epoch": 258.72,
"learning_rate": 3.602784810126583e-06,
"loss": 0.0,
"step": 25775
},
{
"epoch": 258.97,
"learning_rate": 3.596455696202532e-06,
"loss": 0.0,
"step": 25800
},
{
"epoch": 259.22,
"learning_rate": 3.5901265822784814e-06,
"loss": 0.0,
"step": 25825
},
{
"epoch": 259.47,
"learning_rate": 3.583797468354431e-06,
"loss": 0.0,
"step": 25850
},
{
"epoch": 259.72,
"learning_rate": 3.5774683544303802e-06,
"loss": 0.0,
"step": 25875
},
{
"epoch": 259.97,
"learning_rate": 3.5711392405063292e-06,
"loss": 0.0,
"step": 25900
},
{
"epoch": 260.23,
"learning_rate": 3.5648101265822787e-06,
"loss": 0.0,
"step": 25925
},
{
"epoch": 260.48,
"learning_rate": 3.558481012658228e-06,
"loss": 0.0,
"step": 25950
},
{
"epoch": 260.73,
"learning_rate": 3.5521518987341775e-06,
"loss": 0.0,
"step": 25975
},
{
"epoch": 260.98,
"learning_rate": 3.545822784810127e-06,
"loss": 0.0,
"step": 26000
},
{
"epoch": 260.98,
"eval_loss": 0.3445892930030823,
"eval_runtime": 2827.7825,
"eval_samples_per_second": 4.506,
"eval_steps_per_second": 0.282,
"eval_wer": 7.7028294513053,
"step": 26000
},
{
"epoch": 261.23,
"learning_rate": 3.539493670886076e-06,
"loss": 0.0,
"step": 26025
},
{
"epoch": 261.48,
"learning_rate": 3.5331645569620254e-06,
"loss": 0.0,
"step": 26050
},
{
"epoch": 261.73,
"learning_rate": 3.526835443037975e-06,
"loss": 0.0,
"step": 26075
},
{
"epoch": 261.98,
"learning_rate": 3.5205063291139242e-06,
"loss": 0.0,
"step": 26100
},
{
"epoch": 262.23,
"learning_rate": 3.514177215189874e-06,
"loss": 0.0,
"step": 26125
},
{
"epoch": 262.48,
"learning_rate": 3.5078481012658235e-06,
"loss": 0.0,
"step": 26150
},
{
"epoch": 262.74,
"learning_rate": 3.5015189873417725e-06,
"loss": 0.0,
"step": 26175
},
{
"epoch": 262.99,
"learning_rate": 3.495189873417722e-06,
"loss": 0.0,
"step": 26200
},
{
"epoch": 263.24,
"learning_rate": 3.4888607594936714e-06,
"loss": 0.0,
"step": 26225
},
{
"epoch": 263.49,
"learning_rate": 3.482531645569621e-06,
"loss": 0.0,
"step": 26250
},
{
"epoch": 263.74,
"learning_rate": 3.47620253164557e-06,
"loss": 0.0,
"step": 26275
},
{
"epoch": 263.99,
"learning_rate": 3.4698734177215192e-06,
"loss": 0.0,
"step": 26300
},
{
"epoch": 264.24,
"learning_rate": 3.4635443037974687e-06,
"loss": 0.0,
"step": 26325
},
{
"epoch": 264.49,
"learning_rate": 3.457215189873418e-06,
"loss": 0.0,
"step": 26350
},
{
"epoch": 264.74,
"learning_rate": 3.4508860759493675e-06,
"loss": 0.0,
"step": 26375
},
{
"epoch": 264.99,
"learning_rate": 3.4445569620253165e-06,
"loss": 0.0,
"step": 26400
},
{
"epoch": 265.24,
"learning_rate": 3.438227848101266e-06,
"loss": 0.0,
"step": 26425
},
{
"epoch": 265.5,
"learning_rate": 3.4318987341772154e-06,
"loss": 0.0,
"step": 26450
},
{
"epoch": 265.75,
"learning_rate": 3.425569620253165e-06,
"loss": 0.0,
"step": 26475
},
{
"epoch": 266.0,
"learning_rate": 3.419240506329114e-06,
"loss": 0.0,
"step": 26500
},
{
"epoch": 266.25,
"learning_rate": 3.4129113924050632e-06,
"loss": 0.0,
"step": 26525
},
{
"epoch": 266.5,
"learning_rate": 3.406582278481013e-06,
"loss": 0.0,
"step": 26550
},
{
"epoch": 266.75,
"learning_rate": 3.4002531645569625e-06,
"loss": 0.0,
"step": 26575
},
{
"epoch": 267.0,
"learning_rate": 3.393924050632912e-06,
"loss": 0.0,
"step": 26600
},
{
"epoch": 267.25,
"learning_rate": 3.3875949367088614e-06,
"loss": 0.0,
"step": 26625
},
{
"epoch": 267.5,
"learning_rate": 3.3812658227848104e-06,
"loss": 0.0,
"step": 26650
},
{
"epoch": 267.75,
"learning_rate": 3.37493670886076e-06,
"loss": 0.0,
"step": 26675
},
{
"epoch": 268.01,
"learning_rate": 3.3686075949367092e-06,
"loss": 0.0,
"step": 26700
},
{
"epoch": 268.26,
"learning_rate": 3.3622784810126586e-06,
"loss": 0.0,
"step": 26725
},
{
"epoch": 268.51,
"learning_rate": 3.3559493670886077e-06,
"loss": 0.0,
"step": 26750
},
{
"epoch": 268.76,
"learning_rate": 3.349620253164557e-06,
"loss": 0.0,
"step": 26775
},
{
"epoch": 269.01,
"learning_rate": 3.3432911392405065e-06,
"loss": 0.0,
"step": 26800
},
{
"epoch": 269.26,
"learning_rate": 3.336962025316456e-06,
"loss": 0.0,
"step": 26825
},
{
"epoch": 269.51,
"learning_rate": 3.3306329113924054e-06,
"loss": 0.0,
"step": 26850
},
{
"epoch": 269.76,
"learning_rate": 3.3243037974683544e-06,
"loss": 0.0,
"step": 26875
},
{
"epoch": 270.01,
"learning_rate": 3.317974683544304e-06,
"loss": 0.0,
"step": 26900
},
{
"epoch": 270.26,
"learning_rate": 3.3116455696202532e-06,
"loss": 0.0,
"step": 26925
},
{
"epoch": 270.51,
"learning_rate": 3.305316455696203e-06,
"loss": 0.0,
"step": 26950
},
{
"epoch": 270.77,
"learning_rate": 3.2989873417721525e-06,
"loss": 0.0,
"step": 26975
},
{
"epoch": 271.02,
"learning_rate": 3.292658227848102e-06,
"loss": 0.0,
"step": 27000
},
{
"epoch": 271.02,
"eval_loss": 0.355086088180542,
"eval_runtime": 2825.2162,
"eval_samples_per_second": 4.51,
"eval_steps_per_second": 0.282,
"eval_wer": 7.754611536657809,
"step": 27000
},
{
"epoch": 271.27,
"learning_rate": 3.286329113924051e-06,
"loss": 0.0,
"step": 27025
},
{
"epoch": 271.52,
"learning_rate": 3.2800000000000004e-06,
"loss": 0.0,
"step": 27050
},
{
"epoch": 271.77,
"learning_rate": 3.2736708860759498e-06,
"loss": 0.0,
"step": 27075
},
{
"epoch": 272.02,
"learning_rate": 3.2673417721518992e-06,
"loss": 0.0,
"step": 27100
},
{
"epoch": 272.27,
"learning_rate": 3.2610126582278482e-06,
"loss": 0.0,
"step": 27125
},
{
"epoch": 272.52,
"learning_rate": 3.2546835443037976e-06,
"loss": 0.0,
"step": 27150
},
{
"epoch": 272.77,
"learning_rate": 3.248354430379747e-06,
"loss": 0.0,
"step": 27175
},
{
"epoch": 273.02,
"learning_rate": 3.2420253164556965e-06,
"loss": 0.0,
"step": 27200
},
{
"epoch": 273.27,
"learning_rate": 3.235696202531646e-06,
"loss": 0.0,
"step": 27225
},
{
"epoch": 273.53,
"learning_rate": 3.229367088607595e-06,
"loss": 0.0,
"step": 27250
},
{
"epoch": 273.78,
"learning_rate": 3.2230379746835444e-06,
"loss": 0.0,
"step": 27275
},
{
"epoch": 274.03,
"learning_rate": 3.216708860759494e-06,
"loss": 0.0,
"step": 27300
},
{
"epoch": 274.28,
"learning_rate": 3.2103797468354432e-06,
"loss": 0.0,
"step": 27325
},
{
"epoch": 274.53,
"learning_rate": 3.2040506329113922e-06,
"loss": 0.0,
"step": 27350
},
{
"epoch": 274.78,
"learning_rate": 3.1977215189873425e-06,
"loss": 0.0,
"step": 27375
},
{
"epoch": 275.03,
"learning_rate": 3.1913924050632915e-06,
"loss": 0.0,
"step": 27400
},
{
"epoch": 275.28,
"learning_rate": 3.185063291139241e-06,
"loss": 0.0,
"step": 27425
},
{
"epoch": 275.53,
"learning_rate": 3.1787341772151904e-06,
"loss": 0.0,
"step": 27450
},
{
"epoch": 275.78,
"learning_rate": 3.1724050632911398e-06,
"loss": 0.0,
"step": 27475
},
{
"epoch": 276.04,
"learning_rate": 3.1660759493670888e-06,
"loss": 0.0,
"step": 27500
},
{
"epoch": 276.29,
"learning_rate": 3.1597468354430382e-06,
"loss": 0.0,
"step": 27525
},
{
"epoch": 276.54,
"learning_rate": 3.1534177215189876e-06,
"loss": 0.0,
"step": 27550
},
{
"epoch": 276.79,
"learning_rate": 3.147088607594937e-06,
"loss": 0.0,
"step": 27575
},
{
"epoch": 277.04,
"learning_rate": 3.140759493670886e-06,
"loss": 0.0,
"step": 27600
},
{
"epoch": 277.29,
"learning_rate": 3.1344303797468355e-06,
"loss": 0.0,
"step": 27625
},
{
"epoch": 277.54,
"learning_rate": 3.128101265822785e-06,
"loss": 0.0,
"step": 27650
},
{
"epoch": 277.79,
"learning_rate": 3.1217721518987344e-06,
"loss": 0.0,
"step": 27675
},
{
"epoch": 278.04,
"learning_rate": 3.1154430379746838e-06,
"loss": 0.0,
"step": 27700
},
{
"epoch": 278.29,
"learning_rate": 3.109113924050633e-06,
"loss": 0.0,
"step": 27725
},
{
"epoch": 278.54,
"learning_rate": 3.1027848101265822e-06,
"loss": 0.0,
"step": 27750
},
{
"epoch": 278.8,
"learning_rate": 3.096455696202532e-06,
"loss": 0.0,
"step": 27775
},
{
"epoch": 279.05,
"learning_rate": 3.0901265822784815e-06,
"loss": 0.0,
"step": 27800
},
{
"epoch": 279.3,
"learning_rate": 3.083797468354431e-06,
"loss": 0.0,
"step": 27825
},
{
"epoch": 279.55,
"learning_rate": 3.0774683544303804e-06,
"loss": 0.0,
"step": 27850
},
{
"epoch": 279.8,
"learning_rate": 3.0711392405063294e-06,
"loss": 0.0,
"step": 27875
},
{
"epoch": 280.05,
"learning_rate": 3.0648101265822788e-06,
"loss": 0.0,
"step": 27900
},
{
"epoch": 280.3,
"learning_rate": 3.058481012658228e-06,
"loss": 0.0,
"step": 27925
},
{
"epoch": 280.55,
"learning_rate": 3.0521518987341776e-06,
"loss": 0.0,
"step": 27950
},
{
"epoch": 280.8,
"learning_rate": 3.0458227848101266e-06,
"loss": 0.0,
"step": 27975
},
{
"epoch": 281.05,
"learning_rate": 3.039493670886076e-06,
"loss": 0.0,
"step": 28000
},
{
"epoch": 281.05,
"eval_loss": 0.36458390951156616,
"eval_runtime": 2827.7596,
"eval_samples_per_second": 4.506,
"eval_steps_per_second": 0.282,
"eval_wer": 7.798577458183524,
"step": 28000
},
{
"epoch": 281.3,
"learning_rate": 3.0331645569620255e-06,
"loss": 0.0,
"step": 28025
},
{
"epoch": 281.56,
"learning_rate": 3.026835443037975e-06,
"loss": 0.0,
"step": 28050
},
{
"epoch": 281.81,
"learning_rate": 3.0205063291139244e-06,
"loss": 0.0,
"step": 28075
},
{
"epoch": 282.06,
"learning_rate": 3.0141772151898734e-06,
"loss": 0.0,
"step": 28100
},
{
"epoch": 282.31,
"learning_rate": 3.0078481012658228e-06,
"loss": 0.0,
"step": 28125
},
{
"epoch": 282.56,
"learning_rate": 3.0015189873417722e-06,
"loss": 0.0,
"step": 28150
},
{
"epoch": 282.81,
"learning_rate": 2.9951898734177216e-06,
"loss": 0.0,
"step": 28175
},
{
"epoch": 283.06,
"learning_rate": 2.9888607594936715e-06,
"loss": 0.0,
"step": 28200
},
{
"epoch": 283.31,
"learning_rate": 2.982531645569621e-06,
"loss": 0.0,
"step": 28225
},
{
"epoch": 283.56,
"learning_rate": 2.97620253164557e-06,
"loss": 0.0,
"step": 28250
},
{
"epoch": 283.81,
"learning_rate": 2.9698734177215194e-06,
"loss": 0.0,
"step": 28275
},
{
"epoch": 284.07,
"learning_rate": 2.9635443037974688e-06,
"loss": 0.0,
"step": 28300
},
{
"epoch": 284.32,
"learning_rate": 2.957215189873418e-06,
"loss": 0.0,
"step": 28325
},
{
"epoch": 284.57,
"learning_rate": 2.950886075949367e-06,
"loss": 0.0,
"step": 28350
},
{
"epoch": 284.82,
"learning_rate": 2.9445569620253166e-06,
"loss": 0.0,
"step": 28375
},
{
"epoch": 285.07,
"learning_rate": 2.938227848101266e-06,
"loss": 0.0,
"step": 28400
},
{
"epoch": 285.32,
"learning_rate": 2.9318987341772155e-06,
"loss": 0.0,
"step": 28425
},
{
"epoch": 285.57,
"learning_rate": 2.925569620253165e-06,
"loss": 0.0,
"step": 28450
},
{
"epoch": 285.82,
"learning_rate": 2.919240506329114e-06,
"loss": 0.0,
"step": 28475
},
{
"epoch": 286.07,
"learning_rate": 2.9129113924050634e-06,
"loss": 0.0,
"step": 28500
},
{
"epoch": 286.32,
"learning_rate": 2.9065822784810128e-06,
"loss": 0.0,
"step": 28525
},
{
"epoch": 286.57,
"learning_rate": 2.900253164556962e-06,
"loss": 0.0,
"step": 28550
},
{
"epoch": 286.83,
"learning_rate": 2.8939240506329112e-06,
"loss": 0.0,
"step": 28575
},
{
"epoch": 287.08,
"learning_rate": 2.887594936708861e-06,
"loss": 0.0,
"step": 28600
},
{
"epoch": 287.33,
"learning_rate": 2.8812658227848105e-06,
"loss": 0.0,
"step": 28625
},
{
"epoch": 287.58,
"learning_rate": 2.87493670886076e-06,
"loss": 0.0,
"step": 28650
},
{
"epoch": 287.83,
"learning_rate": 2.8686075949367093e-06,
"loss": 0.0,
"step": 28675
},
{
"epoch": 288.08,
"learning_rate": 2.8622784810126588e-06,
"loss": 0.0,
"step": 28700
},
{
"epoch": 288.33,
"learning_rate": 2.8559493670886078e-06,
"loss": 0.0,
"step": 28725
},
{
"epoch": 288.58,
"learning_rate": 2.849620253164557e-06,
"loss": 0.0,
"step": 28750
},
{
"epoch": 288.83,
"learning_rate": 2.8432911392405066e-06,
"loss": 0.0,
"step": 28775
},
{
"epoch": 289.08,
"learning_rate": 2.836962025316456e-06,
"loss": 0.0,
"step": 28800
},
{
"epoch": 289.34,
"learning_rate": 2.830632911392405e-06,
"loss": 0.0,
"step": 28825
},
{
"epoch": 289.59,
"learning_rate": 2.8243037974683545e-06,
"loss": 0.0,
"step": 28850
},
{
"epoch": 289.84,
"learning_rate": 2.817974683544304e-06,
"loss": 0.0,
"step": 28875
},
{
"epoch": 290.09,
"learning_rate": 2.8116455696202533e-06,
"loss": 0.0,
"step": 28900
},
{
"epoch": 290.34,
"learning_rate": 2.8053164556962028e-06,
"loss": 0.0,
"step": 28925
},
{
"epoch": 290.59,
"learning_rate": 2.7989873417721518e-06,
"loss": 0.0,
"step": 28950
},
{
"epoch": 290.84,
"learning_rate": 2.792658227848101e-06,
"loss": 0.0,
"step": 28975
},
{
"epoch": 291.09,
"learning_rate": 2.7863291139240506e-06,
"loss": 0.0,
"step": 29000
},
{
"epoch": 291.09,
"eval_loss": 0.3728525936603546,
"eval_runtime": 2833.2163,
"eval_samples_per_second": 4.497,
"eval_steps_per_second": 0.281,
"eval_wer": 7.7780600281381895,
"step": 29000
},
{
"epoch": 291.34,
"learning_rate": 2.7800000000000005e-06,
"loss": 0.0,
"step": 29025
},
{
"epoch": 291.59,
"learning_rate": 2.773924050632912e-06,
"loss": 0.0,
"step": 29050
},
{
"epoch": 291.84,
"learning_rate": 2.767594936708861e-06,
"loss": 0.0,
"step": 29075
},
{
"epoch": 292.1,
"learning_rate": 2.7612658227848104e-06,
"loss": 0.0,
"step": 29100
},
{
"epoch": 292.35,
"learning_rate": 2.75493670886076e-06,
"loss": 0.0,
"step": 29125
},
{
"epoch": 292.6,
"learning_rate": 2.7486075949367092e-06,
"loss": 0.0,
"step": 29150
},
{
"epoch": 292.85,
"learning_rate": 2.7422784810126587e-06,
"loss": 0.0,
"step": 29175
},
{
"epoch": 293.1,
"learning_rate": 2.7359493670886077e-06,
"loss": 0.0,
"step": 29200
},
{
"epoch": 293.35,
"learning_rate": 2.729620253164557e-06,
"loss": 0.0,
"step": 29225
},
{
"epoch": 293.6,
"learning_rate": 2.7232911392405065e-06,
"loss": 0.0,
"step": 29250
},
{
"epoch": 293.85,
"learning_rate": 2.716962025316456e-06,
"loss": 0.0,
"step": 29275
},
{
"epoch": 294.1,
"learning_rate": 2.710632911392405e-06,
"loss": 0.0,
"step": 29300
},
{
"epoch": 294.35,
"learning_rate": 2.7043037974683544e-06,
"loss": 0.0,
"step": 29325
},
{
"epoch": 294.6,
"learning_rate": 2.697974683544304e-06,
"loss": 0.0,
"step": 29350
},
{
"epoch": 294.86,
"learning_rate": 2.6916455696202532e-06,
"loss": 0.0,
"step": 29375
},
{
"epoch": 295.11,
"learning_rate": 2.685316455696203e-06,
"loss": 0.0,
"step": 29400
},
{
"epoch": 295.36,
"learning_rate": 2.6789873417721525e-06,
"loss": 0.0,
"step": 29425
},
{
"epoch": 295.61,
"learning_rate": 2.6726582278481015e-06,
"loss": 0.0,
"step": 29450
},
{
"epoch": 295.86,
"learning_rate": 2.666329113924051e-06,
"loss": 0.0,
"step": 29475
},
{
"epoch": 296.11,
"learning_rate": 2.6600000000000004e-06,
"loss": 0.0,
"step": 29500
},
{
"epoch": 296.36,
"learning_rate": 2.65367088607595e-06,
"loss": 0.0,
"step": 29525
},
{
"epoch": 296.61,
"learning_rate": 2.6473417721518992e-06,
"loss": 0.0,
"step": 29550
},
{
"epoch": 296.86,
"learning_rate": 2.6410126582278482e-06,
"loss": 0.0,
"step": 29575
},
{
"epoch": 297.11,
"learning_rate": 2.6346835443037977e-06,
"loss": 0.0,
"step": 29600
},
{
"epoch": 297.37,
"learning_rate": 2.628354430379747e-06,
"loss": 0.0,
"step": 29625
},
{
"epoch": 297.62,
"learning_rate": 2.6220253164556965e-06,
"loss": 0.0,
"step": 29650
},
{
"epoch": 297.87,
"learning_rate": 2.6156962025316455e-06,
"loss": 0.0,
"step": 29675
},
{
"epoch": 298.12,
"learning_rate": 2.609367088607595e-06,
"loss": 0.0,
"step": 29700
},
{
"epoch": 298.37,
"learning_rate": 2.6030379746835444e-06,
"loss": 0.0,
"step": 29725
},
{
"epoch": 298.62,
"learning_rate": 2.596708860759494e-06,
"loss": 0.0,
"step": 29750
},
{
"epoch": 298.87,
"learning_rate": 2.5903797468354432e-06,
"loss": 0.0,
"step": 29775
},
{
"epoch": 299.12,
"learning_rate": 2.5840506329113922e-06,
"loss": 0.0,
"step": 29800
},
{
"epoch": 299.37,
"learning_rate": 2.577721518987342e-06,
"loss": 0.0,
"step": 29825
},
{
"epoch": 299.62,
"learning_rate": 2.5713924050632915e-06,
"loss": 0.0,
"step": 29850
},
{
"epoch": 299.87,
"learning_rate": 2.565063291139241e-06,
"loss": 0.0,
"step": 29875
},
{
"epoch": 300.13,
"learning_rate": 2.5587341772151904e-06,
"loss": 0.0,
"step": 29900
},
{
"epoch": 300.38,
"learning_rate": 2.5524050632911394e-06,
"loss": 0.0,
"step": 29925
},
{
"epoch": 300.63,
"learning_rate": 2.546075949367089e-06,
"loss": 0.0,
"step": 29950
},
{
"epoch": 300.88,
"learning_rate": 2.5397468354430382e-06,
"loss": 0.0,
"step": 29975
},
{
"epoch": 301.13,
"learning_rate": 2.5334177215189876e-06,
"loss": 0.0,
"step": 30000
},
{
"epoch": 301.13,
"eval_loss": 0.38112595677375793,
"eval_runtime": 2830.2491,
"eval_samples_per_second": 4.502,
"eval_steps_per_second": 0.282,
"eval_wer": 7.763404720962952,
"step": 30000
},
{
"epoch": 301.38,
"learning_rate": 2.527088607594937e-06,
"loss": 0.0,
"step": 30025
},
{
"epoch": 301.63,
"learning_rate": 2.520759493670886e-06,
"loss": 0.0,
"step": 30050
},
{
"epoch": 301.88,
"learning_rate": 2.5144303797468355e-06,
"loss": 0.0,
"step": 30075
},
{
"epoch": 302.13,
"learning_rate": 2.508101265822785e-06,
"loss": 0.0,
"step": 30100
},
{
"epoch": 302.38,
"learning_rate": 2.5017721518987344e-06,
"loss": 0.0,
"step": 30125
},
{
"epoch": 302.63,
"learning_rate": 2.495443037974684e-06,
"loss": 0.0,
"step": 30150
},
{
"epoch": 302.89,
"learning_rate": 2.4891139240506332e-06,
"loss": 0.0,
"step": 30175
},
{
"epoch": 303.14,
"learning_rate": 2.4827848101265826e-06,
"loss": 0.0,
"step": 30200
},
{
"epoch": 303.39,
"learning_rate": 2.4764556962025317e-06,
"loss": 0.0,
"step": 30225
},
{
"epoch": 303.64,
"learning_rate": 2.470126582278481e-06,
"loss": 0.0,
"step": 30250
},
{
"epoch": 303.89,
"learning_rate": 2.4637974683544305e-06,
"loss": 0.0,
"step": 30275
},
{
"epoch": 304.14,
"learning_rate": 2.45746835443038e-06,
"loss": 0.0,
"step": 30300
},
{
"epoch": 304.39,
"learning_rate": 2.4511392405063294e-06,
"loss": 0.0,
"step": 30325
},
{
"epoch": 304.64,
"learning_rate": 2.444810126582279e-06,
"loss": 0.0,
"step": 30350
},
{
"epoch": 304.89,
"learning_rate": 2.4384810126582282e-06,
"loss": 0.0,
"step": 30375
},
{
"epoch": 305.14,
"learning_rate": 2.4321518987341776e-06,
"loss": 0.0,
"step": 30400
},
{
"epoch": 305.4,
"learning_rate": 2.4258227848101266e-06,
"loss": 0.0,
"step": 30425
},
{
"epoch": 305.65,
"learning_rate": 2.419493670886076e-06,
"loss": 0.0,
"step": 30450
},
{
"epoch": 305.9,
"learning_rate": 2.4131645569620255e-06,
"loss": 0.0,
"step": 30475
},
{
"epoch": 306.15,
"learning_rate": 2.406835443037975e-06,
"loss": 0.0,
"step": 30500
},
{
"epoch": 306.4,
"learning_rate": 2.400506329113924e-06,
"loss": 0.0,
"step": 30525
},
{
"epoch": 306.65,
"learning_rate": 2.394177215189874e-06,
"loss": 0.0,
"step": 30550
},
{
"epoch": 306.9,
"learning_rate": 2.3878481012658232e-06,
"loss": 0.0,
"step": 30575
},
{
"epoch": 307.15,
"learning_rate": 2.3815189873417722e-06,
"loss": 0.0,
"step": 30600
},
{
"epoch": 307.4,
"learning_rate": 2.3751898734177216e-06,
"loss": 0.0,
"step": 30625
},
{
"epoch": 307.65,
"learning_rate": 2.368860759493671e-06,
"loss": 0.0,
"step": 30650
},
{
"epoch": 307.9,
"learning_rate": 2.3625316455696205e-06,
"loss": 0.0,
"step": 30675
},
{
"epoch": 308.16,
"learning_rate": 2.35620253164557e-06,
"loss": 0.0,
"step": 30700
},
{
"epoch": 308.41,
"learning_rate": 2.349873417721519e-06,
"loss": 0.0,
"step": 30725
},
{
"epoch": 308.66,
"learning_rate": 2.3435443037974688e-06,
"loss": 0.0,
"step": 30750
},
{
"epoch": 308.91,
"learning_rate": 2.337215189873418e-06,
"loss": 0.0,
"step": 30775
},
{
"epoch": 309.16,
"learning_rate": 2.3308860759493672e-06,
"loss": 0.0,
"step": 30800
},
{
"epoch": 309.41,
"learning_rate": 2.3245569620253166e-06,
"loss": 0.0,
"step": 30825
},
{
"epoch": 309.66,
"learning_rate": 2.318227848101266e-06,
"loss": 0.0,
"step": 30850
},
{
"epoch": 309.91,
"learning_rate": 2.3118987341772155e-06,
"loss": 0.0,
"step": 30875
},
{
"epoch": 310.16,
"learning_rate": 2.3055696202531645e-06,
"loss": 0.0,
"step": 30900
},
{
"epoch": 310.41,
"learning_rate": 2.299240506329114e-06,
"loss": 0.0,
"step": 30925
},
{
"epoch": 310.66,
"learning_rate": 2.2929113924050638e-06,
"loss": 0.0,
"step": 30950
},
{
"epoch": 310.92,
"learning_rate": 2.286582278481013e-06,
"loss": 0.0,
"step": 30975
},
{
"epoch": 311.17,
"learning_rate": 2.2802531645569622e-06,
"loss": 0.0,
"step": 31000
},
{
"epoch": 311.17,
"eval_loss": 0.38778597116470337,
"eval_runtime": 2828.9196,
"eval_samples_per_second": 4.504,
"eval_steps_per_second": 0.282,
"eval_wer": 7.7702438643113965,
"step": 31000
},
{
"epoch": 311.42,
"learning_rate": 2.2739240506329116e-06,
"loss": 0.0,
"step": 31025
},
{
"epoch": 311.67,
"learning_rate": 2.267594936708861e-06,
"loss": 0.0,
"step": 31050
},
{
"epoch": 311.92,
"learning_rate": 2.261518987341772e-06,
"loss": 0.0,
"step": 31075
},
{
"epoch": 312.17,
"learning_rate": 2.2551898734177215e-06,
"loss": 0.0,
"step": 31100
},
{
"epoch": 312.42,
"learning_rate": 2.248860759493671e-06,
"loss": 0.0,
"step": 31125
},
{
"epoch": 312.67,
"learning_rate": 2.2425316455696204e-06,
"loss": 0.0,
"step": 31150
},
{
"epoch": 312.92,
"learning_rate": 2.23620253164557e-06,
"loss": 0.0,
"step": 31175
},
{
"epoch": 313.17,
"learning_rate": 2.2298734177215192e-06,
"loss": 0.0,
"step": 31200
},
{
"epoch": 313.43,
"learning_rate": 2.2235443037974687e-06,
"loss": 0.0,
"step": 31225
},
{
"epoch": 313.68,
"learning_rate": 2.217215189873418e-06,
"loss": 0.0,
"step": 31250
},
{
"epoch": 313.93,
"learning_rate": 2.210886075949367e-06,
"loss": 0.0,
"step": 31275
},
{
"epoch": 314.18,
"learning_rate": 2.2045569620253165e-06,
"loss": 0.0,
"step": 31300
},
{
"epoch": 314.43,
"learning_rate": 2.198227848101266e-06,
"loss": 0.0,
"step": 31325
},
{
"epoch": 314.68,
"learning_rate": 2.1918987341772154e-06,
"loss": 0.0,
"step": 31350
},
{
"epoch": 314.93,
"learning_rate": 2.185569620253165e-06,
"loss": 0.0,
"step": 31375
},
{
"epoch": 315.18,
"learning_rate": 2.1792405063291142e-06,
"loss": 0.0,
"step": 31400
},
{
"epoch": 315.43,
"learning_rate": 2.1729113924050637e-06,
"loss": 0.0,
"step": 31425
},
{
"epoch": 315.68,
"learning_rate": 2.1665822784810127e-06,
"loss": 0.0,
"step": 31450
},
{
"epoch": 315.93,
"learning_rate": 2.160253164556962e-06,
"loss": 0.0,
"step": 31475
},
{
"epoch": 316.19,
"learning_rate": 2.1539240506329115e-06,
"loss": 0.0,
"step": 31500
},
{
"epoch": 316.44,
"learning_rate": 2.147594936708861e-06,
"loss": 0.0,
"step": 31525
},
{
"epoch": 316.69,
"learning_rate": 2.1412658227848104e-06,
"loss": 0.0,
"step": 31550
},
{
"epoch": 316.94,
"learning_rate": 2.13493670886076e-06,
"loss": 0.0,
"step": 31575
},
{
"epoch": 317.19,
"learning_rate": 2.1286075949367092e-06,
"loss": 0.0,
"step": 31600
},
{
"epoch": 317.44,
"learning_rate": 2.1222784810126582e-06,
"loss": 0.0,
"step": 31625
},
{
"epoch": 317.69,
"learning_rate": 2.1159493670886077e-06,
"loss": 0.0,
"step": 31650
},
{
"epoch": 317.94,
"learning_rate": 2.109620253164557e-06,
"loss": 0.0,
"step": 31675
},
{
"epoch": 318.19,
"learning_rate": 2.1032911392405065e-06,
"loss": 0.0,
"step": 31700
},
{
"epoch": 318.44,
"learning_rate": 2.096962025316456e-06,
"loss": 0.0,
"step": 31725
},
{
"epoch": 318.7,
"learning_rate": 2.090632911392405e-06,
"loss": 0.0,
"step": 31750
},
{
"epoch": 318.95,
"learning_rate": 2.084303797468355e-06,
"loss": 0.0,
"step": 31775
},
{
"epoch": 319.2,
"learning_rate": 2.0779746835443042e-06,
"loss": 0.0,
"step": 31800
},
{
"epoch": 319.45,
"learning_rate": 2.0716455696202532e-06,
"loss": 0.0,
"step": 31825
},
{
"epoch": 319.7,
"learning_rate": 2.0653164556962027e-06,
"loss": 0.0,
"step": 31850
},
{
"epoch": 319.95,
"learning_rate": 2.058987341772152e-06,
"loss": 0.0,
"step": 31875
},
{
"epoch": 320.2,
"learning_rate": 2.0526582278481015e-06,
"loss": 0.0,
"step": 31900
},
{
"epoch": 320.45,
"learning_rate": 2.0463291139240505e-06,
"loss": 0.0,
"step": 31925
},
{
"epoch": 320.7,
"learning_rate": 2.04e-06,
"loss": 0.0,
"step": 31950
},
{
"epoch": 320.95,
"learning_rate": 2.03367088607595e-06,
"loss": 0.0,
"step": 31975
},
{
"epoch": 321.2,
"learning_rate": 2.027341772151899e-06,
"loss": 0.0,
"step": 32000
},
{
"epoch": 321.2,
"eval_loss": 0.39481475949287415,
"eval_runtime": 2829.7401,
"eval_samples_per_second": 4.503,
"eval_steps_per_second": 0.282,
"eval_wer": 7.772197905268094,
"step": 32000
},
{
"epoch": 321.46,
"learning_rate": 2.0210126582278482e-06,
"loss": 0.0,
"step": 32025
},
{
"epoch": 321.71,
"learning_rate": 2.0146835443037977e-06,
"loss": 0.0,
"step": 32050
},
{
"epoch": 321.96,
"learning_rate": 2.008354430379747e-06,
"loss": 0.0,
"step": 32075
},
{
"epoch": 322.21,
"learning_rate": 2.0020253164556965e-06,
"loss": 0.0,
"step": 32100
},
{
"epoch": 322.46,
"learning_rate": 1.9956962025316455e-06,
"loss": 0.0,
"step": 32125
},
{
"epoch": 322.71,
"learning_rate": 1.989367088607595e-06,
"loss": 0.0,
"step": 32150
},
{
"epoch": 322.96,
"learning_rate": 1.9830379746835444e-06,
"loss": 0.0,
"step": 32175
},
{
"epoch": 323.21,
"learning_rate": 1.976708860759494e-06,
"loss": 0.0,
"step": 32200
},
{
"epoch": 323.46,
"learning_rate": 1.9703797468354432e-06,
"loss": 0.0,
"step": 32225
},
{
"epoch": 323.71,
"learning_rate": 1.9640506329113927e-06,
"loss": 0.0,
"step": 32250
},
{
"epoch": 323.96,
"learning_rate": 1.957721518987342e-06,
"loss": 0.0,
"step": 32275
},
{
"epoch": 324.22,
"learning_rate": 1.951392405063291e-06,
"loss": 0.0,
"step": 32300
},
{
"epoch": 324.47,
"learning_rate": 1.9450632911392405e-06,
"loss": 0.0,
"step": 32325
},
{
"epoch": 324.72,
"learning_rate": 1.93873417721519e-06,
"loss": 0.0,
"step": 32350
},
{
"epoch": 324.97,
"learning_rate": 1.9324050632911394e-06,
"loss": 0.0,
"step": 32375
},
{
"epoch": 325.22,
"learning_rate": 1.926075949367089e-06,
"loss": 0.0,
"step": 32400
},
{
"epoch": 325.47,
"learning_rate": 1.9197468354430382e-06,
"loss": 0.0,
"step": 32425
},
{
"epoch": 325.72,
"learning_rate": 1.9134177215189877e-06,
"loss": 0.0,
"step": 32450
},
{
"epoch": 325.97,
"learning_rate": 1.9070886075949369e-06,
"loss": 0.0,
"step": 32475
},
{
"epoch": 326.22,
"learning_rate": 1.900759493670886e-06,
"loss": 0.0,
"step": 32500
},
{
"epoch": 326.47,
"learning_rate": 1.8944303797468355e-06,
"loss": 0.0,
"step": 32525
},
{
"epoch": 326.73,
"learning_rate": 1.888101265822785e-06,
"loss": 0.0,
"step": 32550
},
{
"epoch": 326.98,
"learning_rate": 1.8817721518987344e-06,
"loss": 0.0,
"step": 32575
},
{
"epoch": 327.23,
"learning_rate": 1.8754430379746838e-06,
"loss": 0.0,
"step": 32600
},
{
"epoch": 327.48,
"learning_rate": 1.8691139240506332e-06,
"loss": 0.0,
"step": 32625
},
{
"epoch": 327.73,
"learning_rate": 1.8627848101265824e-06,
"loss": 0.0,
"step": 32650
},
{
"epoch": 327.98,
"learning_rate": 1.8564556962025319e-06,
"loss": 0.0,
"step": 32675
},
{
"epoch": 328.23,
"learning_rate": 1.850126582278481e-06,
"loss": 0.0,
"step": 32700
},
{
"epoch": 328.48,
"learning_rate": 1.8437974683544305e-06,
"loss": 0.0,
"step": 32725
},
{
"epoch": 328.73,
"learning_rate": 1.8374683544303797e-06,
"loss": 0.0,
"step": 32750
},
{
"epoch": 328.98,
"learning_rate": 1.8311392405063292e-06,
"loss": 0.0,
"step": 32775
},
{
"epoch": 329.23,
"learning_rate": 1.8248101265822788e-06,
"loss": 0.0,
"step": 32800
},
{
"epoch": 329.49,
"learning_rate": 1.818481012658228e-06,
"loss": 0.0,
"step": 32825
},
{
"epoch": 329.74,
"learning_rate": 1.8121518987341774e-06,
"loss": 0.0,
"step": 32850
},
{
"epoch": 329.99,
"learning_rate": 1.8058227848101267e-06,
"loss": 0.0,
"step": 32875
},
{
"epoch": 330.24,
"learning_rate": 1.799493670886076e-06,
"loss": 0.0,
"step": 32900
},
{
"epoch": 330.49,
"learning_rate": 1.7931645569620253e-06,
"loss": 0.0,
"step": 32925
},
{
"epoch": 330.74,
"learning_rate": 1.7868354430379747e-06,
"loss": 0.0,
"step": 32950
},
{
"epoch": 330.99,
"learning_rate": 1.7805063291139242e-06,
"loss": 0.0,
"step": 32975
},
{
"epoch": 331.24,
"learning_rate": 1.7741772151898736e-06,
"loss": 0.0,
"step": 33000
},
{
"epoch": 331.24,
"eval_loss": 0.4002886712551117,
"eval_runtime": 2835.03,
"eval_samples_per_second": 4.494,
"eval_steps_per_second": 0.281,
"eval_wer": 7.730186024699077,
"step": 33000
},
{
"epoch": 331.49,
"learning_rate": 1.767848101265823e-06,
"loss": 0.0,
"step": 33025
},
{
"epoch": 331.74,
"learning_rate": 1.7615189873417724e-06,
"loss": 0.0,
"step": 33050
},
{
"epoch": 331.99,
"learning_rate": 1.7551898734177217e-06,
"loss": 0.0,
"step": 33075
},
{
"epoch": 332.25,
"learning_rate": 1.748860759493671e-06,
"loss": 0.0,
"step": 33100
},
{
"epoch": 332.5,
"learning_rate": 1.7427848101265823e-06,
"loss": 0.0,
"step": 33125
},
{
"epoch": 332.75,
"learning_rate": 1.7364556962025317e-06,
"loss": 0.0,
"step": 33150
},
{
"epoch": 333.0,
"learning_rate": 1.7301265822784814e-06,
"loss": 0.0,
"step": 33175
},
{
"epoch": 333.25,
"learning_rate": 1.7237974683544306e-06,
"loss": 0.0,
"step": 33200
},
{
"epoch": 333.5,
"learning_rate": 1.71746835443038e-06,
"loss": 0.0,
"step": 33225
},
{
"epoch": 333.75,
"learning_rate": 1.7111392405063292e-06,
"loss": 0.0,
"step": 33250
},
{
"epoch": 334.0,
"learning_rate": 1.7048101265822787e-06,
"loss": 0.0,
"step": 33275
},
{
"epoch": 334.25,
"learning_rate": 1.6984810126582279e-06,
"loss": 0.0,
"step": 33300
},
{
"epoch": 334.5,
"learning_rate": 1.6921518987341773e-06,
"loss": 0.0,
"step": 33325
},
{
"epoch": 334.76,
"learning_rate": 1.6858227848101265e-06,
"loss": 0.0,
"step": 33350
},
{
"epoch": 335.01,
"learning_rate": 1.6797468354430382e-06,
"loss": 0.0,
"step": 33375
},
{
"epoch": 335.26,
"learning_rate": 1.6734177215189876e-06,
"loss": 0.0,
"step": 33400
},
{
"epoch": 335.51,
"learning_rate": 1.6670886075949368e-06,
"loss": 0.0,
"step": 33425
},
{
"epoch": 335.76,
"learning_rate": 1.6607594936708863e-06,
"loss": 0.0,
"step": 33450
},
{
"epoch": 336.01,
"learning_rate": 1.6544303797468355e-06,
"loss": 0.0,
"step": 33475
},
{
"epoch": 336.26,
"learning_rate": 1.648101265822785e-06,
"loss": 0.0,
"step": 33500
},
{
"epoch": 336.51,
"learning_rate": 1.6417721518987343e-06,
"loss": 0.0,
"step": 33525
},
{
"epoch": 336.76,
"learning_rate": 1.6354430379746836e-06,
"loss": 0.0,
"step": 33550
},
{
"epoch": 337.01,
"learning_rate": 1.6291139240506332e-06,
"loss": 0.0,
"step": 33575
},
{
"epoch": 337.26,
"learning_rate": 1.6227848101265824e-06,
"loss": 0.0,
"step": 33600
},
{
"epoch": 337.52,
"learning_rate": 1.6164556962025318e-06,
"loss": 0.0,
"step": 33625
},
{
"epoch": 337.77,
"learning_rate": 1.6101265822784813e-06,
"loss": 0.0,
"step": 33650
},
{
"epoch": 338.02,
"learning_rate": 1.6037974683544305e-06,
"loss": 0.0,
"step": 33675
},
{
"epoch": 338.27,
"learning_rate": 1.59746835443038e-06,
"loss": 0.0,
"step": 33700
},
{
"epoch": 338.52,
"learning_rate": 1.5911392405063291e-06,
"loss": 0.0,
"step": 33725
},
{
"epoch": 338.77,
"learning_rate": 1.5848101265822786e-06,
"loss": 0.0,
"step": 33750
},
{
"epoch": 339.02,
"learning_rate": 1.5784810126582278e-06,
"loss": 0.0,
"step": 33775
},
{
"epoch": 339.27,
"learning_rate": 1.5721518987341774e-06,
"loss": 0.0,
"step": 33800
},
{
"epoch": 339.52,
"learning_rate": 1.5658227848101268e-06,
"loss": 0.0,
"step": 33825
},
{
"epoch": 339.77,
"learning_rate": 1.559493670886076e-06,
"loss": 0.0,
"step": 33850
},
{
"epoch": 340.03,
"learning_rate": 1.5531645569620255e-06,
"loss": 0.0,
"step": 33875
},
{
"epoch": 340.28,
"learning_rate": 1.5468354430379747e-06,
"loss": 0.0,
"step": 33900
},
{
"epoch": 340.53,
"learning_rate": 1.5405063291139241e-06,
"loss": 0.0,
"step": 33925
},
{
"epoch": 340.78,
"learning_rate": 1.5341772151898736e-06,
"loss": 0.0,
"step": 33950
},
{
"epoch": 341.03,
"learning_rate": 1.5278481012658228e-06,
"loss": 0.0,
"step": 33975
},
{
"epoch": 341.28,
"learning_rate": 1.5215189873417724e-06,
"loss": 0.0,
"step": 34000
},
{
"epoch": 341.28,
"eval_loss": 0.4057931900024414,
"eval_runtime": 2832.6042,
"eval_samples_per_second": 4.498,
"eval_steps_per_second": 0.281,
"eval_wer": 7.731163045177427,
"step": 34000
},
{
"epoch": 341.53,
"learning_rate": 1.5151898734177216e-06,
"loss": 0.0,
"step": 34025
},
{
"epoch": 341.78,
"learning_rate": 1.508860759493671e-06,
"loss": 0.0,
"step": 34050
},
{
"epoch": 342.03,
"learning_rate": 1.5025316455696205e-06,
"loss": 0.0,
"step": 34075
},
{
"epoch": 342.28,
"learning_rate": 1.4962025316455697e-06,
"loss": 0.0,
"step": 34100
},
{
"epoch": 342.53,
"learning_rate": 1.4898734177215191e-06,
"loss": 0.0,
"step": 34125
},
{
"epoch": 342.79,
"learning_rate": 1.4835443037974683e-06,
"loss": 0.0,
"step": 34150
},
{
"epoch": 343.04,
"learning_rate": 1.4772151898734178e-06,
"loss": 0.0,
"step": 34175
},
{
"epoch": 343.29,
"learning_rate": 1.4708860759493674e-06,
"loss": 0.0,
"step": 34200
},
{
"epoch": 343.54,
"learning_rate": 1.4645569620253166e-06,
"loss": 0.0,
"step": 34225
},
{
"epoch": 343.79,
"learning_rate": 1.458227848101266e-06,
"loss": 0.0,
"step": 34250
},
{
"epoch": 344.04,
"learning_rate": 1.4518987341772153e-06,
"loss": 0.0,
"step": 34275
},
{
"epoch": 344.29,
"learning_rate": 1.4455696202531647e-06,
"loss": 0.0,
"step": 34300
},
{
"epoch": 344.54,
"learning_rate": 1.439240506329114e-06,
"loss": 0.0,
"step": 34325
},
{
"epoch": 344.79,
"learning_rate": 1.4329113924050633e-06,
"loss": 0.0,
"step": 34350
},
{
"epoch": 345.04,
"learning_rate": 1.4265822784810128e-06,
"loss": 0.0,
"step": 34375
},
{
"epoch": 345.29,
"learning_rate": 1.4202531645569622e-06,
"loss": 0.0,
"step": 34400
},
{
"epoch": 345.55,
"learning_rate": 1.4139240506329116e-06,
"loss": 0.0,
"step": 34425
},
{
"epoch": 345.8,
"learning_rate": 1.4075949367088608e-06,
"loss": 0.0,
"step": 34450
},
{
"epoch": 346.05,
"learning_rate": 1.4012658227848103e-06,
"loss": 0.0,
"step": 34475
},
{
"epoch": 346.3,
"learning_rate": 1.3949367088607597e-06,
"loss": 0.0,
"step": 34500
},
{
"epoch": 346.55,
"learning_rate": 1.388607594936709e-06,
"loss": 0.0,
"step": 34525
},
{
"epoch": 346.8,
"learning_rate": 1.3822784810126583e-06,
"loss": 0.0,
"step": 34550
},
{
"epoch": 347.05,
"learning_rate": 1.3759493670886076e-06,
"loss": 0.0,
"step": 34575
},
{
"epoch": 347.3,
"learning_rate": 1.3696202531645572e-06,
"loss": 0.0,
"step": 34600
},
{
"epoch": 347.55,
"learning_rate": 1.3632911392405066e-06,
"loss": 0.0,
"step": 34625
},
{
"epoch": 347.8,
"learning_rate": 1.3569620253164558e-06,
"loss": 0.0,
"step": 34650
},
{
"epoch": 348.06,
"learning_rate": 1.3506329113924053e-06,
"loss": 0.0,
"step": 34675
},
{
"epoch": 348.31,
"learning_rate": 1.3443037974683545e-06,
"loss": 0.0,
"step": 34700
},
{
"epoch": 348.56,
"learning_rate": 1.337974683544304e-06,
"loss": 0.0,
"step": 34725
},
{
"epoch": 348.81,
"learning_rate": 1.3316455696202531e-06,
"loss": 0.0,
"step": 34750
},
{
"epoch": 349.06,
"learning_rate": 1.3253164556962025e-06,
"loss": 0.0,
"step": 34775
},
{
"epoch": 349.31,
"learning_rate": 1.318987341772152e-06,
"loss": 0.0,
"step": 34800
},
{
"epoch": 349.56,
"learning_rate": 1.3126582278481014e-06,
"loss": 0.0,
"step": 34825
},
{
"epoch": 349.81,
"learning_rate": 1.3063291139240508e-06,
"loss": 0.0,
"step": 34850
},
{
"epoch": 350.06,
"learning_rate": 1.3e-06,
"loss": 0.0,
"step": 34875
},
{
"epoch": 350.31,
"learning_rate": 1.2936708860759495e-06,
"loss": 0.0,
"step": 34900
},
{
"epoch": 350.56,
"learning_rate": 1.287341772151899e-06,
"loss": 0.0,
"step": 34925
},
{
"epoch": 350.82,
"learning_rate": 1.2810126582278481e-06,
"loss": 0.0,
"step": 34950
},
{
"epoch": 351.07,
"learning_rate": 1.2746835443037975e-06,
"loss": 0.0,
"step": 34975
},
{
"epoch": 351.32,
"learning_rate": 1.2683544303797468e-06,
"loss": 0.0,
"step": 35000
},
{
"epoch": 351.32,
"eval_loss": 0.41078662872314453,
"eval_runtime": 2834.2574,
"eval_samples_per_second": 4.496,
"eval_steps_per_second": 0.281,
"eval_wer": 7.729209004220729,
"step": 35000
},
{
"epoch": 351.57,
"learning_rate": 1.2620253164556964e-06,
"loss": 0.0,
"step": 35025
},
{
"epoch": 351.82,
"learning_rate": 1.2556962025316458e-06,
"loss": 0.0,
"step": 35050
},
{
"epoch": 352.07,
"learning_rate": 1.249367088607595e-06,
"loss": 0.0,
"step": 35075
},
{
"epoch": 352.32,
"learning_rate": 1.2430379746835445e-06,
"loss": 0.0,
"step": 35100
},
{
"epoch": 352.57,
"learning_rate": 1.2367088607594937e-06,
"loss": 0.0,
"step": 35125
},
{
"epoch": 352.82,
"learning_rate": 1.2303797468354431e-06,
"loss": 0.0,
"step": 35150
},
{
"epoch": 353.07,
"learning_rate": 1.2240506329113925e-06,
"loss": 0.0,
"step": 35175
},
{
"epoch": 353.32,
"learning_rate": 1.217721518987342e-06,
"loss": 0.0,
"step": 35200
},
{
"epoch": 353.58,
"learning_rate": 1.2113924050632912e-06,
"loss": 0.0,
"step": 35225
},
{
"epoch": 353.83,
"learning_rate": 1.2050632911392406e-06,
"loss": 0.0,
"step": 35250
},
{
"epoch": 354.08,
"learning_rate": 1.19873417721519e-06,
"loss": 0.0,
"step": 35275
},
{
"epoch": 354.33,
"learning_rate": 1.1924050632911393e-06,
"loss": 0.0,
"step": 35300
},
{
"epoch": 354.58,
"learning_rate": 1.1860759493670887e-06,
"loss": 0.0,
"step": 35325
},
{
"epoch": 354.83,
"learning_rate": 1.1797468354430381e-06,
"loss": 0.0,
"step": 35350
},
{
"epoch": 355.08,
"learning_rate": 1.1734177215189875e-06,
"loss": 0.0,
"step": 35375
},
{
"epoch": 355.33,
"learning_rate": 1.1670886075949368e-06,
"loss": 0.0,
"step": 35400
},
{
"epoch": 355.58,
"learning_rate": 1.1607594936708862e-06,
"loss": 0.0,
"step": 35425
},
{
"epoch": 355.83,
"learning_rate": 1.1544303797468354e-06,
"loss": 0.0,
"step": 35450
},
{
"epoch": 356.09,
"learning_rate": 1.148101265822785e-06,
"loss": 0.0,
"step": 35475
},
{
"epoch": 356.34,
"learning_rate": 1.1417721518987343e-06,
"loss": 0.0,
"step": 35500
},
{
"epoch": 356.59,
"learning_rate": 1.1354430379746837e-06,
"loss": 0.0,
"step": 35525
},
{
"epoch": 356.84,
"learning_rate": 1.129113924050633e-06,
"loss": 0.0,
"step": 35550
},
{
"epoch": 357.09,
"learning_rate": 1.1227848101265823e-06,
"loss": 0.0,
"step": 35575
},
{
"epoch": 357.34,
"learning_rate": 1.1164556962025318e-06,
"loss": 0.0,
"step": 35600
},
{
"epoch": 357.59,
"learning_rate": 1.1101265822784812e-06,
"loss": 0.0,
"step": 35625
},
{
"epoch": 357.84,
"learning_rate": 1.1037974683544304e-06,
"loss": 0.0,
"step": 35650
},
{
"epoch": 358.09,
"learning_rate": 1.0974683544303798e-06,
"loss": 0.0,
"step": 35675
},
{
"epoch": 358.34,
"learning_rate": 1.0911392405063293e-06,
"loss": 0.0,
"step": 35700
},
{
"epoch": 358.59,
"learning_rate": 1.0848101265822787e-06,
"loss": 0.0,
"step": 35725
},
{
"epoch": 358.85,
"learning_rate": 1.078481012658228e-06,
"loss": 0.0,
"step": 35750
},
{
"epoch": 359.1,
"learning_rate": 1.0721518987341773e-06,
"loss": 0.0,
"step": 35775
},
{
"epoch": 359.35,
"learning_rate": 1.0658227848101268e-06,
"loss": 0.0,
"step": 35800
},
{
"epoch": 359.6,
"learning_rate": 1.059493670886076e-06,
"loss": 0.0,
"step": 35825
},
{
"epoch": 359.85,
"learning_rate": 1.0531645569620254e-06,
"loss": 0.0,
"step": 35850
},
{
"epoch": 360.1,
"learning_rate": 1.0468354430379746e-06,
"loss": 0.0,
"step": 35875
},
{
"epoch": 360.35,
"learning_rate": 1.0405063291139243e-06,
"loss": 0.0,
"step": 35900
},
{
"epoch": 360.6,
"learning_rate": 1.0341772151898735e-06,
"loss": 0.0,
"step": 35925
},
{
"epoch": 360.85,
"learning_rate": 1.027848101265823e-06,
"loss": 0.0,
"step": 35950
},
{
"epoch": 361.1,
"learning_rate": 1.0215189873417721e-06,
"loss": 0.0,
"step": 35975
},
{
"epoch": 361.36,
"learning_rate": 1.0151898734177218e-06,
"loss": 0.0,
"step": 36000
},
{
"epoch": 361.36,
"eval_loss": 0.4141576886177063,
"eval_runtime": 2833.1664,
"eval_samples_per_second": 4.497,
"eval_steps_per_second": 0.281,
"eval_wer": 7.732140065655776,
"step": 36000
},
{
"epoch": 361.61,
"learning_rate": 1.008860759493671e-06,
"loss": 0.0,
"step": 36025
},
{
"epoch": 361.86,
"learning_rate": 1.0025316455696204e-06,
"loss": 0.0,
"step": 36050
},
{
"epoch": 362.11,
"learning_rate": 9.962025316455696e-07,
"loss": 0.0,
"step": 36075
},
{
"epoch": 362.36,
"learning_rate": 9.89873417721519e-07,
"loss": 0.0,
"step": 36100
},
{
"epoch": 362.61,
"learning_rate": 9.835443037974685e-07,
"loss": 0.0,
"step": 36125
},
{
"epoch": 362.86,
"learning_rate": 9.77215189873418e-07,
"loss": 0.0,
"step": 36150
},
{
"epoch": 363.11,
"learning_rate": 9.708860759493671e-07,
"loss": 0.0,
"step": 36175
},
{
"epoch": 363.36,
"learning_rate": 9.645569620253165e-07,
"loss": 0.0,
"step": 36200
},
{
"epoch": 363.61,
"learning_rate": 9.58227848101266e-07,
"loss": 0.0,
"step": 36225
},
{
"epoch": 363.86,
"learning_rate": 9.518987341772153e-07,
"loss": 0.0,
"step": 36250
},
{
"epoch": 364.12,
"learning_rate": 9.455696202531646e-07,
"loss": 0.0,
"step": 36275
},
{
"epoch": 364.37,
"learning_rate": 9.39240506329114e-07,
"loss": 0.0,
"step": 36300
},
{
"epoch": 364.62,
"learning_rate": 9.329113924050634e-07,
"loss": 0.0,
"step": 36325
},
{
"epoch": 364.87,
"learning_rate": 9.265822784810127e-07,
"loss": 0.0,
"step": 36350
},
{
"epoch": 365.12,
"learning_rate": 9.202531645569621e-07,
"loss": 0.0,
"step": 36375
},
{
"epoch": 365.37,
"learning_rate": 9.139240506329115e-07,
"loss": 0.0,
"step": 36400
},
{
"epoch": 365.62,
"learning_rate": 9.075949367088609e-07,
"loss": 0.0,
"step": 36425
},
{
"epoch": 365.87,
"learning_rate": 9.012658227848102e-07,
"loss": 0.0,
"step": 36450
},
{
"epoch": 366.12,
"learning_rate": 8.949367088607595e-07,
"loss": 0.0,
"step": 36475
},
{
"epoch": 366.37,
"learning_rate": 8.886075949367088e-07,
"loss": 0.0,
"step": 36500
},
{
"epoch": 366.62,
"learning_rate": 8.822784810126584e-07,
"loss": 0.0,
"step": 36525
},
{
"epoch": 366.88,
"learning_rate": 8.759493670886077e-07,
"loss": 0.0,
"step": 36550
},
{
"epoch": 367.13,
"learning_rate": 8.69620253164557e-07,
"loss": 0.0,
"step": 36575
},
{
"epoch": 367.38,
"learning_rate": 8.632911392405063e-07,
"loss": 0.0,
"step": 36600
},
{
"epoch": 367.63,
"learning_rate": 8.569620253164559e-07,
"loss": 0.0,
"step": 36625
},
{
"epoch": 367.88,
"learning_rate": 8.506329113924052e-07,
"loss": 0.0,
"step": 36650
},
{
"epoch": 368.13,
"learning_rate": 8.443037974683545e-07,
"loss": 0.0,
"step": 36675
},
{
"epoch": 368.38,
"learning_rate": 8.379746835443038e-07,
"loss": 0.0,
"step": 36700
},
{
"epoch": 368.63,
"learning_rate": 8.316455696202532e-07,
"loss": 0.0,
"step": 36725
},
{
"epoch": 368.88,
"learning_rate": 8.253164556962026e-07,
"loss": 0.0,
"step": 36750
},
{
"epoch": 369.13,
"learning_rate": 8.189873417721519e-07,
"loss": 0.0,
"step": 36775
},
{
"epoch": 369.39,
"learning_rate": 8.126582278481013e-07,
"loss": 0.0,
"step": 36800
},
{
"epoch": 369.64,
"learning_rate": 8.063291139240507e-07,
"loss": 0.0,
"step": 36825
},
{
"epoch": 369.89,
"learning_rate": 8.000000000000001e-07,
"loss": 0.0,
"step": 36850
},
{
"epoch": 370.14,
"learning_rate": 7.936708860759494e-07,
"loss": 0.0,
"step": 36875
},
{
"epoch": 370.39,
"learning_rate": 7.873417721518987e-07,
"loss": 0.0,
"step": 36900
},
{
"epoch": 370.64,
"learning_rate": 7.810126582278482e-07,
"loss": 0.0,
"step": 36925
},
{
"epoch": 370.89,
"learning_rate": 7.746835443037976e-07,
"loss": 0.0,
"step": 36950
},
{
"epoch": 371.14,
"learning_rate": 7.683544303797469e-07,
"loss": 0.0,
"step": 36975
},
{
"epoch": 371.39,
"learning_rate": 7.620253164556962e-07,
"loss": 0.0,
"step": 37000
},
{
"epoch": 371.39,
"eval_loss": 0.4170127809047699,
"eval_runtime": 2836.3086,
"eval_samples_per_second": 4.492,
"eval_steps_per_second": 0.281,
"eval_wer": 7.720415819915585,
"step": 37000
},
{
"epoch": 371.64,
"learning_rate": 7.556962025316456e-07,
"loss": 0.0,
"step": 37025
},
{
"epoch": 371.89,
"learning_rate": 7.493670886075951e-07,
"loss": 0.0,
"step": 37050
},
{
"epoch": 372.15,
"learning_rate": 7.430379746835444e-07,
"loss": 0.0,
"step": 37075
},
{
"epoch": 372.4,
"learning_rate": 7.367088607594937e-07,
"loss": 0.0,
"step": 37100
},
{
"epoch": 372.65,
"learning_rate": 7.303797468354431e-07,
"loss": 0.0,
"step": 37125
},
{
"epoch": 372.9,
"learning_rate": 7.240506329113925e-07,
"loss": 0.0,
"step": 37150
},
{
"epoch": 373.15,
"learning_rate": 7.177215189873418e-07,
"loss": 0.0,
"step": 37175
},
{
"epoch": 373.4,
"learning_rate": 7.113924050632912e-07,
"loss": 0.0,
"step": 37200
},
{
"epoch": 373.65,
"learning_rate": 7.050632911392406e-07,
"loss": 0.0,
"step": 37225
},
{
"epoch": 373.9,
"learning_rate": 6.9873417721519e-07,
"loss": 0.0,
"step": 37250
},
{
"epoch": 374.15,
"learning_rate": 6.924050632911393e-07,
"loss": 0.0,
"step": 37275
},
{
"epoch": 374.4,
"learning_rate": 6.860759493670886e-07,
"loss": 0.0,
"step": 37300
},
{
"epoch": 374.65,
"learning_rate": 6.797468354430379e-07,
"loss": 0.0,
"step": 37325
},
{
"epoch": 374.91,
"learning_rate": 6.734177215189875e-07,
"loss": 0.0,
"step": 37350
},
{
"epoch": 375.16,
"learning_rate": 6.670886075949368e-07,
"loss": 0.0,
"step": 37375
},
{
"epoch": 375.41,
"learning_rate": 6.607594936708861e-07,
"loss": 0.0,
"step": 37400
},
{
"epoch": 375.66,
"learning_rate": 6.544303797468354e-07,
"loss": 0.0,
"step": 37425
},
{
"epoch": 375.91,
"learning_rate": 6.483544303797469e-07,
"loss": 0.0,
"step": 37450
},
{
"epoch": 376.16,
"learning_rate": 6.420253164556962e-07,
"loss": 0.0,
"step": 37475
},
{
"epoch": 376.41,
"learning_rate": 6.356962025316456e-07,
"loss": 0.0,
"step": 37500
},
{
"epoch": 376.66,
"learning_rate": 6.29367088607595e-07,
"loss": 0.0,
"step": 37525
},
{
"epoch": 376.91,
"learning_rate": 6.230379746835444e-07,
"loss": 0.0,
"step": 37550
},
{
"epoch": 377.16,
"learning_rate": 6.167088607594937e-07,
"loss": 0.0,
"step": 37575
},
{
"epoch": 377.42,
"learning_rate": 6.103797468354431e-07,
"loss": 0.0,
"step": 37600
},
{
"epoch": 377.67,
"learning_rate": 6.040506329113924e-07,
"loss": 0.0,
"step": 37625
},
{
"epoch": 377.92,
"learning_rate": 5.977215189873419e-07,
"loss": 0.0,
"step": 37650
},
{
"epoch": 378.17,
"learning_rate": 5.913924050632912e-07,
"loss": 0.0,
"step": 37675
},
{
"epoch": 378.42,
"learning_rate": 5.850632911392406e-07,
"loss": 0.0,
"step": 37700
},
{
"epoch": 378.67,
"learning_rate": 5.787341772151899e-07,
"loss": 0.0,
"step": 37725
},
{
"epoch": 378.92,
"learning_rate": 5.724050632911393e-07,
"loss": 0.0,
"step": 37750
},
{
"epoch": 379.17,
"learning_rate": 5.660759493670887e-07,
"loss": 0.0,
"step": 37775
},
{
"epoch": 379.42,
"learning_rate": 5.59746835443038e-07,
"loss": 0.0,
"step": 37800
},
{
"epoch": 379.67,
"learning_rate": 5.534177215189873e-07,
"loss": 0.0,
"step": 37825
},
{
"epoch": 379.92,
"learning_rate": 5.470886075949368e-07,
"loss": 0.0,
"step": 37850
},
{
"epoch": 380.18,
"learning_rate": 5.407594936708861e-07,
"loss": 0.0,
"step": 37875
},
{
"epoch": 380.43,
"learning_rate": 5.344303797468354e-07,
"loss": 0.0,
"step": 37900
},
{
"epoch": 380.68,
"learning_rate": 5.281012658227848e-07,
"loss": 0.0,
"step": 37925
},
{
"epoch": 380.93,
"learning_rate": 5.217721518987342e-07,
"loss": 0.0,
"step": 37950
},
{
"epoch": 381.18,
"learning_rate": 5.154430379746836e-07,
"loss": 0.0,
"step": 37975
},
{
"epoch": 381.43,
"learning_rate": 5.091139240506329e-07,
"loss": 0.0,
"step": 38000
},
{
"epoch": 381.43,
"eval_loss": 0.4188634753227234,
"eval_runtime": 2829.9673,
"eval_samples_per_second": 4.503,
"eval_steps_per_second": 0.282,
"eval_wer": 7.725300922307332,
"step": 38000
},
{
"epoch": 381.68,
"learning_rate": 5.027848101265823e-07,
"loss": 0.0,
"step": 38025
},
{
"epoch": 381.93,
"learning_rate": 4.964556962025317e-07,
"loss": 0.0,
"step": 38050
},
{
"epoch": 382.18,
"learning_rate": 4.901265822784811e-07,
"loss": 0.0,
"step": 38075
},
{
"epoch": 382.43,
"learning_rate": 4.837974683544304e-07,
"loss": 0.0,
"step": 38100
},
{
"epoch": 382.69,
"learning_rate": 4.774683544303798e-07,
"loss": 0.0,
"step": 38125
},
{
"epoch": 382.94,
"learning_rate": 4.711392405063291e-07,
"loss": 0.0,
"step": 38150
},
{
"epoch": 383.19,
"learning_rate": 4.6481012658227853e-07,
"loss": 0.0,
"step": 38175
},
{
"epoch": 383.44,
"learning_rate": 4.5848101265822785e-07,
"loss": 0.0,
"step": 38200
},
{
"epoch": 383.69,
"learning_rate": 4.521518987341773e-07,
"loss": 0.0,
"step": 38225
},
{
"epoch": 383.94,
"learning_rate": 4.458227848101266e-07,
"loss": 0.0,
"step": 38250
},
{
"epoch": 384.19,
"learning_rate": 4.39493670886076e-07,
"loss": 0.0,
"step": 38275
},
{
"epoch": 384.44,
"learning_rate": 4.3316455696202535e-07,
"loss": 0.0,
"step": 38300
},
{
"epoch": 384.69,
"learning_rate": 4.268354430379747e-07,
"loss": 0.0,
"step": 38325
},
{
"epoch": 384.94,
"learning_rate": 4.2050632911392405e-07,
"loss": 0.0,
"step": 38350
},
{
"epoch": 385.19,
"learning_rate": 4.141772151898735e-07,
"loss": 0.0,
"step": 38375
},
{
"epoch": 385.45,
"learning_rate": 4.078481012658228e-07,
"loss": 0.0,
"step": 38400
},
{
"epoch": 385.7,
"learning_rate": 4.015189873417722e-07,
"loss": 0.0,
"step": 38425
},
{
"epoch": 385.95,
"learning_rate": 3.9518987341772155e-07,
"loss": 0.0,
"step": 38450
},
{
"epoch": 386.2,
"learning_rate": 3.888607594936709e-07,
"loss": 0.0,
"step": 38475
},
{
"epoch": 386.45,
"learning_rate": 3.825316455696203e-07,
"loss": 0.0,
"step": 38500
},
{
"epoch": 386.7,
"learning_rate": 3.7620253164556967e-07,
"loss": 0.0,
"step": 38525
},
{
"epoch": 386.95,
"learning_rate": 3.69873417721519e-07,
"loss": 0.0,
"step": 38550
},
{
"epoch": 387.2,
"learning_rate": 3.635443037974684e-07,
"loss": 0.0,
"step": 38575
},
{
"epoch": 387.45,
"learning_rate": 3.5721518987341774e-07,
"loss": 0.0,
"step": 38600
},
{
"epoch": 387.7,
"learning_rate": 3.5088607594936717e-07,
"loss": 0.0,
"step": 38625
},
{
"epoch": 387.95,
"learning_rate": 3.445569620253165e-07,
"loss": 0.0,
"step": 38650
},
{
"epoch": 388.21,
"learning_rate": 3.3822784810126587e-07,
"loss": 0.0,
"step": 38675
},
{
"epoch": 388.46,
"learning_rate": 3.318987341772152e-07,
"loss": 0.0,
"step": 38700
},
{
"epoch": 388.71,
"learning_rate": 3.255696202531646e-07,
"loss": 0.0,
"step": 38725
},
{
"epoch": 388.96,
"learning_rate": 3.1924050632911394e-07,
"loss": 0.0,
"step": 38750
},
{
"epoch": 389.21,
"learning_rate": 3.1291139240506326e-07,
"loss": 0.0,
"step": 38775
},
{
"epoch": 389.46,
"learning_rate": 3.065822784810127e-07,
"loss": 0.0,
"step": 38800
},
{
"epoch": 389.71,
"learning_rate": 3.0025316455696206e-07,
"loss": 0.0,
"step": 38825
},
{
"epoch": 389.96,
"learning_rate": 2.9392405063291144e-07,
"loss": 0.0,
"step": 38850
},
{
"epoch": 390.21,
"learning_rate": 2.875949367088608e-07,
"loss": 0.0,
"step": 38875
},
{
"epoch": 390.46,
"learning_rate": 2.8126582278481013e-07,
"loss": 0.0,
"step": 38900
},
{
"epoch": 390.72,
"learning_rate": 2.749367088607595e-07,
"loss": 0.0,
"step": 38925
},
{
"epoch": 390.97,
"learning_rate": 2.686075949367089e-07,
"loss": 0.0,
"step": 38950
},
{
"epoch": 391.22,
"learning_rate": 2.6227848101265826e-07,
"loss": 0.0,
"step": 38975
},
{
"epoch": 391.47,
"learning_rate": 2.5594936708860763e-07,
"loss": 0.0,
"step": 39000
},
{
"epoch": 391.47,
"eval_loss": 0.4201821982860565,
"eval_runtime": 2852.7738,
"eval_samples_per_second": 4.467,
"eval_steps_per_second": 0.279,
"eval_wer": 7.726277942785681,
"step": 39000
},
{
"epoch": 391.72,
"learning_rate": 2.49620253164557e-07,
"loss": 0.0,
"step": 39025
},
{
"epoch": 391.97,
"learning_rate": 2.432911392405064e-07,
"loss": 0.0,
"step": 39050
},
{
"epoch": 392.22,
"learning_rate": 2.3696202531645573e-07,
"loss": 0.0,
"step": 39075
},
{
"epoch": 392.47,
"learning_rate": 2.306329113924051e-07,
"loss": 0.0,
"step": 39100
},
{
"epoch": 392.72,
"learning_rate": 2.2430379746835445e-07,
"loss": 0.0,
"step": 39125
},
{
"epoch": 392.97,
"learning_rate": 2.1797468354430383e-07,
"loss": 0.0,
"step": 39150
},
{
"epoch": 393.22,
"learning_rate": 2.116455696202532e-07,
"loss": 0.0,
"step": 39175
},
{
"epoch": 393.48,
"learning_rate": 2.0531645569620258e-07,
"loss": 0.0,
"step": 39200
},
{
"epoch": 393.73,
"learning_rate": 1.989873417721519e-07,
"loss": 0.0,
"step": 39225
},
{
"epoch": 393.98,
"learning_rate": 1.9265822784810127e-07,
"loss": 0.0,
"step": 39250
},
{
"epoch": 394.23,
"learning_rate": 1.8632911392405062e-07,
"loss": 0.0,
"step": 39275
},
{
"epoch": 394.48,
"learning_rate": 1.8e-07,
"loss": 0.0,
"step": 39300
},
{
"epoch": 394.73,
"learning_rate": 1.7367088607594937e-07,
"loss": 0.0,
"step": 39325
},
{
"epoch": 394.98,
"learning_rate": 1.6734177215189875e-07,
"loss": 0.0,
"step": 39350
},
{
"epoch": 395.23,
"learning_rate": 1.610126582278481e-07,
"loss": 0.0,
"step": 39375
},
{
"epoch": 395.48,
"learning_rate": 1.546835443037975e-07,
"loss": 0.0,
"step": 39400
},
{
"epoch": 395.73,
"learning_rate": 1.4835443037974684e-07,
"loss": 0.0,
"step": 39425
},
{
"epoch": 395.98,
"learning_rate": 1.4202531645569622e-07,
"loss": 0.0,
"step": 39450
},
{
"epoch": 396.24,
"learning_rate": 1.3569620253164557e-07,
"loss": 0.0,
"step": 39475
},
{
"epoch": 396.49,
"learning_rate": 1.2936708860759494e-07,
"loss": 0.0,
"step": 39500
},
{
"epoch": 396.74,
"learning_rate": 1.2329113924050634e-07,
"loss": 0.0,
"step": 39525
},
{
"epoch": 396.99,
"learning_rate": 1.169620253164557e-07,
"loss": 0.0,
"step": 39550
},
{
"epoch": 397.24,
"learning_rate": 1.1063291139240506e-07,
"loss": 0.0,
"step": 39575
},
{
"epoch": 397.49,
"learning_rate": 1.0430379746835444e-07,
"loss": 0.0,
"step": 39600
},
{
"epoch": 397.74,
"learning_rate": 9.79746835443038e-08,
"loss": 0.0,
"step": 39625
},
{
"epoch": 397.99,
"learning_rate": 9.164556962025317e-08,
"loss": 0.0,
"step": 39650
},
{
"epoch": 398.24,
"learning_rate": 8.531645569620254e-08,
"loss": 0.0,
"step": 39675
},
{
"epoch": 398.49,
"learning_rate": 7.898734177215191e-08,
"loss": 0.0,
"step": 39700
},
{
"epoch": 398.75,
"learning_rate": 7.265822784810127e-08,
"loss": 0.0,
"step": 39725
},
{
"epoch": 399.0,
"learning_rate": 6.632911392405063e-08,
"loss": 0.0,
"step": 39750
},
{
"epoch": 399.25,
"learning_rate": 6.000000000000001e-08,
"loss": 0.0,
"step": 39775
},
{
"epoch": 399.5,
"learning_rate": 5.3670886075949376e-08,
"loss": 0.0,
"step": 39800
},
{
"epoch": 399.75,
"learning_rate": 4.7341772151898744e-08,
"loss": 0.0,
"step": 39825
},
{
"epoch": 400.0,
"learning_rate": 4.1012658227848106e-08,
"loss": 0.0,
"step": 39850
},
{
"epoch": 400.25,
"learning_rate": 3.4683544303797474e-08,
"loss": 0.0,
"step": 39875
},
{
"epoch": 400.5,
"learning_rate": 2.835443037974684e-08,
"loss": 0.0,
"step": 39900
},
{
"epoch": 400.75,
"learning_rate": 2.2025316455696203e-08,
"loss": 0.0,
"step": 39925
},
{
"epoch": 401.0,
"learning_rate": 1.569620253164557e-08,
"loss": 0.0,
"step": 39950
},
{
"epoch": 401.25,
"learning_rate": 9.367088607594938e-09,
"loss": 0.0,
"step": 39975
},
{
"epoch": 401.51,
"learning_rate": 3.037974683544304e-09,
"loss": 0.0,
"step": 40000
},
{
"epoch": 401.51,
"eval_loss": 0.42060527205467224,
"eval_runtime": 2833.1072,
"eval_samples_per_second": 4.498,
"eval_steps_per_second": 0.281,
"eval_wer": 7.720415819915585,
"step": 40000
},
{
"epoch": 401.51,
"step": 40000,
"total_flos": 2.172424342140513e+22,
"train_loss": 0.004165954868968765,
"train_runtime": 1001494.6755,
"train_samples_per_second": 10.225,
"train_steps_per_second": 0.04
}
],
"logging_steps": 25,
"max_steps": 40000,
"num_input_tokens_seen": 0,
"num_train_epochs": 405,
"save_steps": 1000,
"total_flos": 2.172424342140513e+22,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}