End of training
Browse files- all_results.json +6 -6
- eval_results.json +3 -3
- runs/Aug11_06-50-36_dsai-server/events.out.tfevents.1691720181.dsai-server +3 -0
- train_results.json +3 -3
- trainer_state.json +18 -18
all_results.json
CHANGED
@@ -1,12 +1,12 @@
|
|
1 |
{
|
2 |
"epoch": 4.84,
|
3 |
"eval_loss": 0.42781996726989746,
|
4 |
-
"eval_runtime":
|
5 |
-
"eval_samples_per_second": 5.
|
6 |
-
"eval_steps_per_second": 1.
|
7 |
"eval_wer": 17.437313089487002,
|
8 |
"train_loss": 0.2648608121991158,
|
9 |
-
"train_runtime":
|
10 |
-
"train_samples_per_second": 4.
|
11 |
-
"train_steps_per_second": 0.
|
12 |
}
|
|
|
1 |
{
|
2 |
"epoch": 4.84,
|
3 |
"eval_loss": 0.42781996726989746,
|
4 |
+
"eval_runtime": 617.6877,
|
5 |
+
"eval_samples_per_second": 5.864,
|
6 |
+
"eval_steps_per_second": 1.467,
|
7 |
"eval_wer": 17.437313089487002,
|
8 |
"train_loss": 0.2648608121991158,
|
9 |
+
"train_runtime": 8065.0347,
|
10 |
+
"train_samples_per_second": 4.96,
|
11 |
+
"train_steps_per_second": 0.62
|
12 |
}
|
eval_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"epoch": 4.84,
|
3 |
"eval_loss": 0.42781996726989746,
|
4 |
-
"eval_runtime":
|
5 |
-
"eval_samples_per_second": 5.
|
6 |
-
"eval_steps_per_second": 1.
|
7 |
"eval_wer": 17.437313089487002
|
8 |
}
|
|
|
1 |
{
|
2 |
"epoch": 4.84,
|
3 |
"eval_loss": 0.42781996726989746,
|
4 |
+
"eval_runtime": 617.6877,
|
5 |
+
"eval_samples_per_second": 5.864,
|
6 |
+
"eval_steps_per_second": 1.467,
|
7 |
"eval_wer": 17.437313089487002
|
8 |
}
|
runs/Aug11_06-50-36_dsai-server/events.out.tfevents.1691720181.dsai-server
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b833ddab66184857775d2478b3a52b02da9f0f6020bc81c2fb2469716a9d2a1
|
3 |
+
size 40
|
train_results.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"epoch": 4.84,
|
3 |
"train_loss": 0.2648608121991158,
|
4 |
-
"train_runtime":
|
5 |
-
"train_samples_per_second": 4.
|
6 |
-
"train_steps_per_second": 0.
|
7 |
}
|
|
|
1 |
{
|
2 |
"epoch": 4.84,
|
3 |
"train_loss": 0.2648608121991158,
|
4 |
+
"train_runtime": 8065.0347,
|
5 |
+
"train_samples_per_second": 4.96,
|
6 |
+
"train_steps_per_second": 0.62
|
7 |
}
|
trainer_state.json
CHANGED
@@ -250,9 +250,9 @@
|
|
250 |
{
|
251 |
"epoch": 0.97,
|
252 |
"eval_loss": 0.6284407377243042,
|
253 |
-
"eval_runtime":
|
254 |
-
"eval_samples_per_second": 5.
|
255 |
-
"eval_steps_per_second": 1.
|
256 |
"eval_wer": 31.727628249367378,
|
257 |
"step": 1000
|
258 |
},
|
@@ -499,9 +499,9 @@
|
|
499 |
{
|
500 |
"epoch": 1.94,
|
501 |
"eval_loss": 0.5209963321685791,
|
502 |
-
"eval_runtime":
|
503 |
-
"eval_samples_per_second": 5.
|
504 |
-
"eval_steps_per_second": 1.
|
505 |
"eval_wer": 25.43823326432022,
|
506 |
"step": 2000
|
507 |
},
|
@@ -748,9 +748,9 @@
|
|
748 |
{
|
749 |
"epoch": 2.9,
|
750 |
"eval_loss": 0.4795286953449249,
|
751 |
-
"eval_runtime":
|
752 |
-
"eval_samples_per_second": 5.
|
753 |
-
"eval_steps_per_second": 1.
|
754 |
"eval_wer": 22.921555095468136,
|
755 |
"step": 3000
|
756 |
},
|
@@ -997,9 +997,9 @@
|
|
997 |
{
|
998 |
"epoch": 3.87,
|
999 |
"eval_loss": 0.45125144720077515,
|
1000 |
-
"eval_runtime":
|
1001 |
-
"eval_samples_per_second": 5.
|
1002 |
-
"eval_steps_per_second": 1.
|
1003 |
"eval_wer": 19.871175523349436,
|
1004 |
"step": 4000
|
1005 |
},
|
@@ -1246,9 +1246,9 @@
|
|
1246 |
{
|
1247 |
"epoch": 4.84,
|
1248 |
"eval_loss": 0.42781996726989746,
|
1249 |
-
"eval_runtime":
|
1250 |
-
"eval_samples_per_second": 5.
|
1251 |
-
"eval_steps_per_second": 1.
|
1252 |
"eval_wer": 17.437313089487002,
|
1253 |
"step": 5000
|
1254 |
},
|
@@ -1257,9 +1257,9 @@
|
|
1257 |
"step": 5000,
|
1258 |
"total_flos": 1.153995298799616e+19,
|
1259 |
"train_loss": 0.2648608121991158,
|
1260 |
-
"train_runtime":
|
1261 |
-
"train_samples_per_second": 4.
|
1262 |
-
"train_steps_per_second": 0.
|
1263 |
}
|
1264 |
],
|
1265 |
"max_steps": 5000,
|
|
|
250 |
{
|
251 |
"epoch": 0.97,
|
252 |
"eval_loss": 0.6284407377243042,
|
253 |
+
"eval_runtime": 637.2881,
|
254 |
+
"eval_samples_per_second": 5.683,
|
255 |
+
"eval_steps_per_second": 1.422,
|
256 |
"eval_wer": 31.727628249367378,
|
257 |
"step": 1000
|
258 |
},
|
|
|
499 |
{
|
500 |
"epoch": 1.94,
|
501 |
"eval_loss": 0.5209963321685791,
|
502 |
+
"eval_runtime": 640.3753,
|
503 |
+
"eval_samples_per_second": 5.656,
|
504 |
+
"eval_steps_per_second": 1.415,
|
505 |
"eval_wer": 25.43823326432022,
|
506 |
"step": 2000
|
507 |
},
|
|
|
748 |
{
|
749 |
"epoch": 2.9,
|
750 |
"eval_loss": 0.4795286953449249,
|
751 |
+
"eval_runtime": 628.7529,
|
752 |
+
"eval_samples_per_second": 5.761,
|
753 |
+
"eval_steps_per_second": 1.441,
|
754 |
"eval_wer": 22.921555095468136,
|
755 |
"step": 3000
|
756 |
},
|
|
|
997 |
{
|
998 |
"epoch": 3.87,
|
999 |
"eval_loss": 0.45125144720077515,
|
1000 |
+
"eval_runtime": 625.0491,
|
1001 |
+
"eval_samples_per_second": 5.795,
|
1002 |
+
"eval_steps_per_second": 1.449,
|
1003 |
"eval_wer": 19.871175523349436,
|
1004 |
"step": 4000
|
1005 |
},
|
|
|
1246 |
{
|
1247 |
"epoch": 4.84,
|
1248 |
"eval_loss": 0.42781996726989746,
|
1249 |
+
"eval_runtime": 622.9975,
|
1250 |
+
"eval_samples_per_second": 5.814,
|
1251 |
+
"eval_steps_per_second": 1.454,
|
1252 |
"eval_wer": 17.437313089487002,
|
1253 |
"step": 5000
|
1254 |
},
|
|
|
1257 |
"step": 5000,
|
1258 |
"total_flos": 1.153995298799616e+19,
|
1259 |
"train_loss": 0.2648608121991158,
|
1260 |
+
"train_runtime": 8065.0347,
|
1261 |
+
"train_samples_per_second": 4.96,
|
1262 |
+
"train_steps_per_second": 0.62
|
1263 |
}
|
1264 |
],
|
1265 |
"max_steps": 5000,
|